Concurrent requests

nshiab · nshiab · commit c23cc4449725 · 2025-05-01T20:06:23.000-04:00
diff --git a/src/class/SimpleTable.ts b/src/class/SimpleTable.ts
@@ -520,18 +520,20 @@ export default class SimpleTable extends Simple {
    *
    * This method currently supports Google Gemini and Vertex AI. It retrieves credentials and the model from environment variables (`AI_KEY`, `AI_PROJECT`, `AI_LOCATION`, `AI_MODEL`) or accepts them as options. Options take precedence over environment variables.
    *
-   * This method can be slow for large tables. To avoid exceeding rate limits, you can process multiple rows at once with the `batchSize` option. You can also use the `rateLimitPerMinute` option to automatically add a delay between requests to comply with the rate limit.
+   * To avoid exceeding rate limits, you can process multiple rows at once with the `batchSize` option. You can also use the `rateLimitPerMinute` option to automatically add a delay between requests to comply with the rate limit.
+   *
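+   * On the other hand, if you have a business or professional account with high rate limits, you can set the `concurrent` option to process multiple requests concurrently and speed up the process. If `rateLimitPerMinute` is also set, the method waits between groups of concurrent requests to stay within the limit.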
    *
    * The `cache` option allows you to cache locally the results of each request, saving resources and time. The data is cached in the local hidden folder `.journalism` (because this method uses the `askAI` function from the [journalism library](https://github.com/nshiab/journalism)). So don't forget to add `.journalism` to your `.gitignore` file!
    *
-   * Sometimes, the AI returns less items than the batch size, which throws an error. If you want to automatically retry the request, you can use the `retry` option. The method will retry the request up to the specified number of times.
+   * Sometimes, the AI returns fewer items than the batch size, which throws an error. If you want to automatically retry the request, you can use the `retry` option. The method will retry the request up to the specified number of times.
    *
    * The temperature is set to 0 to ensure reproducible results. However, consistent results cannot be guaranteed.
    *
    * This method won't work if you have geometries in your table.
    *
    * @example
-   * Basic usage with cache, batchSize and retry options
+   * Basic usage with cache, batchSize and rate limit
    * ```ts
    * // New table with column "city".
    * await table.loadArray([
@@ -547,7 +549,7 @@ export default class SimpleTable extends Simple {
    *   "country",
    *   `Give me the country of the city.`,
    *   // Don't forget to add .journalism to your .gitignore file!
-   *   { cache: true, batchSize: 10, retry: 3, verbose: true },
+   *   { cache: true, batchSize: 10, rateLimitPerMinute: 15, verbose: true },
    * );
    *
    * // Result:
@@ -563,6 +565,7 @@ export default class SimpleTable extends Simple {
    * @param prompt - The input string to guide the AI's response.
    * @param options - Configuration options for the AI request.
    *   @param options.batchSize - The number of rows to process in each batch. By default, it is 1.
+   *   @param options.concurrent - The number of concurrent requests to send. By default, it is 1.
    *   @param options.cache - If true, the results will be cached locally. By default, it is false.
    *   @param options.retry - The number of times to retry the request in case of failure. By default, it is 0.
    *   @param options.rateLimitPerMinute - The rate limit for the AI requests in requests per minute. If necessary, the method will wait between requests. By default, there is no limit.
@@ -579,6 +582,7 @@ export default class SimpleTable extends Simple {
     prompt: string,
     options: {
       batchSize?: number;
+      concurrent?: number;
       cache?: boolean;
       retry?: number;
       model?: string;
diff --git a/src/helpers/tryAI.ts b/src/helpers/tryAI.ts
@@ -0,0 +1,102 @@
+import { formatNumber } from "@nshiab/journalism";
+import { askAI } from "@nshiab/journalism";
+
+/**
+ * Sends one batch of `column` values to the AI and stores the answers in
+ * `newColumn` of the same rows. The `test` passed to `askAI` throws unless the
+ * answer is an array with one item per row; the last error is rethrown once
+ * the attempts are exhausted.
+ *
+ * @param i - Index in `rows` of the first row of the batch.
+ * @param batchSize - Maximum number of rows in the batch.
+ * @param rows - All the rows. The rows of the batch are mutated in place.
+ * @param column - Column whose values are sent to the AI.
+ * @param newColumn - Column that receives the values returned by the AI.
+ * @param prompt - Instructions placed before the list of values.
+ * @param options - Spread into the `askAI` options; `verbose` and `retry` (total attempts, minimum 1) are also read here.
+ */
+export default async function tryAI(
+  i: number,
+  batchSize: number,
+  rows: {
+    [key: string]: string | number | boolean | Date | null;
+  }[],
+  column: string,
+  newColumn: string,
+  prompt: string,
+  options: {
+    batchSize?: number;
+    concurrent?: number;
+    cache?: boolean;
+    retry?: number;
+    model?: string;
+    apiKey?: string;
+    vertex?: boolean;
+    project?: string;
+    location?: string;
+    verbose?: boolean;
+    rateLimitPerMinute?: number;
+  } = {},
+) {
+  const batch = rows.slice(i, i + batchSize);
+  const fullPrompt = `${prompt}\nHere are the ${column} values as a list: ${
+    JSON.stringify(batch.map((d) => d[column]))
+  }\nReturn the results in a list as well. It's critical you return the same number of items, which is ${batch.length}, exactly in the same order.`;
+
+  if (options.verbose) {
+    const done = Math.min(i + batchSize, rows.length);
+    const percent = formatNumber(done / rows.length * 100, {
+      significantDigits: 3,
+      suffix: "%",
+    });
+    console.log(`\n${done}/${rows.length} | ${percent}`);
+    console.log("\nPrompt:");
+    console.log(fullPrompt);
+  }
+
+  // Always make at least one attempt: `retry: 0` used to skip the request.
+  const retry = Math.max(options.retry ?? 1, 1);
+  let testPassed = false;
+  let iterations = 1;
+  let newValues: (string | number | boolean | Date | null)[] = [];
+  while (!testPassed && iterations <= retry) {
+    try {
+      // Types could be improved
+      newValues = await askAI(fullPrompt, {
+        ...options,
+        returnJson: true,
+        test: (response: unknown) => {
+          if (!Array.isArray(response)) {
+            const received = JSON.stringify(response);
+            throw new Error(`The AI returned a non-array value: ${received}`);
+          }
+          if (response.length !== batch.length) {
+            throw new Error(
+              `The AI returned ${response.length} values, but the batch size is ${batch.length}.`,
+            );
+          }
+        },
+      }) as (string | number | boolean | Date | null)[];
+      testPassed = true;
+    } catch (e: unknown) {
+      if (iterations < retry) {
+        console.log(
+          `Error: the AI didn't return the expected number of items.\nRetrying... (${iterations}/${retry})`,
+        );
+        iterations++;
+      } else {
+        console.log(
+          `Error: the AI didn't return the expected number of items.\nNo more retries left. (${iterations}/${retry}).`,
+        );
+        throw e;
+      }
+    }
+  }
+  if (options.verbose) {
+    console.log("\nResponse:", newValues);
+  }
+
+  for (let j = 0; j < newValues.length; j++) {
+    rows[i + j][newColumn] = newValues[j];
+  }
+}
diff --git a/src/methods/aiRowByRow.ts b/src/methods/aiRowByRow.ts
@@ -1,5 +1,6 @@
-import { askAI, formatNumber, prettyDuration, sleep } from "@nshiab/journalism";
+import { prettyDuration, sleep } from "@nshiab/journalism";
 import type { SimpleTable } from "../index.ts";
+import tryAI from "../helpers/tryAI.ts";
 
 export default async function aiRowByRow(
   simpleTable: SimpleTable,
@@ -8,6 +9,7 @@ export default async function aiRowByRow(
   prompt: string,
   options: {
     batchSize?: number;
+    concurrent?: number;
     cache?: boolean;
     retry?: number;
     model?: string;
@@ -25,99 +27,82 @@ export default async function aiRowByRow(
     }
 
     const batchSize = options.batchSize ?? 1;
+    const concurrent = options.concurrent ?? 1;
 
+    let requests = [];
     for (let i = 0; i < rows.length; i += batchSize) {
-      options.verbose &&
-        console.log(
-          `\n${Math.min(i + batchSize, rows.length)}/${rows.length} | ${
-            formatNumber(
-              (Math.min(i + batchSize, rows.length)) / rows.length * 100,
-              {
-                significantDigits: 3,
-                suffix: "%",
-              },
-            )
-          }`,
+      if (concurrent === 1) {
+        const start = new Date();
+        await tryAI(
+          i,
+          batchSize,
+          rows,
+          column,
+          newColumn,
+          prompt,
+          options,
         );
-      const batch = rows.slice(i, i + batchSize);
-      const fullPrompt = `${prompt}\nHere are the ${column} values as a list: ${
-        JSON.stringify(batch.map((d) => d[column]))
-      }\nReturn the results in a list as well. It's critical you return the same number of items, which is ${batch.length}, exactly in the same order.`;
+        const end = new Date();
 
-      if (options.verbose) {
-        console.log("\nPrompt:");
-        console.log(fullPrompt);
-      }
-
-      const start = new Date();
-
-      const retry = options.retry ?? 1;
-      let testPassed = false;
-      let iterations = 1;
-      let newValues: (string | number | boolean | Date | null)[] = [];
-      while (!testPassed && iterations <= retry) {
-        try {
-          // Types could be improved
-          newValues = await askAI(
-            fullPrompt,
-            {
-              ...options,
-              returnJson: true,
-              test: (response: unknown) => {
-                if (!Array.isArray(response)) {
-                  throw new Error(
-                    `The AI returned a non-array value: ${
-                      JSON.stringify(response)
-                    }`,
-                  );
-                }
-                if (response.length !== batch.length) {
-                  throw new Error(
-                    `The AI returned ${response.length} values, but the batch size is ${batchSize}.`,
-                  );
-                }
-              },
-            },
-          ) as (string | number | boolean | Date | null)[];
-
-          testPassed = true;
-        } catch (e: unknown) {
-          if (iterations < retry) {
-            console.log(
-              `Error: the AI didn't return the expected number of items.\nRetrying... (${iterations}/${retry})`,
-            );
-            iterations++;
-          } else {
-            console.log(
-              `Error: the AI didn't return the expected number of items.\nNo more retries left. (${iterations}/${retry}).`,
-            );
-            throw e;
+        const duration = end.getTime() - start.getTime();
+        // If duration is less than 50ms, it means data comes from cache and we don't need to wait
+        if (
+          typeof options.rateLimitPerMinute === "number" && duration > 50
+        ) {
+          const delay = Math.round((60 / options.rateLimitPerMinute) * 1000) -
+            duration;
+          if (delay > 0) {
+            if (options.verbose) {
+              console.log(
+                `Waiting ${
+                  prettyDuration(0, { end: delay })
+                } to respect rate limit...`,
+              );
+            }
+            await sleep(delay);
           }
         }
-      }
-
-      const end = new Date();
-
-      if (options.verbose) {
-        console.log("\nResponse:", newValues);
-      }
+      } else if (concurrent) {
+        if (requests.length < concurrent) {
+          requests.push(
+            tryAI(
+              i,
+              batchSize,
+              rows,
+              column,
+              newColumn,
+              prompt,
+              options,
+            ),
+          );
+        }
+        if (requests.length === concurrent || i + batchSize >= rows.length) {
+          const start = new Date();
+          await Promise.all(requests);
+          const end = new Date();
 
-      for (let j = 0; j < newValues.length; j++) {
-        rows[i + j][newColumn] = newValues[j];
-      }
+          requests = [];
 
-      if (typeof options.rateLimitPerMinute === "number") {
-        const delay = Math.round((60 / options.rateLimitPerMinute) * 1000) -
-          (end.getTime() - start.getTime());
-        if (delay > 0) {
-          if (options.verbose) {
-            console.log(
-              `Waiting ${
-                prettyDuration(0, { end: delay })
-              } to respect rate limit...`,
-            );
+          const duration = end.getTime() - start.getTime();
+          // If duration is less than 50ms, it means data comes from cache and we don't need to wait
+          if (
+            typeof options.rateLimitPerMinute === "number" && duration > 50
+          ) {
+            const delay = Math.round(
+              (60 / (options.rateLimitPerMinute / concurrent)) * 1000,
+            ) -
+              (end.getTime() - start.getTime());
+            if (delay > 0) {
+              if (options.verbose) {
+                console.log(
+                  `Waiting ${
+                    prettyDuration(0, { end: delay })
+                  } to respect rate limit...`,
+                );
+              }
+              await sleep(delay);
+            }
           }
-          await sleep(delay);
         }
       }
     }
diff --git a/test/unit/methods/aiRowByRow.test.ts b/test/unit/methods/aiRowByRow.test.ts