Ollama sequential embedding (#2230)

* ollama: Switch from parallel to sequential chunk embedding

* throw error on empty embeddings

---------

Co-authored-by: John Blomberg <john.jb.blomberg@gmail.com>
Authored by Timothy Carambat on 2024-09-06 10:06:46 -07:00; committed by GitHub.
parent fef01550df
commit 20135835d0
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -36,67 +36,48 @@ class OllamaEmbedder {
return result?.[0] || []; return result?.[0] || [];
} }
/**
* This function takes an array of text chunks and embeds them using the Ollama API.
* chunks are processed sequentially to avoid overwhelming the API with too many requests
* or running out of resources on the endpoint running the ollama instance.
* @param {string[]} textChunks - An array of text chunks to embed.
* @returns {Promise<Array<number[]>>} - A promise that resolves to an array of embeddings.
*/
async embedChunks(textChunks = []) { async embedChunks(textChunks = []) {
if (!(await this.#isAlive())) if (!(await this.#isAlive()))
throw new Error( throw new Error(
`Ollama service could not be reached. Is Ollama running?` `Ollama service could not be reached. Is Ollama running?`
); );
const embeddingRequests = [];
this.log( this.log(
`Embedding ${textChunks.length} chunks of text with ${this.model}.` `Embedding ${textChunks.length} chunks of text with ${this.model}.`
); );
let data = [];
let error = null;
for (const chunk of textChunks) { for (const chunk of textChunks) {
embeddingRequests.push( try {
new Promise((resolve) => { const res = await fetch(this.basePath, {
fetch(this.basePath, { method: "POST",
method: "POST", body: JSON.stringify({
body: JSON.stringify({ model: this.model,
model: this.model, prompt: chunk,
prompt: chunk, }),
}), });
})
.then((res) => res.json())
.then(({ embedding }) => {
resolve({ data: embedding, error: null });
return;
})
.catch((error) => {
resolve({ data: [], error: error.message });
return;
});
})
);
}
const { data = [], error = null } = await Promise.all( const { embedding } = await res.json();
embeddingRequests if (!Array.isArray(embedding) || embedding.length === 0)
).then((results) => { throw new Error("Ollama returned an empty embedding for chunk!");
// If any errors were returned from Ollama abort the entire sequence because the embeddings
// will be incomplete.
const errors = results data.push(embedding);
.filter((res) => !!res.error) } catch (err) {
.map((res) => res.error) this.log(err.message);
.flat(); error = err.message;
if (errors.length > 0) { data = [];
let uniqueErrors = new Set(); break;
errors.map((error) =>
uniqueErrors.add(`[${error.type}]: ${error.message}`)
);
return {
data: [],
error: Array.from(uniqueErrors).join(", "),
};
} }
}
return {
data: results.map((res) => res?.data || []),
error: null,
};
});
if (!!error) throw new Error(`Ollama Failed to embed: ${error}`); if (!!error) throw new Error(`Ollama Failed to embed: ${error}`);
return data.length > 0 ? data : null; return data.length > 0 ? data : null;