anything-llm/server/utils/EmbeddingEngines/native/index.js

const path = require("path");
const fs = require("fs");
const { toChunks } = require("../../helpers");

class NativeEmbedder {
  constructor() {
    // Model Card: https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2
    this.model = "Xenova/all-MiniLM-L6-v2";
    this.cacheDir = path.resolve(
      process.env.STORAGE_DIR
        ? path.resolve(process.env.STORAGE_DIR, `models`)
        : path.resolve(__dirname, `../../../storage/models`)
    );
    this.modelPath = path.resolve(this.cacheDir, "Xenova", "all-MiniLM-L6-v2");

    // Limit of how many strings we can process in a single pass to stay with resource or network limits
    this.embeddingMaxChunkLength = 50;

    // Make directory when it does not exist in existing installations
    if (!fs.existsSync(this.cacheDir)) fs.mkdirSync(this.cacheDir);
  }

  async embedderClient() {
    if (!fs.existsSync(this.modelPath)) {
      console.log(
        "\x1b[34m[INFO]\x1b[0m The native embedding model has never been run and will be downloaded right now. Subsequent runs will be faster. (~23MB)\n\n"
      );
    }

    try {
      // Convert ESM to CommonJS via import so we can load this library.
      const pipeline = (...args) =>
        import("@xenova/transformers").then(({ pipeline }) =>
          pipeline(...args)
        );
      return await pipeline("feature-extraction", this.model, {
        cache_dir: this.cacheDir,
        ...(!fs.existsSync(this.modelPath)
          ? {
              // Show download progress if we need to download any files
              progress_callback: (data) => {
                if (!data.hasOwnProperty("progress")) return;
                console.log(
                  `\x1b[34m[Embedding - Downloading Model Files]\x1b[0m ${
                    data.file
                  } ${~~data?.progress}%`
                );
              },
            }
          : {}),
      });
    } catch (error) {
      console.error("Failed to load the native embedding model:", error);
      throw error;
    }
  }

  async embedTextInput(textInput) {
    const result = await this.embedChunks(textInput);
    return result?.[0] || [];
  }

  async embedChunks(textChunks = []) {
    const Embedder = await this.embedderClient();
    const embeddingResults = [];
    for (const chunk of toChunks(textChunks, this.embeddingMaxChunkLength)) {
      const output = await Embedder(chunk, {
        pooling: "mean",
        normalize: true,
      });
      if (output.length === 0) continue;
      embeddingResults.push(output.tolist());
    }

    return embeddingResults.length > 0 ? embeddingResults.flat() : null;
  }
}

module.exports = {
  NativeEmbedder,
};
Add built-in embedding engine into AnythingLLM (#411) * Implement use of native embedder (all-Mini-L6-v2) stop showing prisma queries during dev * Add native embedder as an available embedder selection * wrap model loader in try/catch * print progress on download * Update to progress output for embedder * move embedder selection options to component * forgot import * add Data privacy alert updates for local embedder 2023-12-06 19:36:22 +01:00			`const path = require("path");`
			`const fs = require("fs");`
			`const { toChunks } = require("../../helpers");`

			`class NativeEmbedder {`
			`constructor() {`
feat: add support for variable chunk length (#415) fix: cleanup code for embedding length clarify resolves #388 2023-12-08 01:27:36 +01:00			`// Model Card: https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2`
Add built-in embedding engine into AnythingLLM (#411) * Implement use of native embedder (all-Mini-L6-v2) stop showing prisma queries during dev * Add native embedder as an available embedder selection * wrap model loader in try/catch * print progress on download * Update to progress output for embedder * move embedder selection options to component * forgot import * add Data privacy alert updates for local embedder 2023-12-06 19:36:22 +01:00			`this.model = "Xenova/all-MiniLM-L6-v2";`
			`this.cacheDir = path.resolve(`
			`process.env.STORAGE_DIR`
			? path.resolve(process.env.STORAGE_DIR, `models`)
			: path.resolve(__dirname, `../../../storage/models`)
			`);`
			`this.modelPath = path.resolve(this.cacheDir, "Xenova", "all-MiniLM-L6-v2");`

fix: set lower maxChunk limit on native embedder to stay within resource constraints chore: update comment for what embedding chunk means 2023-12-20 01:20:34 +01:00			`// Limit of how many strings we can process in a single pass to stay with resource or network limits`
			`this.embeddingMaxChunkLength = 50;`
Add built-in embedding engine into AnythingLLM (#411) * Implement use of native embedder (all-Mini-L6-v2) stop showing prisma queries during dev * Add native embedder as an available embedder selection * wrap model loader in try/catch * print progress on download * Update to progress output for embedder * move embedder selection options to component * forgot import * add Data privacy alert updates for local embedder 2023-12-06 19:36:22 +01:00
			`// Make directory when it does not exist in existing installations`
			`if (!fs.existsSync(this.cacheDir)) fs.mkdirSync(this.cacheDir);`
			`}`

			`async embedderClient() {`
			`if (!fs.existsSync(this.modelPath)) {`
			`console.log(`
			`"\x1b[34m[INFO]\x1b[0m The native embedding model has never been run and will be downloaded right now. Subsequent runs will be faster. (~23MB)\n\n"`
			`);`
			`}`

			`try {`
			`// Convert ESM to CommonJS via import so we can load this library.`
			`const pipeline = (...args) =>`
			`import("@xenova/transformers").then(({ pipeline }) =>`
			`pipeline(...args)`
			`);`
			`return await pipeline("feature-extraction", this.model, {`
			`cache_dir: this.cacheDir,`
			`...(!fs.existsSync(this.modelPath)`
			`? {`
			`// Show download progress if we need to download any files`
			`progress_callback: (data) => {`
			`if (!data.hasOwnProperty("progress")) return;`
			`console.log(`
			`\x1b[34m[Embedding - Downloading Model Files]\x1b[0m ${
			`data.file`
			} ${~~data?.progress}%`
			`);`
			`},`
			`}`
			`: {}),`
			`});`
			`} catch (error) {`
			`console.error("Failed to load the native embedding model:", error);`
			`throw error;`
			`}`
			`}`

			`async embedTextInput(textInput) {`
			`const result = await this.embedChunks(textInput);`
			`return result?.[0] \|\| [];`
			`}`

			`async embedChunks(textChunks = []) {`
			`const Embedder = await this.embedderClient();`
			`const embeddingResults = [];`
feat: add support for variable chunk length (#415) fix: cleanup code for embedding length clarify resolves #388 2023-12-08 01:27:36 +01:00			`for (const chunk of toChunks(textChunks, this.embeddingMaxChunkLength)) {`
Add built-in embedding engine into AnythingLLM (#411) * Implement use of native embedder (all-Mini-L6-v2) stop showing prisma queries during dev * Add native embedder as an available embedder selection * wrap model loader in try/catch * print progress on download * Update to progress output for embedder * move embedder selection options to component * forgot import * add Data privacy alert updates for local embedder 2023-12-06 19:36:22 +01:00			`const output = await Embedder(chunk, {`
			`pooling: "mean",`
			`normalize: true,`
			`});`
			`if (output.length === 0) continue;`
			`embeddingResults.push(output.tolist());`
			`}`

			`return embeddingResults.length > 0 ? embeddingResults.flat() : null;`
			`}`
			`}`

			`module.exports = {`
			`NativeEmbedder,`
			`};`