anything-llm/server/endpoints/chat.js

const { v4: uuidv4 } = require("uuid");
const { reqBody, userFromSession, multiUserMode } = require("../utils/http");
const { validatedRequest } = require("../utils/middleware/validatedRequest");
const { WorkspaceChats } = require("../models/workspaceChats");
const { SystemSettings } = require("../models/systemSettings");
const { Telemetry } = require("../models/telemetry");
const { streamChatWithWorkspace } = require("../utils/chats/stream");
const {
  ROLES,
  flexUserRoleValid,
} = require("../utils/middleware/multiUserProtected");
const { EventLogs } = require("../models/eventLogs");
const {
  validWorkspaceAndThreadSlug,
  validWorkspaceSlug,
} = require("../utils/middleware/validWorkspace");
const { writeResponseChunk } = require("../utils/helpers/chat/responses");

/**
 * Builds the "abort" payload sent to the client when a chat request cannot
 * be fulfilled. The key order matches what both routes have always emitted.
 *
 * @param {string|null} error - Message to surface to the client.
 * @returns {{id: string, type: string, textResponse: null, sources: Array, close: boolean, error: (string|null)}}
 */
function abortChunk(error) {
  return {
    id: uuidv4(),
    type: "abort",
    textResponse: null,
    sources: [],
    close: true,
    error,
  };
}

/**
 * Sets the event-stream response headers and flushes them to the client.
 * Once this has run the handler can no longer change the status code, so
 * failures must be reported as chunks written to the stream.
 *
 * @param {object} response - The HTTP response object for the request.
 */
function openEventStream(response) {
  response.setHeader("Cache-Control", "no-cache");
  response.setHeader("Content-Type", "text/event-stream");
  response.setHeader("Access-Control-Allow-Origin", "*");
  response.setHeader("Connection", "keep-alive");
  response.flushHeaders();
}

/**
 * Checks the rolling 24 hour chat quota for the requesting user.
 *
 * The quota only applies when `multiUserMode(response)` is truthy, the user
 * is not an admin, the `limit_user_messages` setting is the string "true",
 * and `message_limit` converts to a non-zero number. The count is filtered
 * by user and creation time only (no workspace or thread filter), so
 * creating new threads cannot be used to bypass the limit.
 *
 * @param {object} response - The HTTP response object for the request.
 * @param {object} user - The session user; `role` and `id` are read.
 * @returns {Promise<string|null>} The quota error message when the limit has
 *   been reached, otherwise null.
 */
async function chatQuotaError(response, user) {
  if (!multiUserMode(response) || user.role === ROLES.admin) return null;

  const limitMessagesSetting = await SystemSettings.get({
    label: "limit_user_messages",
  });
  if (limitMessagesSetting?.value !== "true") return null;

  const messageLimitSetting = await SystemSettings.get({
    label: "message_limit",
  });
  // A missing, zero, or non-numeric limit disables enforcement.
  const systemLimit = Number(messageLimitSetting?.value);
  if (!systemLimit) return null;

  const currentChatCount = await WorkspaceChats.count({
    user_id: user.id,
    createdAt: {
      gte: new Date(Date.now() - 24 * 60 * 60 * 1000),
    },
  });

  if (currentChatCount >= systemLimit) {
    return `You have met your maximum 24 hour chat quota of ${systemLimit} chats set by the instance administrators. Try again later.`;
  }
  return null;
}

/**
 * Sends the `sent_chat` telemetry event with the current provider selection
 * read from the environment (falling back to the literals below).
 *
 * @param {object} response - The HTTP response object for the request.
 * @returns {Promise<*>} Whatever `Telemetry.sendTelemetry` resolves to.
 */
function sendChatTelemetry(response) {
  return Telemetry.sendTelemetry("sent_chat", {
    multiUserMode: multiUserMode(response),
    LLMSelection: process.env.LLM_PROVIDER || "openai",
    Embedder: process.env.EMBEDDING_ENGINE || "inherit",
    VectorDbSelection: process.env.VECTOR_DB || "pinecone",
  });
}

/**
 * Registers the streaming chat routes on the given app.
 *
 * Routes:
 *  - POST /workspace/:slug/stream-chat
 *  - POST /workspace/:slug/thread/:threadSlug/stream-chat
 *
 * Both handlers reply with a 400 JSON abort payload when the message is
 * empty. Otherwise they open an event stream, enforce the per-user chat
 * quota, stream the chat, record telemetry plus an event log entry, and
 * always end the response once the stream has been opened.
 *
 * @param {object} app - Router/app exposing `post(path, middleware, handler)`.
 *   When falsy nothing is registered.
 * @returns {void}
 */
function chatEndpoints(app) {
  if (!app) return;

  app.post(
    "/workspace/:slug/stream-chat",
    [validatedRequest, flexUserRoleValid([ROLES.all]), validWorkspaceSlug],
    async (request, response) => {
      try {
        const user = await userFromSession(request, response);
        const { message } = reqBody(request);
        // Presumably populated by the validWorkspaceSlug middleware - confirm.
        const workspace = response.locals.workspace;

        if (!message?.length) {
          response.status(400).json(abortChunk("Message is empty."));
          return;
        }

        openEventStream(response);

        const quotaError = await chatQuotaError(response, user);
        if (quotaError) {
          writeResponseChunk(response, abortChunk(quotaError));
          // Headers are already flushed with keep-alive, so the stream must
          // be closed explicitly (as the catch path does) or it stays open.
          response.end();
          return;
        }

        await streamChatWithWorkspace(
          response,
          workspace,
          message,
          workspace?.chatMode,
          user
        );
        await sendChatTelemetry(response);

        await EventLogs.logEvent(
          "sent_chat",
          {
            workspaceName: workspace?.name,
            chatModel: workspace?.chatModel || "System Default",
          },
          user?.id
        );
        response.end();
      } catch (e) {
        console.error(e);
        writeResponseChunk(response, abortChunk(e.message));
        response.end();
      }
    }
  );

  app.post(
    "/workspace/:slug/thread/:threadSlug/stream-chat",
    [
      validatedRequest,
      flexUserRoleValid([ROLES.all]),
      validWorkspaceAndThreadSlug,
    ],
    async (request, response) => {
      try {
        const user = await userFromSession(request, response);
        const { message } = reqBody(request);
        // Presumably populated by validWorkspaceAndThreadSlug - confirm.
        const workspace = response.locals.workspace;
        const thread = response.locals.thread;

        if (!message?.length) {
          response.status(400).json(abortChunk("Message is empty."));
          return;
        }

        openEventStream(response);

        // Chat qty includes all threads because any user can freely
        // create threads and would bypass this rule.
        const quotaError = await chatQuotaError(response, user);
        if (quotaError) {
          writeResponseChunk(response, abortChunk(quotaError));
          // Headers are already flushed with keep-alive, so the stream must
          // be closed explicitly (as the catch path does) or it stays open.
          response.end();
          return;
        }

        await streamChatWithWorkspace(
          response,
          workspace,
          message,
          workspace?.chatMode,
          user,
          thread
        );
        await sendChatTelemetry(response);

        await EventLogs.logEvent(
          "sent_chat",
          {
            workspaceName: workspace.name,
            thread: thread.name,
            chatModel: workspace?.chatModel || "System Default",
          },
          user?.id
        );
        response.end();
      } catch (e) {
        console.error(e);
        writeResponseChunk(response, abortChunk(e.message));
        response.end();
      }
    }
  );
}

// Export the route registrar; the caller passes in the app to attach routes to.
module.exports = { chatEndpoints };
dump error message to frontend instead of generic error (#114) 2023-06-27 02:54:55 +02:00			`const { v4: uuidv4 } = require("uuid");`
[FEATURE] Enable the ability to have multi user instances (#158) * multi user wip * WIP MUM features * invitation mgmt * suspend or unsuspend users * workspace mangement * manage chats * manage chats * add Support for admin system settings for users to delete workspaces and limit chats per user * fix issue ith system var update app to lazy load invite page * cleanup and bug fixes * wrong method * update readme * update readme * update readme * bump version to 0.1.0 2023-07-25 19:37:04 +02:00			`const { reqBody, userFromSession, multiUserMode } = require("../utils/http");`
			`const { validatedRequest } = require("../utils/middleware/validatedRequest");`
			`const { WorkspaceChats } = require("../models/workspaceChats");`
			`const { SystemSettings } = require("../models/systemSettings");`
Enable optional Telemetry integration via posthog (#190) * Enable optional Telemetry integration via posthog 2023-08-15 02:42:17 +02:00			`const { Telemetry } = require("../models/telemetry");`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`const { streamChatWithWorkspace } = require("../utils/chats/stream");`
Implement total permission overhaul (#629) * Implement total permission overhaul Add explicit permissions on each flex and strict route Patch issues with role escalation and CRUD of users Patch permissions on all routes for coverage Improve middleware to accept role array for clarity * update comments * remove permissions to API-keys for manager. Manager could generate API-key and using high-privelege api-key give themselves admin * update sidebar permissions for multi-user and single user * update options for mobile sidebar 2024-01-22 23:14:01 +01:00			`const {`
			`ROLES,`
			`flexUserRoleValid,`
			`} = require("../utils/middleware/multiUserProtected");`
[FEAT] Automated audit logging (#667) * WIP event logging - new table for events and new settings view for viewing * WIP add logging * UI for log rows * rename files to Logging to prevent getting gitignore * add metadata for all logging events and colored badges in logs page * remove unneeded comment * cleanup namespace for logging * clean up backend calls * update logging to show to => from settings changes * add logging for invitations, created, deleted, and accepted * add logging for user created, updated, suspended, or removed * add logging for workspace deleted * add logging for chat logs exported * add logging for API keys, LLM, embedder, vector db, embed chat, and reset button * modify event logs * update to event log types * simplify rendering of event badges --------- Co-authored-by: timothycarambat <rambat1010@gmail.com> 2024-02-07 00:21:40 +01:00			`const { EventLogs } = require("../models/eventLogs");`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00			`const {`
			`validWorkspaceAndThreadSlug,`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`validWorkspaceSlug,`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00			`} = require("../utils/middleware/validWorkspace");`
Refactor LLM chat backend (#717) * refactor stream/chat/embed-stram to be a single execution logic path so that it is easier to maintain and build upon * no thread in sync chat since only api uses it adjust import locations 2024-02-14 21:32:07 +01:00			`const { writeResponseChunk } = require("../utils/helpers/chat/responses");`
inital commit ⚡ 2023-06-04 04:28:07 +02:00
			`function chatEndpoints(app) {`
			`if (!app) return;`

Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`app.post(`
			`"/workspace/:slug/stream-chat",`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`[validatedRequest, flexUserRoleValid([ROLES.all]), validWorkspaceSlug],`
Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`async (request, response) => {`
			`try {`
			`const user = await userFromSession(request, response);`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`const { message } = reqBody(request);`
			`const workspace = response.locals.workspace;`
Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`if (!message?.length) {`
Implement streaming for workspace chats via API (#604) 2024-01-16 19:37:46 +01:00			`response.status(400).json({`
			`id: uuidv4(),`
			`type: "abort",`
			`textResponse: null,`
			`sources: [],`
			`close: true,`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`error: !message?.length ? "Message is empty." : null,`
Implement streaming for workspace chats via API (#604) 2024-01-16 19:37:46 +01:00			`});`
			`return;`
			`}`

Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`response.setHeader("Cache-Control", "no-cache");`
			`response.setHeader("Content-Type", "text/event-stream");`
			`response.setHeader("Access-Control-Allow-Origin", "*");`
			`response.setHeader("Connection", "keep-alive");`
			`response.flushHeaders();`

Implement total permission overhaul (#629) * Implement total permission overhaul Add explicit permissions on each flex and strict route Patch issues with role escalation and CRUD of users Patch permissions on all routes for coverage Improve middleware to accept role array for clarity * update comments * remove permissions to API-keys for manager. Manager could generate API-key and using high-privelege api-key give themselves admin * update sidebar permissions for multi-user and single user * update options for mobile sidebar 2024-01-22 23:14:01 +01:00			`if (multiUserMode(response) && user.role !== ROLES.admin) {`
Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`const limitMessagesSetting = await SystemSettings.get({`
			`label: "limit_user_messages",`
			`});`
			`const limitMessages = limitMessagesSetting?.value === "true";`

			`if (limitMessages) {`
			`const messageLimitSetting = await SystemSettings.get({`
			`label: "message_limit",`
			`});`
			`const systemLimit = Number(messageLimitSetting?.value);`

			`if (!!systemLimit) {`
			`const currentChatCount = await WorkspaceChats.count({`
			`user_id: user.id,`
			`createdAt: {`
			`gte: new Date(new Date() - 24 * 60 * 60 * 1000),`
			`},`
			`});`

			`if (currentChatCount >= systemLimit) {`
			`writeResponseChunk(response, {`
			`id: uuidv4(),`
			`type: "abort",`
			`textResponse: null,`
			`sources: [],`
			`close: true,`
			error: `You have met your maximum 24 hour chat quota of ${systemLimit} chats set by the instance administrators. Try again later.`,
			`});`
			`return;`
			`}`
			`}`
			`}`
			`}`

Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`await streamChatWithWorkspace(`
			`response,`
			`workspace,`
			`message,`
			`workspace?.chatMode,`
			`user`
			`);`
Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`await Telemetry.sendTelemetry("sent_chat", {`
			`multiUserMode: multiUserMode(response),`
			`LLMSelection: process.env.LLM_PROVIDER \|\| "openai",`
add embedding engine to telem 2023-12-07 17:53:37 +01:00			`Embedder: process.env.EMBEDDING_ENGINE \|\| "inherit",`
Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`VectorDbSelection: process.env.VECTOR_DB \|\| "pinecone",`
			`});`
[FEAT] Automated audit logging (#667) * WIP event logging - new table for events and new settings view for viewing * WIP add logging * UI for log rows * rename files to Logging to prevent getting gitignore * add metadata for all logging events and colored badges in logs page * remove unneeded comment * cleanup namespace for logging * clean up backend calls * update logging to show to => from settings changes * add logging for invitations, created, deleted, and accepted * add logging for user created, updated, suspended, or removed * add logging for workspace deleted * add logging for chat logs exported * add logging for API keys, LLM, embedder, vector db, embed chat, and reset button * modify event logs * update to event log types * simplify rendering of event badges --------- Co-authored-by: timothycarambat <rambat1010@gmail.com> 2024-02-07 00:21:40 +01:00
			`await EventLogs.logEvent(`
			`"sent_chat",`
			`{`
			`workspaceName: workspace?.name,`
			`chatModel: workspace?.chatModel \|\| "System Default",`
			`},`
			`user?.id`
			`);`
Enable chat streaming for LLMs (#354) * [Draft] Enable chat streaming for LLMs * stream only, move sendChat to deprecated * Update TODO deprecation comments update console output color for streaming disabled 2023-11-14 00:07:30 +01:00			`response.end();`
			`} catch (e) {`
			`console.error(e);`
			`writeResponseChunk(response, {`
			`id: uuidv4(),`
			`type: "abort",`
			`textResponse: null,`
			`sources: [],`
			`close: true,`
			`error: e.message,`
			`});`
			`response.end();`
			`}`
			`}`
			`);`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00
			`app.post(`
			`"/workspace/:slug/thread/:threadSlug/stream-chat",`
			`[`
			`validatedRequest,`
			`flexUserRoleValid([ROLES.all]),`
			`validWorkspaceAndThreadSlug,`
			`],`
			`async (request, response) => {`
			`try {`
			`const user = await userFromSession(request, response);`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`const { message } = reqBody(request);`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00			`const workspace = response.locals.workspace;`
			`const thread = response.locals.thread;`

Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`if (!message?.length) {`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00			`response.status(400).json({`
			`id: uuidv4(),`
			`type: "abort",`
			`textResponse: null,`
			`sources: [],`
			`close: true,`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`error: !message?.length ? "Message is empty." : null,`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00			`});`
			`return;`
			`}`

			`response.setHeader("Cache-Control", "no-cache");`
			`response.setHeader("Content-Type", "text/event-stream");`
			`response.setHeader("Access-Control-Allow-Origin", "*");`
			`response.setHeader("Connection", "keep-alive");`
			`response.flushHeaders();`

			`if (multiUserMode(response) && user.role !== ROLES.admin) {`
			`const limitMessagesSetting = await SystemSettings.get({`
			`label: "limit_user_messages",`
			`});`
			`const limitMessages = limitMessagesSetting?.value === "true";`

			`if (limitMessages) {`
			`const messageLimitSetting = await SystemSettings.get({`
			`label: "message_limit",`
			`});`
			`const systemLimit = Number(messageLimitSetting?.value);`

			`if (!!systemLimit) {`
			`// Chat qty includes all threads because any user can freely`
			`// create threads and would bypass this rule.`
			`const currentChatCount = await WorkspaceChats.count({`
			`user_id: user.id,`
			`createdAt: {`
			`gte: new Date(new Date() - 24 * 60 * 60 * 1000),`
			`},`
			`});`

			`if (currentChatCount >= systemLimit) {`
			`writeResponseChunk(response, {`
			`id: uuidv4(),`
			`type: "abort",`
			`textResponse: null,`
			`sources: [],`
			`close: true,`
			error: `You have met your maximum 24 hour chat quota of ${systemLimit} chats set by the instance administrators. Try again later.`,
			`});`
			`return;`
			`}`
			`}`
			`}`
			`}`

			`await streamChatWithWorkspace(`
			`response,`
			`workspace,`
			`message,`
Breakout Chat/Query mode as a workspace setting (#734) Remove useless icons in prompt bar Add chatMode column to workspaces that defaults to chat Add UI for toggle of chat mode with hint Update UI for workspace settings to match designs 2024-02-16 23:50:40 +01:00			`workspace?.chatMode,`
Implement workspace threading that is backwards compatible (#699) * Implement workspace thread that is compatible with legacy versions * last touches * comment on chat qty enforcement 2024-02-09 03:37:22 +01:00			`user,`
			`thread`
			`);`
			`await Telemetry.sendTelemetry("sent_chat", {`
			`multiUserMode: multiUserMode(response),`
			`LLMSelection: process.env.LLM_PROVIDER \|\| "openai",`
			`Embedder: process.env.EMBEDDING_ENGINE \|\| "inherit",`
			`VectorDbSelection: process.env.VECTOR_DB \|\| "pinecone",`
			`});`

			`await EventLogs.logEvent(`
			`"sent_chat",`
			`{`
			`workspaceName: workspace.name,`
			`thread: thread.name,`
			`chatModel: workspace?.chatModel \|\| "System Default",`
			`},`
			`user?.id`
			`);`
			`response.end();`
			`} catch (e) {`
			`console.error(e);`
			`writeResponseChunk(response, {`
			`id: uuidv4(),`
			`type: "abort",`
			`textResponse: null,`
			`sources: [],`
			`close: true,`
			`error: e.message,`
			`});`
			`response.end();`
			`}`
			`}`
			`);`
inital commit ⚡ 2023-06-04 04:28:07 +02:00			`}`

Implement Chroma Support (#1) 2023-06-08 06:31:35 +02:00			`module.exports = { chatEndpoints };`