From 7c941c462c39ee47999ac4176e22525a5d91195d Mon Sep 17 00:00:00 2001 From: timothycarambat Date: Tue, 19 Dec 2023 12:39:49 -0800 Subject: [PATCH 1/6] Add ignore-paths for github actions --- .github/workflows/build-and-push-image.yaml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/.github/workflows/build-and-push-image.yaml b/.github/workflows/build-and-push-image.yaml index 76b6dac15..ca5fb52a0 100644 --- a/.github/workflows/build-and-push-image.yaml +++ b/.github/workflows/build-and-push-image.yaml @@ -3,6 +3,11 @@ name: Publish Docker image and Github Registry on: push: branches: ['master'] + paths-ignore: + - '*.md' + - 'cloud-deployments/*' + - 'images/*' + - '.vscode/*' jobs: push_to_registries: From f1fc2d90fa27fe016c34e0aa36a6194789cc91ba Mon Sep 17 00:00:00 2001 From: Timothy Carambat Date: Tue, 19 Dec 2023 13:24:50 -0800 Subject: [PATCH 2/6] Readme updates (#475) * wip * btn links * button updates * update dev instructions * typo --- README.md | 100 ++++++++++++++++++----------------- docker/HOW_TO_USE_DOCKER.md | 34 +++++++----- images/deployBtns/aws.png | Bin 0 -> 3560 bytes images/deployBtns/docker.png | Bin 0 -> 2746 bytes 4 files changed, 74 insertions(+), 60 deletions(-) create mode 100644 images/deployBtns/aws.png create mode 100644 images/deployBtns/docker.png diff --git a/README.md b/README.md index e91520ab4..879cf2dd7 100644 --- a/README.md +++ b/README.md @@ -26,10 +26,13 @@ A full-stack application that enables you to turn any document, resource, or pie ![Chatting](/images/screenshots/chatting.gif) -### Watch the demo! +
+<summary>Watch the demo!</summary>
+
+[![Watch the video](/images/youtube.png)](https://youtu.be/f95rGD9trL0)
+
+</details>
+
+### Product Overview
+AnythingLLM is a full-stack application where you can use commercial off-the-shelf LLMs or popular open source LLMs and vectorDB solutions to build a private ChatGPT with no compromises: one that you can run locally or host remotely, and use to chat intelligently with any documents you provide it.

@@ -79,64 +82,28 @@ This monorepo consists of three main sections:
- `docker`: Docker instructions and build process + information for building from source.
- `collector`: NodeJS express server that processes and parses documents from the UI.

-### Minimum Requirements
-> [!TIP]
-> Running AnythingLLM on AWS/GCP/Azure?
-> You should aim for at least 2GB of RAM. Disk storage is proportional to however much data
-> you will be storing (documents, vectors, models, etc). Minimum 10GB recommended.

+## 🛳 Self Hosting
+Mintplex Labs & the community maintain a number of deployment methods, scripts, and templates that you can use to run AnythingLLM locally. Refer to the table below for instructions on deploying to your preferred environment, or to deploy automatically.
+| Docker | AWS | GCP | Digital Ocean | Render.com |
+|----------------------------------------|----:|-----|---------------|------------|
+| [![Deploy on Docker][docker-btn]][docker-deploy] | [![Deploy on AWS][aws-btn]][aws-deploy] | [![Deploy on GCP][gcp-btn]][gcp-deploy] | [![Deploy on DigitalOcean][do-btn]][do-deploy] | [![Deploy on Render.com][render-btn]][render-deploy] |

-- `yarn` and `node` on your machine
-- access to an LLM running locally or remotely.

*AnythingLLM by default uses a built-in vector database powered by [LanceDB](https://github.com/lancedb/lancedb)
-
*AnythingLLM by default embeds text on instance privately [Learn More](/server/storage/models/README.md)
-
-## Recommended usage with Docker (easy!) 
-> [!IMPORTANT]
-> If you are running another service on localhost like Chroma, LocalAi, or LMStudio
-> you will need to use http://host.docker.internal:xxxx to access the service from within
-> the docker container using AnythingLLM, as `localhost:xxxx` will not resolve for the host system.
-> eg: Chroma host URL running on localhost:8000 on host machine needs to be http://host.docker.internal:8000
-> when used in AnythingLLM.
-
-> [!TIP]
-> It is best to mount the container's storage volume to a folder on your host machine
-> so that you can pull in future updates without deleting your existing data!
-
-`docker pull mintplexlabs/anythingllm:master`
-
-```shell
-export STORAGE_LOCATION=$HOME/anythingllm && \
-mkdir -p $STORAGE_LOCATION && \
-touch "$STORAGE_LOCATION/.env" && \
-docker run -d -p 3001:3001 \
---cap-add SYS_ADMIN \
--v ${STORAGE_LOCATION}:/app/server/storage \
--v ${STORAGE_LOCATION}/.env:/app/server/.env \
--e STORAGE_DIR="/app/server/storage" \
-mintplexlabs/anythingllm:master
-```
-
-Open [http://localhost:3001](http://localhost:3001) and you are now using AnythingLLM!
-All your data and progress will now persist between container rebuilds or pulls from Docker Hub.
-
-[Learn more about running AnythingLLM with Docker](./docker/HOW_TO_USE_DOCKER.md)
-
-### How to get started (Development environment)
+## How to set up for development
- `yarn setup` from the project root directory.
  - This will fill in the required `.env` files you'll need in each of the application sections. Go fill those out before proceeding or else things won't work right.
- `yarn prisma:setup` to build the Prisma client and migrate the database.

-To boot the server locally (run commands from root of repo):
+To boot the server locally (from root of repo):
- ensure `server/.env.development` is set and filled out.
`yarn dev:server`

-To boot the frontend locally (run commands from root of repo):
-- ensure `frontend/.env` is set and filled out. 
- ensure `VITE_API_BASE="http://localhost:3001/api"`
+To boot the frontend locally (from root of repo):
`yarn dev:frontend`

+To then run the document collector (from root of repo):
`yarn dev:collector`
+
[Learn about documents](./server/storage/documents/DOCUMENTS.md)

[Learn about vector caching](./server/storage/vector-cache/VECTOR_CACHE.md)

@@ -146,6 +113,9 @@ To boot the frontend locally (run commands from root of repo):
- create PR with branch name format of `<issue number>-<short name>`
- yee haw let's merge
+
+Telemetry for AnythingLLM + ## Telemetry AnythingLLM by Mintplex Labs Inc contains a telemetry feature that collects anonymous usage information. @@ -168,3 +138,37 @@ We will only track usage details that help us make product and roadmap decisions - Chat is sent. This is the most regular "event" and gives us an idea of the daily-activity of this project across all installations. Again, only the event is sent - we have no information on the nature or content of the chat itself. You can verify these claims by finding all locations `Telemetry.sendTelemetry` is called. Additionally these events are written to the output log so you can also see the specific data which was sent - if enabled. No IP or other identifying information is collected. The Telemetry provider is [PostHog](https://posthog.com/) - an open-source telemetry collection service. + +
+ +## 🔗 More Products + +- **[VectorAdmin][vector-admin]:** An all-in-one GUI & tool-suite for managing vector databases. +- **[OpenAI Assistant Swarm][assistant-swarm]:** Turn your entire library of OpenAI assistants into one single army commanded from a single agent. + +
+ +[![][back-to-top]](#readme-top) + +
+ +--- + +Copyright © 2023 [Mintplex Labs][profile-link].
This project is [MIT](./LICENSE) licensed.
+
+
[back-to-top]: https://img.shields.io/badge/-BACK_TO_TOP-222628?style=flat-square
[profile-link]: https://github.com/mintplex-labs
[vector-admin]: https://github.com/mintplex-labs/vector-admin
[assistant-swarm]: https://github.com/Mintplex-Labs/openai-assistant-swarm
[docker-btn]: ./images/deployBtns/docker.png
[docker-deploy]: ./docker/HOW_TO_USE_DOCKER.md
[aws-btn]: ./images/deployBtns/aws.png
[aws-deploy]: ./cloud-deployments/aws/cloudformation/DEPLOY.md
[gcp-btn]: https://deploy.cloud.run/button.svg
[gcp-deploy]: ./cloud-deployments/gcp/deployment/DEPLOY.md
[do-btn]: https://www.deploytodo.com/do-btn-blue.svg
[do-deploy]: ./cloud-deployments/digitalocean/terraform/DEPLOY.md
[render-btn]: https://render.com/images/deploy-to-render-button.svg
[render-deploy]: https://render.com/deploy?repo=https://github.com/Mintplex-Labs/anything-llm&branch=render
diff --git a/docker/HOW_TO_USE_DOCKER.md b/docker/HOW_TO_USE_DOCKER.md
index a74b11d45..5b5a58067 100644
--- a/docker/HOW_TO_USE_DOCKER.md
+++ b/docker/HOW_TO_USE_DOCKER.md
@@ -2,8 +2,20 @@
Use the Dockerized version of AnythingLLM for a much faster and more complete startup of AnythingLLM.

-## Requirements
-- Install [Docker](https://www.docker.com/) on your computer or machine.
+
+### Minimum Requirements
+> [!TIP]
+> Running AnythingLLM on AWS/GCP/Azure?
+> You should aim for at least 2GB of RAM. Disk storage is proportional to however much data
+> you will be storing (documents, vectors, models, etc). Minimum 10GB recommended.
+
+- `docker` installed on your machine
+- `yarn` and `node` on your machine
+- access to an LLM running locally or remotely
+
+*AnythingLLM by default uses a built-in vector database powered by [LanceDB](https://github.com/lancedb/lancedb)
+
+*AnythingLLM by default embeds text on instance privately [Learn More](../server/storage/models/README.md)

## Recommended way to run dockerized AnythingLLM! 
> [!IMPORTANT]
@@ -34,7 +46,13 @@ mintplexlabs/anythingllm:master
Go to `http://localhost:3001` and you are now using AnythingLLM! All your data and progress will persist between
container rebuilds or pulls from Docker Hub.

-## Build locally from source
+## How to use the user interface
+- To access the full application, visit `http://localhost:3001` in your browser.
+
+## About UID and GID in the ENV
+- The UID and GID are set to 1000 by default. This is the default user in the Docker container and on most host operating systems. If there is a mismatch between your host user UID and GID and what is set in the `.env` file, you may experience permission issues.
+
+## Build locally from source _not recommended for casual use_
- `git clone` this repo and `cd anything-llm` to get to the root directory.
- `touch server/storage/anythingllm.db` to create empty SQLite DB file.
- `cd docker/`
@@ -43,12 +61,6 @@ container rebuilds or pulls from Docker Hub.
Your docker host will show the image as online once the build process is completed. This will build the app to `http://localhost:3001`.

-## How to use the user interface
-- To access the full application, visit `http://localhost:3001` in your browser.
-
-## About UID and GID in the ENV
-- The UID and GID are set to 1000 by default. This is the default user in the Docker container and on most host operating systems. If there is a mismatch between your host user UID and GID and what is set in the `.env` file, you may experience permission issues.
-
## ⚠️ Vector DB support ⚠️

Out of the box, all vector databases are supported. Any vector databases requiring special configuration are listed below.

@@ -80,6 +92,4 @@ VITE_API_BASE="http://<YOUR_REACHABLE_IP_ADDRESS>:3001/api"

For example, if the docker instance is available on `192.168.1.222` your `VITE_API_BASE` would look like `VITE_API_BASE="http://192.168.1.222:3001/api"` in `frontend/.env.production`.

### Still not working? 
-[Ask for help on Discord](https://discord.gg/6UyHPeGZAC) - - +[Ask for help on Discord](https://discord.gg/6UyHPeGZAC) \ No newline at end of file diff --git a/images/deployBtns/aws.png b/images/deployBtns/aws.png new file mode 100644 index 0000000000000000000000000000000000000000..fde4a2a8d836ad6393e5e5188b173889894f071d GIT binary patch literal 3560 zcmb`K`#%$o_s1t=ZfUuvxzEU*2)WEc?vnfco-kV$a=&e#n8+=1saSZsCnRj{k)hm` z%a{!1l1nacrtt0iH+()noacF+AI=Z2UtW*LE5*vv=pvgS8vp>fXku(&4FE83{?#fh z%zybNPL2F`F@#tf-C~#>l#Bm+um&4Dg#ZBT-2XoefWnsoe?Om^7$9sTUT(R9@_7vT z>Lg{c2?+@TEK$IZ!BL_t%vP3Gnwpmmzv+$Y8yK=aVZFP%qL(Eq!y;qyFx`|n>*Za& zhn(4^zD1`tlu)~{qn}ehYqf%RVi&vKO&*fU%iA{J<^=*{uL+0Oe_&7+;JD2OaL|Um zgkRru9T+0dSs50{mCt4Aac!ENXs|rC$p2-^my3X zKn2!WN5+38wdkxt0jpanR=NKSJMw5hJ^ZairJ))kS&Mz{SJt2N*Vb5>1?ft(CW71D z;+#FygfD4%>p zQ;`o@Wn2u#sGQj99G)CXKzz^o{=!DKMj%yqnO`e9TU9gs`PwnMgi$u-k-3yJrP$x( z>V5GAE@JVUMVl#=wv@Q-{;Va^eM_*=ta%fXZ@kt4E46>;)nUjk^}FDKyg^f(()c*) zY!pt)^fAWF2JC#q{s)0^txr?Ue-bGnizn*l@9v!|!S$Ct*7 zK8_q}qg@x5_cZ2~)tut!bMW$~64)@zf*pPPa@WXb{xG35^~$&0zqN&2AIM#p(+N4D zwrC$0zS3UN-novq4-E@_Hc_l`BSv~{t%4fu$ZojDMyhBfEJA3NHuhtyPC!(EEX4&5 zllI_5%&M>#&Kn5hzFcSwpyQ#>IZU!uMkz$&!sA})hi9#G2G zMsP(Yna$n4I$?c_N3%8~Lq(t7!fUeXS`H+-IPosLa_B|Z*PGoBtyZTaqkjMFANT0m zzVg?BYj+7iX;36oE{Th2#aCoMn@|R&vvpMe!_?vIWYrLZEws-fcUH?vBVmXdXI5u= zC*c#s`kI~9*q;{QtL?%eML&H==5jQinI}~d6C`*~J!xx_rVp7c`gQblvmrbM%HXI~ zZvJNZ)uL=h=Mdt1dwG2S=cFhtSguJ-fFVSu5iI1o^#I;%lReuYbk?lDY5k*Q>Eu7G z#vi6cqF&VDFay6dH#)Xv(DTQZW+*-GqV&qbAzh5gk-LWsMIxFZA!2OqRh zfV{)9@=qTcGOdQoJ;`R0#QfZmmQRD(`Nk}hw6hI19C&PB=R*qxTi9f59JBkbfVKin zQ-R&TzT4e{W5m)E)rZ)pTL{abJW1yTO8jJS&v5P+C})1&czREhh630uJElHvnGo3fBE}TALLb)BU9TI#i0&{5vv)opiH;Q1_n60wv>b%&0l*Mhlh)w|h{n ztZ9n32^6TrX0egd=`O`o! 
zdAxq&m3XU#BuBi@R?CSdD2{d9BD_)~HigIM|d{bEo=B{{8l18w|aO==Y z1vX6T%x${YH+lVmmae1q#!v^c`CQQRP<@o5;y!(M5asN)(`w486+iY{=?#}74o#VO z6h*0wwhkAO^Rj^Wcs#P?!cyaAw3tg;cVHPB!L^@kCQc)U#geb?v)^0?cW->1&_OUW zzx_nLc*e2Txt9)^V6wp^K-z)`&lld4D&LbZ<)r=6Ry1M z{g17KWM8c3Np&MB?@YKRunTE(1fBzvvCl~g*!Iq2GnM)ck=e4%9HDny3ge+5TTw{dvZDqqT!JclddC^}wl!^PK~I99$0RX90O8_=)wR z0~4BMK5a?SxQ15!6MN(Q&PGr5K#`r5@Q;~&-c{vkRN_Z$#K530(i`crWK!r z7t1R$mItTSb~!fnc@;)$+(EUZV7ia&M=eq`>Tl&QLyj`1(PohR?(%L)wn>q=Jddt$ zcQ+896;xTi$ z&f(m=z(sGKHRLJy&I4P+s_TayC-fT9=4l2|@wn()!G*zum9F@ybJu>>uYHMwvEg@3 zgpJ!i47Cz7U#=BgH|0tcW?`yhu6>3$?AS-<<&r(`wvzkRxk3%?O=N;2cb{}ptG?fJ zs`V^<=LOrSWIJQe0QI6Wq%Z`<+MB7)k}pU}VfFEksmbz~?!3d;Jnf|uyj{M^fqhre zdSh#2h+mBGt*bO8awBbjAoc|Y>N^(H@8@nauit_~!8=fYJPt#=G%H8N@XX}kJFc@G zdK==BJ41iMSCqfVBzAWwlkfNIVS(HAB+-wo%1lN}=>!71@Aw%jqD}X?{RNs3dW*S! z3S)R%HAn60wsPN1J%u((G+9q2*d((sw!EFA+7b!NARm0>O4JBylyQvwY=Sg{RGKI= z^-L(8Qt5wAaHc1R-x~879DrtCrsQR@Cb9HGT<8L?hru?bJt^1%)t__%vYQ%2er*@+ z2rRlZ?U0)l&TSF(A-b!*bV?sXeY{g_Zt3@(g~4u7;F+)K4QYL!p&6N9M32E%RkM-O zFgq}#6%&K%mr?Z;Ms-1$H~4d9m~G#ZqtMl45P!)m7bwQX1}n$H-+LCsu^JRn7as|7 zo8~AhXTH(LfV9Z9D3v%ukz`VJ@o}y?DxcDx%GL`^-DGct1#%1of%wiH&i@eKZXShs z53h7)KGu}W5JLm=?(%~5O_#Ugar@eEsW&n_aRppCrzT9bc*c)z%0y1SghQ3%$n|nn zl7|(gaKf}PVxHhhIz_iMWIKblX{_-rl!Gj>!0A5EJNTGHjb?D-o zz!U9Jdty3B>+Vg`E4UVcx9gY!CkJ2*3i}ZF#~OO3)ez^aB`=_6R6E4KqP2?#Vw~VN z1?vc~vN1pOHQUH_evOR%Bs0{y{eR5eg1yxL6Y z=A|4ap6z>(8lyLEyqTaUo%MOX_92SgT#AGuM#-(2Z%OANe%w>S3 zR^llH#gI>wHn>284-opq{p4=FSF-J)^4mQK{byGf=W1!YUs4XN@_OI;xr01FtHK6O zXpBtedqZY$)?0o~6^X+^!BTuJnOZ(R>z5e5SPU|G*Q>Ct@JzKf$_anUHfeS`yka&O zX|+2D(+Fgy(oh%!uAJ<)A56JM6}AtzPv*Rgp)>$-IXeI0>y?;_F4W?kr9)vv{-ilP z-eNJ>O%7Hq7bvt4tEvtZmq(Ijz{;8d zt=;SMQ!@`P^H}l@Jx(T!E1IYvV!WfZuC&e28=ykAcyZ*Og^rWXlMcB`1_V*F`OBRk zIiG9z5Y=||q+hdO(1oB_cHmKnG8ZV}RAwCgkll1&QUwDrmVA+0;Dxn7&s+<-4x2($ zVmVCn6`C7rum=@_(hl#Wt2v~%ci7whvFJJCIC0I@u+H9390$(Slw7c9W&!fCG=D7Z zWDFAooRJlrateIdV|!#*zeeReYuf@0jTX1tkPv}4`2%Kkiu;rl!W0v)`Qv7p9Yl*L 
z8{8=x0CT=p_1BaQ&`^igc$(xmzL%-C#+b5UGxuEt_$MtvMszx-mUnVUv-qAF+Gg{H z!U0jSwOA5$O2Wqi*Rc`19K91PF49Z=^8S}KSwtjg&(n4C+NaB0P)>^sW@W)>6CTk^ zj@%JUL_&8>j50l1xTA=5w6M>W+%tw*N{&I(;m2ad(vQ~N0~2I%KmZH!pkoj8V&ptW zFXjygZ-70SL40-^kv%xCeovJ5-s;Tl_&~nTL;JlOsQZjfsg-?Z+?bF1l+|Qf-wl#o>p`}6HEl=$K0o|mm AumAu6 literal 0 HcmV?d00001 diff --git a/images/deployBtns/docker.png b/images/deployBtns/docker.png new file mode 100644 index 0000000000000000000000000000000000000000..e79604afd1e6d9f80c4efc7845aecaa47e812ff3 GIT binary patch literal 2746 zcmbW3`9BkmAIE1k$5zg05g{Gs%vJj2nq#Oi=E#xUwB(x1u{jE{VL3jC+-GBq@No>u zh}>k35II6-l~D@cKHvY~`~Bhle7|0g$NT;M@%?xuSePMBf*B<2ykB07U5D;s89)g#rLzXA=WG6gGD&Hxz?< zFW!4_zP_ZfyrFS&V|0A{_Lfhz@7ANRmc6OT-HE^X8;^7I8+H9UORfD>XU@zZY?Y-40xM5xzjn z|MlyDiCe5o#fuW?{gv+$=Yb-dsrizi!2}mTW1uGz>ZmDTmdNlJQ=fi(g zN%d1npMXtf=))07=TWgQj&uXMs_50A=p| zvI%a-hXzV|WR__|i-7iM%R!xO^Ba3LpZV4r-iiXHkRN>&TxR3=cz3GNCw|2kT_{Xm z-o=UMLlrp>zeTqn(K2;CZ#;vmE}ySI=TqF}u#2&~pEJT=6uD2AF6MB~nY^W`)FF{Z z7v)2cgpx1LdCVZ>A`b5fhOIVmAFgLyb!|K--61bD9AfbhryATvdAZ-y@bf`*E0@`a zL$jW*&fxUQ4|lh{-!NHE-@hIUME9kfWNUqMMW9>1!dbf(-_Gk-$v9r^?{JGW5YZ3& zYL`B;zdmQ=X7fDh=MUwDuc`sdGHJ5EF9$YmZ5eMnA=FG(daL+e{)8^+-=;RFG~%%S z!+<*g*ow6OX&A$?;dyuqzv6O3tIZE5qeE!5d(@rwjzer@HKv$%%#)gv%LV)U)t=oc zC599%@Nb7PR>tex3P_mg0?pH z2qxJoX;Lw?=tbbg=dA7}*&1!7Xs*H9wG@K@f@wwP&E8^KJa{$RH#Y0Fa(UgfkV zZ5Va@wBUW}tjH_1rs=lbnUjSW6opb3IOc?MpV@B<_T50EN-lhz-|T!@!3gU9L~-e< zetV~?8K!1i%4?|zIghNI=5KK`k&6>*j1An)e;T?Uq6dOVc_y4HledQ3tW=qk{0(Ex z6@U8CgoYFPt!fM^SWDttSzrc{l`;pF7BtIC8c&3b>v`O};{WT5PBG@M&+U^t;AlN% zd5K=Zo0=(GLMgpF4{;%loqP`^-q*6IjTltax^sR0#a68h_Uz!@TAJ_Y!~#$T z8nK@?D{9O<7KspV>TwC?|E3L%sUEpe9~`~{ z5WdzL_>$(yyGUB8hQT7SeRxA8Qp$zLz)U(@dP=1*ki0Is6|VJi)eo<6>t_br)q9aN z0*6>h-aZa}HzE7aGugRjX|ceeOL@4Dnxo@)_#hfRej2dXzs(Sa8<0;)$vOcA@BD1+lkOB;@g(Pa6~T;} zTU4HS6zcNYM-w-jsNA--X4I%fG@C`S_P(;>L}|T0rw59OEgVp9?XI|qs!e@;C9SRj zb|Fl8W>P9pmwUw>4tk7GA6}R&Tjg`~9Dok+^q+~yf2Pm#=orDH%&gA?sq$NCsaZXi*DdGLXAK5hZcqsYgWa<|=G(Y*6ZH*a3YggKT=_U24M}V7$iuOkt?6 
z#w)n(ptE&MA6y8xEiJ4w2}*f43P=EhIAxA^r<nrz)Q2Y^&(WzoZ^3?5jbVmg=d#Re2tWN_y%Bg(q#@iJ|1BDZg;q<7)0SnoKlL(#KF++H%sodO1S_Rg2Q^U)Sw?hsB%knzH%9ZiHd}Fr)zbUva z>J~ZvBg*5Lnh>0_(aw~TTxfm2$xyUgPg+qM?9mTDUw?`NFtxnWWi96 z^J%M;xF!rLvcy(>D}QXn4>b07@UiE6M=tveS>L_x;`BbS6;%rMN4}efnI^TOfDvL~jRs*7KgMQ^Xm}Qogss@$ik2N01B;b5VW56X)_G#qzY=H68{nlL$Ac&KW*3PtT3)wUBxup`Svh3tsMF*5T&p0ZMnC&WD zb-;_1BDK1tS|Q x6&@u2ptN7o-f*WTDjq6*x06S>qW*vE>vVh|HkRYPjQ-?LfQg}*0R?_9=0Aj}KDYn? literal 0 HcmV?d00001 From f2fadd6d2e233d683dcd0b30dadaded29ef3685a Mon Sep 17 00:00:00 2001 From: Timothy Carambat Date: Tue, 19 Dec 2023 13:27:09 -0800 Subject: [PATCH 3/6] Add placeholder collector ENV file (#476) resolves #474 --- collector/.env.example | 1 + 1 file changed, 1 insertion(+) create mode 100644 collector/.env.example diff --git a/collector/.env.example b/collector/.env.example new file mode 100644 index 000000000..91d0e10a5 --- /dev/null +++ b/collector/.env.example @@ -0,0 +1 @@ +# Placeholder .env file for collector runtime \ No newline at end of file From 32b1f050628763fb48663dd63648561e4acd848d Mon Sep 17 00:00:00 2001 From: timothycarambat Date: Tue, 19 Dec 2023 13:30:17 -0800 Subject: [PATCH 4/6] add Top link --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index 879cf2dd7..9ed7cc609 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,4 @@ +

AnythingLLM logo



From a7f6003277143c25f838ae26165d9a8a5fb69f50 Mon Sep 17 00:00:00 2001
From: timothycarambat
Date: Tue, 19 Dec 2023 16:20:34 -0800
Subject: [PATCH 5/6] fix: set lower maxChunk limit on native embedder to stay
 within resource constraints
chore: update comment for what embedding chunk means

---
 server/utils/EmbeddingEngines/azureOpenAi/index.js | 2 +-
 server/utils/EmbeddingEngines/localAi/index.js     | 2 +-
 server/utils/EmbeddingEngines/native/index.js      | 4 ++--
 server/utils/EmbeddingEngines/openAi/index.js      | 2 +-
 4 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/server/utils/EmbeddingEngines/azureOpenAi/index.js b/server/utils/EmbeddingEngines/azureOpenAi/index.js
index 8959b0007..3f36b576b 100644
--- a/server/utils/EmbeddingEngines/azureOpenAi/index.js
+++ b/server/utils/EmbeddingEngines/azureOpenAi/index.js
@@ -14,7 +14,7 @@ class AzureOpenAiEmbedder {
     );
     this.openai = openai;

-    // The maximum amount of "inputs" that OpenAI API can process in a single call.
+    // Limit of how many strings we can process in a single pass to stay within resource or network limits
     // https://learn.microsoft.com/en-us/azure/ai-services/openai/faq#i-am-trying-to-use-embeddings-and-received-the-error--invalidrequesterror--too-many-inputs--the-max-number-of-inputs-is-1---how-do-i-fix-this-:~:text=consisting%20of%20up%20to%2016%20inputs%20per%20API%20request
     this.embeddingMaxChunkLength = 16;
   }

diff --git a/server/utils/EmbeddingEngines/localAi/index.js b/server/utils/EmbeddingEngines/localAi/index.js
index 0f43cc7dc..68fe66544 100644
--- a/server/utils/EmbeddingEngines/localAi/index.js
+++ b/server/utils/EmbeddingEngines/localAi/index.js
@@ -17,7 +17,7 @@ class LocalAiEmbedder {
     });
     this.openai = new OpenAIApi(config);

-    // Arbitrary limit of string size in chars to ensure we stay within reasonable POST request size. 
+    // Limit of how many strings we can process in a single pass to stay within resource or network limits
     this.embeddingMaxChunkLength = maximumChunkLength();
   }

diff --git a/server/utils/EmbeddingEngines/native/index.js b/server/utils/EmbeddingEngines/native/index.js
index 2081e3fde..81189d4e2 100644
--- a/server/utils/EmbeddingEngines/native/index.js
+++ b/server/utils/EmbeddingEngines/native/index.js
@@ -13,8 +13,8 @@ class NativeEmbedder {
     );
     this.modelPath = path.resolve(this.cacheDir, "Xenova", "all-MiniLM-L6-v2");

-    // Arbitrary limit of string size in chars to ensure we stay within reasonable POST request size.
-    this.embeddingMaxChunkLength = 1_000;
+    // Limit of how many strings we can process in a single pass to stay within resource or network limits
+    this.embeddingMaxChunkLength = 50;

     // Make directory when it does not exist in existing installations
     if (!fs.existsSync(this.cacheDir)) fs.mkdirSync(this.cacheDir);

diff --git a/server/utils/EmbeddingEngines/openAi/index.js b/server/utils/EmbeddingEngines/openAi/index.js
index 8cfa23516..6ba38c898 100644
--- a/server/utils/EmbeddingEngines/openAi/index.js
+++ b/server/utils/EmbeddingEngines/openAi/index.js
@@ -10,7 +10,7 @@ class OpenAiEmbedder {
     const openai = new OpenAIApi(config);
     this.openai = openai;

-    // Arbitrary limit of string size in chars to ensure we stay within reasonable POST request size. 
+    // Limit of how many strings we can process in a single pass to stay within resource or network limits
     this.embeddingMaxChunkLength = 1_000;
   }

From 67725e807ae9680fde87f90c700e8ff4bfe04d14 Mon Sep 17 00:00:00 2001
From: timothycarambat
Date: Tue, 19 Dec 2023 16:22:25 -0800
Subject: [PATCH 6/6] fix: broken build file

---
 .github/workflows/build-and-push-image.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build-and-push-image.yaml b/.github/workflows/build-and-push-image.yaml
index ca5fb52a0..943af5526 100644
--- a/.github/workflows/build-and-push-image.yaml
+++ b/.github/workflows/build-and-push-image.yaml
@@ -3,7 +3,7 @@ name: Publish Docker image and Github Registry
 on:
   push:
     branches: ['master']
-    paths-ignore: 
+    paths-ignore:
       - '*.md'
       - 'cloud-deployments/*'
       - 'images/*'
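A closing note on patch 5: `embeddingMaxChunkLength` caps how many strings are embedded per pass, so the native embedder now works through its input in batches of 50 rather than 1,000. A rough sketch of that batching (the helper name is invented for illustration, not taken from the codebase):

```javascript
// Split the full list of text chunks into batches of at most
// maxChunkLength strings, one batch per embedding pass.
// NOTE: illustrative helper only; the real embedders batch internally.
function toEmbedderBatches(textChunks, maxChunkLength = 50) {
  const batches = [];
  for (let i = 0; i < textChunks.length; i += maxChunkLength) {
    batches.push(textChunks.slice(i, i + maxChunkLength));
  }
  return batches;
}
```

Each batch would then go out as its own embedding request, which is what keeps a single pass within resource or network limits on constrained hosts.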