From 49ad77efded77e589f8b185f43213df48ab6b644 Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:34:27 -0700 Subject: [PATCH 1/8] Update compose.cpu.yml --- docker/compose.cpu.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/compose.cpu.yml b/docker/compose.cpu.yml index 3650e8a..6c33e0a 100644 --- a/docker/compose.cpu.yml +++ b/docker/compose.cpu.yml @@ -1,6 +1,6 @@ services: infinity: - image: michaelf34/infinity:0.0.32 + image: michaelf34/infinity:0.0.63 container_name: jamai_infinity entrypoint: [ From cfb9edb00c03964ac8ba8cd87b427bb417d1347f Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:54:22 -0700 Subject: [PATCH 2/8] Update models.json --- services/api/src/owl/configs/models.json | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/services/api/src/owl/configs/models.json b/services/api/src/owl/configs/models.json index 6989c0b..ff5b897 100644 --- a/services/api/src/owl/configs/models.json +++ b/services/api/src/owl/configs/models.json @@ -137,7 +137,7 @@ { "id": "ellm/sentence-transformers/all-MiniLM-L6-v2", "litellm_id": "openai/sentence-transformers/all-MiniLM-L6-v2", - "context_length": 8192, + "context_length": 512, "embedding_size": 1024, "languages": ["mul"], "api_base": "http://infinity:6909", @@ -150,9 +150,9 @@ { "id": "cohere/rerank-multilingual-v3.0", "context_length": 512, "languages": ["mul"], "owned_by": "cohere" }, { "id": "ellm/cross-encoder/ms-marco-TinyBERT-L-2", - "context_length": 8192, + "context_length": 512, "languages": ["mul"], - "api_base": "http://infinity:6919", + "api_base": "http://infinity:6909", "owned_by": "ellm" } ] From 63844feb74929549863643f41212825e25cae0fb Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:55:42 -0700 Subject: [PATCH 3/8] Update models.json --- services/api/src/owl/configs/models.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/services/api/src/owl/configs/models.json b/services/api/src/owl/configs/models.json index ff5b897..213cdef 100644 --- a/services/api/src/owl/configs/models.json +++ b/services/api/src/owl/configs/models.json @@ -149,7 +149,7 @@ { "id": "cohere/rerank-english-v3.0", "context_length": 512, "languages": ["en"], "owned_by": "cohere" }, { "id": "cohere/rerank-multilingual-v3.0", "context_length": 512, "languages": ["mul"], "owned_by": "cohere" }, { - "id": "ellm/cross-encoder/ms-marco-TinyBERT-L-2", + "id": "ellm/mixedbread-ai/mxbai-rerank-xsmall-v1", "context_length": 512, "languages": ["mul"], "api_base": "http://infinity:6909", From 512cdf004d2b6d4693722f8fca785e578171fe34 Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:57:05 -0700 Subject: [PATCH 4/8] Update .env --- .env | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.env b/.env index 56f5fa2..16dbeb2 100644 --- a/.env +++ b/.env @@ -15,7 +15,7 @@ OWL_DB_DIR=db OWL_LOG_DIR=logs DOCIO_WORKERS=1 DOCIO_DEVICE=cpu -EMBEDDING_MODEL=sentence-transformers/all-MiniLM-L6-v2 -RERANKER_MODEL=cross-encoder/ms-marco-TinyBERT-L-2 +EMBEDDING_MODEL=michaelfeil/bge-small-en-v1.5 +RERANKER_MODEL=mixedbread-ai/mxbai-rerank-xsmall-v1 OWL_CONCURRENT_ROWS_BATCH_SIZE=3 -OWL_CONCURRENT_COLS_BATCH_SIZE=5 \ No newline at end of file +OWL_CONCURRENT_COLS_BATCH_SIZE=5 From 595960d0577e31f01d3afb36888b445a62ff17cf Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:57:36 -0700 Subject: [PATCH 5/8] Update ci.yml --- .github/workflows/ci.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 9e788d9..3f68680 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -55,8 +55,8 @@ jobs: run: | set -e export API_DEVICE=cpu - export EMBEDDING_MODEL=sentence-transformers/all-MiniLM-L6-v2 - export RERANKER_MODEL=cross-encoder/ms-marco-TinyBERT-L-2 + export EMBEDDING_MODEL=michaelfeil/bge-small-en-v1.5 + export RERANKER_MODEL=mixedbread-ai/mxbai-rerank-xsmall-v1 # Edit .env file ORGS=$(printenv | grep API_KEY | xargs -I {} echo {} | cut -d '=' -f 1) From bbf8359d57e7507a6a52be261b1560fdd6575a11 Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:58:48 -0700 Subject: [PATCH 6/8] Update models.json --- services/api/src/owl/configs/models.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/services/api/src/owl/configs/models.json b/services/api/src/owl/configs/models.json index 213cdef..fc8bc3d 100644 --- a/services/api/src/owl/configs/models.json +++ b/services/api/src/owl/configs/models.json @@ -135,8 +135,8 @@ "owned_by": "cohere" }, { - "id": "ellm/sentence-transformers/all-MiniLM-L6-v2", - "litellm_id": "openai/sentence-transformers/all-MiniLM-L6-v2", + "id": "ellm/BAAI/bge-small-en-v1.5", + "litellm_id": "openai/BAAI/bge-small-en-v1.5", "context_length": 512, "embedding_size": 1024, "languages": ["mul"], From dc7419677758b2b31280227504fb19136587022d Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:59:05 -0700 Subject: [PATCH 7/8] Update .env --- .env | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.env b/.env index 16dbeb2..6d75f13 100644 --- a/.env +++ b/.env @@ -15,7 +15,7 @@ OWL_DB_DIR=db OWL_LOG_DIR=logs DOCIO_WORKERS=1 DOCIO_DEVICE=cpu -EMBEDDING_MODEL=michaelfeil/bge-small-en-v1.5 +EMBEDDING_MODEL=BAAI/bge-small-en-v1.5 RERANKER_MODEL=mixedbread-ai/mxbai-rerank-xsmall-v1 OWL_CONCURRENT_ROWS_BATCH_SIZE=3 OWL_CONCURRENT_COLS_BATCH_SIZE=5 From e35a3c63eabeee46eb9765298fb39fb807e4606f Mon Sep 17 00:00:00 2001 From: Michael Feil <63565275+michaelfeil@users.noreply.github.com> Date: Thu, 10 Oct 2024 22:59:19 -0700 Subject: [PATCH 8/8] Update ci.yml --- .github/workflows/ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 3f68680..af40c9f 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -55,7 +55,7 @@ jobs: run: | set -e export API_DEVICE=cpu - export EMBEDDING_MODEL=michaelfeil/bge-small-en-v1.5 + export EMBEDDING_MODEL=BAAI/bge-small-en-v1.5 export RERANKER_MODEL=mixedbread-ai/mxbai-rerank-xsmall-v1 # Edit .env file