From 1b307832d707754067bbbf8471c6aab7346b1dcc Mon Sep 17 00:00:00 2001
From: Sihan Chen <39623753+Spycsh@users.noreply.github.com>
Date: Fri, 28 Jun 2024 21:06:22 +0800
Subject: [PATCH] Add key TEI and TGI parameters for handling long retrievals (#340)

---
Reviewer notes (this free-form area after the three-dash line is not part of
the commit message):
  * Every hunk below appends `--auto-truncate` to an existing
    `command: --model-id ...` line and changes nothing else; no other flag
    is added anywhere in this patch, although the subject also mentions TGI.
  * NOTE(review): leading whitespace inside the hunks was restored from the
    usual Compose nesting (service = 2 spaces, service keys = 4, environment
    entries = 6). Confirm against the target files before applying.

 ChatQnA/docker/gaudi/docker_compose.yaml   | 2 +-
 ChatQnA/docker/xeon/docker_compose.yaml    | 4 ++--
 SearchQnA/docker/gaudi/docker_compose.yaml | 2 +-
 SearchQnA/docker/xeon/docker_compose.yaml  | 4 ++--
 4 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/ChatQnA/docker/gaudi/docker_compose.yaml b/ChatQnA/docker/gaudi/docker_compose.yaml
index 5015ff44e..0e709c449 100644
--- a/ChatQnA/docker/gaudi/docker_compose.yaml
+++ b/ChatQnA/docker/gaudi/docker_compose.yaml
@@ -92,7 +92,7 @@ services:
       HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
       HF_HUB_DISABLE_PROGRESS_BARS: 1
       HF_HUB_ENABLE_HF_TRANSFER: 0
-    command: --model-id ${RERANK_MODEL_ID}
+    command: --model-id ${RERANK_MODEL_ID} --auto-truncate
   reranking:
     image: opea/reranking-tei:latest
     container_name: reranking-tei-gaudi-server
diff --git a/ChatQnA/docker/xeon/docker_compose.yaml b/ChatQnA/docker/xeon/docker_compose.yaml
index e3be9ed52..9cc80c82e 100644
--- a/ChatQnA/docker/xeon/docker_compose.yaml
+++ b/ChatQnA/docker/xeon/docker_compose.yaml
@@ -36,7 +36,7 @@ services:
       no_proxy: ${no_proxy}
       http_proxy: ${http_proxy}
       https_proxy: ${https_proxy}
-    command: --model-id ${EMBEDDING_MODEL_ID}
+    command: --model-id ${EMBEDDING_MODEL_ID} --auto-truncate
   embedding:
     image: opea/embedding-tei:latest
     container_name: embedding-tei-server
@@ -88,7 +88,7 @@ services:
       HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
       HF_HUB_DISABLE_PROGRESS_BARS: 1
       HF_HUB_ENABLE_HF_TRANSFER: 0
-    command: --model-id ${RERANK_MODEL_ID}
+    command: --model-id ${RERANK_MODEL_ID} --auto-truncate
   reranking:
     image: opea/reranking-tei:latest
     container_name: reranking-tei-xeon-server
diff --git a/SearchQnA/docker/gaudi/docker_compose.yaml b/SearchQnA/docker/gaudi/docker_compose.yaml
index 6593f112f..8132abfd7 100644
--- a/SearchQnA/docker/gaudi/docker_compose.yaml
+++ b/SearchQnA/docker/gaudi/docker_compose.yaml
@@ -66,7 +66,7 @@ services:
       no_proxy: ${no_proxy}
       http_proxy: ${http_proxy}
       https_proxy: ${https_proxy}
-    command: --model-id ${RERANK_MODEL_ID}
+    command: --model-id ${RERANK_MODEL_ID} --auto-truncate
   reranking:
     image: opea/reranking-tei:latest
     container_name: reranking-tei-xeon-server
diff --git a/SearchQnA/docker/xeon/docker_compose.yaml b/SearchQnA/docker/xeon/docker_compose.yaml
index 85f672bae..9a81a989f 100644
--- a/SearchQnA/docker/xeon/docker_compose.yaml
+++ b/SearchQnA/docker/xeon/docker_compose.yaml
@@ -17,7 +17,7 @@ services:
       no_proxy: ${no_proxy}
       http_proxy: ${http_proxy}
       https_proxy: ${https_proxy}
-    command: --model-id ${EMBEDDING_MODEL_ID}
+    command: --model-id ${EMBEDDING_MODEL_ID} --auto-truncate
   embedding:
     image: opea/embedding-tei:latest
     container_name: embedding-tei-server
@@ -62,7 +62,7 @@ services:
       no_proxy: ${no_proxy}
       http_proxy: ${http_proxy}
       https_proxy: ${https_proxy}
-    command: --model-id ${RERANK_MODEL_ID}
+    command: --model-id ${RERANK_MODEL_ID} --auto-truncate
   reranking:
     image: opea/reranking-tei:latest
     container_name: reranking-tei-xeon-server