update tgi-gaudi version (#389)

Signed-off-by: chensuyue <suyue.chen@intel.com>
Co-authored-by: Spycsh <sihan.chen@intel.com>
This commit is contained in:
chen, suyue
2024-07-12 15:01:03 +08:00
committed by GitHub
parent 49789595e5
commit 3505bd25a4
22 changed files with 63 additions and 41 deletions

View File

@@ -6,7 +6,7 @@ version: "3.8"
services:
tgi_service:
-image: ghcr.io/huggingface/tgi-gaudi:1.2.1
+image: ghcr.io/huggingface/tgi-gaudi:2.0.1
container_name: codetrans-tgi-service
ports:
- "8008:80"
@@ -23,7 +23,7 @@ services:
cap_add:
- SYS_NICE
ipc: host
-command: --model-id ${LLM_MODEL_ID}
+command: --model-id ${LLM_MODEL_ID} --max-input-length 1024 --max-total-tokens 2048
llm:
image: opea/llm-tgi:latest
container_name: llm-tgi-gaudi-server