Upgrade TGI Gaudi version to v2.0.6 (#1088)

Signed-off-by: lvliang-intel <liang1.lv@intel.com>
Co-authored-by: chen, suyue <suyue.chen@intel.com>
This commit is contained in:
lvliang-intel
2024-11-12 14:38:22 +08:00
committed by GitHub
parent f7a7f8aa3f
commit 1ff85f6a85
74 changed files with 94 additions and 85 deletions

View File

@@ -25,7 +25,7 @@ Should you desire to use the Gaudi accelerator, two alternate images are used fo
For Gaudi:
- tei-embedding-service: ghcr.io/huggingface/tei-gaudi:latest
- tgi-service: ghcr.io/huggingface/tgi-gaudi:2.0.5
- tgi-service: ghcr.io/huggingface/tgi-gaudi:2.0.6
> [NOTE]
> Please refer to [Xeon README](https://github.com/opea-project/GenAIExamples/blob/main/ChatQnA/docker_compose/intel/cpu/xeon/README.md) or [Gaudi README](https://github.com/opea-project/GenAIExamples/blob/main/ChatQnA/docker_compose/intel/hpu/gaudi/README.md) to build the OPEA images. These too will be available on Docker Hub soon to simplify use.

View File

@@ -1103,7 +1103,7 @@ spec:
runAsUser: 1000
seccompProfile:
type: RuntimeDefault
image: "ghcr.io/huggingface/tgi-gaudi:2.0.5"
image: "ghcr.io/huggingface/tgi-gaudi:2.0.6"
imagePullPolicy: Always
volumeMounts:
- mountPath: /data
@@ -1184,8 +1184,8 @@ spec:
runAsUser: 1000
seccompProfile:
type: RuntimeDefault
image: "ghcr.io/huggingface/tgi-gaudi:2.0.5"
image: "ghcr.io/huggingface/tgi-gaudi:2.0.6"
imagePullPolicy: Always
volumeMounts:
- mountPath: /data
name: model-volume

View File

@@ -924,7 +924,7 @@ spec:
runAsUser: 1000
seccompProfile:
type: RuntimeDefault
image: "ghcr.io/huggingface/tgi-gaudi:2.0.5"
image: "ghcr.io/huggingface/tgi-gaudi:2.0.6"
imagePullPolicy: Always
volumeMounts:
- mountPath: /data