diff --git a/ChatQnA/benchmark/performance/helm_charts/customize.yaml b/ChatQnA/benchmark/performance/helm_charts/customize.yaml index b55f5e150..1462eb679 100644 --- a/ChatQnA/benchmark/performance/helm_charts/customize.yaml +++ b/ChatQnA/benchmark/performance/helm_charts/customize.yaml @@ -1,8 +1,6 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN} - podSpecs: - name: chatqna-backend-server-deploy replicas: 2 diff --git a/ChatQnA/benchmark/performance/helm_charts/templates/configmap.yaml b/ChatQnA/benchmark/performance/helm_charts/templates/configmap.yaml index a5cfd04b2..24da6bdea 100644 --- a/ChatQnA/benchmark/performance/helm_charts/templates/configmap.yaml +++ b/ChatQnA/benchmark/performance/helm_charts/templates/configmap.yaml @@ -9,7 +9,7 @@ metadata: data: EMBEDDING_MODEL_ID: {{ .Values.config.EMBEDDING_MODEL_ID }} EMBEDDING_SERVER_HOST_IP: embedding-dependency-svc - HUGGINGFACEHUB_API_TOKEN: {{ .Values.HUGGINGFACEHUB_API_TOKEN }} + HUGGINGFACEHUB_API_TOKEN: {{ .Values.config.HUGGINGFACEHUB_API_TOKEN }} INDEX_NAME: rag-redis LLM_MODEL_ID: {{ .Values.config.LLM_MODEL_ID }} LLM_SERVER_HOST_IP: llm-dependency-svc diff --git a/ChatQnA/benchmark/performance/helm_charts/values.yaml b/ChatQnA/benchmark/performance/helm_charts/values.yaml index 387bbd5cb..ddb76b0bb 100644 --- a/ChatQnA/benchmark/performance/helm_charts/values.yaml +++ b/ChatQnA/benchmark/performance/helm_charts/values.yaml @@ -9,6 +9,7 @@ config: EMBEDDING_MODEL_ID: BAAI/bge-base-en-v1.5 LLM_MODEL_ID: Intel/neural-chat-7b-v3-3 RERANK_MODEL_ID: BAAI/bge-reranker-base + HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN} microservices: - name: chatqna-backend-server-deploy @@ -76,8 +77,6 @@ microservices: value: habana - name: HABANA_VISIBLE_DEVICES value: all - - name: HF_TOKEN - value: ${HF_TOKEN} - name: MAX_WARMUP_SEQUENCE_LENGTH value: "512" volumeMounts: @@ -119,8 +118,6 @@ microservices: value: habana - name: HABANA_VISIBLE_DEVICES value: all - - name: HF_TOKEN - value: ${HF_TOKEN} volumeMounts: - mountPath: /data name: model-volume