Files
GenAIExamples/ChatQnA/benchmark/performance/helm_charts/customize.yaml
2024-10-21 10:41:20 +03:00

49 lines
874 B
YAML

# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
# Per-deployment overrides: replica count and, where given, container
# resource limits/requests. One list entry per deployment, matched by `name`.
# NOTE(review): presumably applied on top of the chart defaults by the
# benchmark tooling -- confirm against the consumer of this file.
podSpecs:
  # Backend server: requests are set equal to limits for both cpu and memory.
  - name: chatqna-backend-server-deploy
    replicas: 2
    resources:
      limits:
        cpu: "8"
        memory: "8000Mi"
      requests:
        cpu: "8"
        memory: "8000Mi"

  # Embedding dependency: single replica, requests equal to limits.
  - name: embedding-dependency-deploy
    replicas: 1
    resources:
      limits:
        cpu: "80"
        memory: "20000Mi"
      requests:
        cpu: "80"
        memory: "20000Mi"

  # Reranking dependency: only a habana.ai/gaudi limit is set (no cpu/memory).
  # NOTE(review): presumably one Gaudi accelerator per replica -- confirm
  # against the device plugin that exposes this resource name.
  - name: reranking-dependency-deploy
    replicas: 1
    resources:
      limits:
        habana.ai/gaudi: 1

  # LLM dependency: seven replicas, each with a habana.ai/gaudi limit of 1.
  - name: llm-dependency-deploy
    replicas: 7
    resources:
      limits:
        habana.ai/gaudi: 1

  # Data preparation: replica count only; no resource settings in this file.
  - name: dataprep-deploy
    replicas: 1

  # Vector database: replica count only; no resource settings in this file.
  - name: vector-db
    replicas: 1

  # Retriever: resource requests only; no limits are set here.
  - name: retriever-deploy
    replicas: 2
    resources:
      requests:
        cpu: "4"
        memory: "4000Mi"