# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0

# Per-workload tuning entries. Each item has a name, a replica count and,
# optionally, a resources mapping with limits and/or requests.
# NOTE(review): the resources layout and the "Mi" quantities look like
# Kubernetes container resource specs; confirm against the consuming tool.
podSpecs:
  # CPU and memory requests are set equal to the limits.
  - name: chatqna-backend-server-deploy
    replicas: 2
    resources:
      limits:
        cpu: "8"
        memory: "8000Mi"
      requests:
        cpu: "8"
        memory: "8000Mi"

  # CPU and memory requests are set equal to the limits.
  - name: embedding-dependency-deploy
    replicas: 1
    resources:
      limits:
        cpu: "80"
        memory: "20000Mi"
      requests:
        cpu: "80"
        memory: "20000Mi"

  # Only a habana.ai/gaudi limit is set; no cpu/memory values are given.
  - name: reranking-dependency-deploy
    replicas: 1
    resources:
      limits:
        habana.ai/gaudi: 1

  # Only a habana.ai/gaudi limit is set (per entry; 7 replicas requested).
  - name: llm-dependency-deploy
    replicas: 7
    resources:
      limits:
        habana.ai/gaudi: 1

  # No resources mapping: only the replica count is specified.
  - name: dataprep-deploy
    replicas: 1

  # No resources mapping: only the replica count is specified.
  - name: vector-db
    replicas: 1

  # Requests only; no limits are specified for this entry.
  - name: retriever-deploy
    replicas: 2
    resources:
      requests:
        cpu: "4"
        memory: "4000Mi"