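Removed the nested `spec` key: podSpecs and deployments entries now hold replicas, resources, ports, args, etc. directly, and the template reads them without `.spec`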

This commit is contained in:
Zhenzhong Xu
2024-10-21 09:01:00 +03:00
parent a0b2263fd3
commit 24166615d7
3 changed files with 142 additions and 156 deletions

View File

@@ -5,7 +5,6 @@ HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
podSpecs:
- name: chatqna-backend-server-deploy
spec:
replicas: 2
resources:
limits:
@@ -16,7 +15,6 @@ podSpecs:
memory: "8000Mi"
- name: embedding-dependency-deploy
spec:
replicas: 1
resources:
limits:
@@ -27,29 +25,24 @@ podSpecs:
memory: "20000Mi"
- name: reranking-dependency-deploy
spec:
replicas: 1
resources:
limits:
habana.ai/gaudi: 1
- name: llm-dependency-deploy
spec:
replicas: 7890
replicas: 7
resources:
limits:
habana.ai/gaudi: 1
- name: dataprep-deploy
spec:
replicas: 1
- name: vector-db
spec:
replicas: 1
- name: retriever-deploy
spec:
replicas: 2
resources:
requests:

View File

@@ -12,7 +12,7 @@ spec:
{{- $replicas := $deployment.replicas }}
{{- range $podSpec := $global.podSpecs }}
{{- if eq $podSpec.name $deployment.name }}
{{- $replicas = $podSpec.spec.replicas | default $deployment.replicas }}
{{- $replicas = $podSpec.replicas | default $deployment.replicas }}
{{- end }}
{{- end }}
replicas: {{ $replicas }}
@@ -31,9 +31,9 @@ spec:
- envFrom:
- configMapRef:
name: {{ $global.config.CONFIG_MAP_NAME }}
{{- if $deployment.spec.args }}
{{- if $deployment.args }}
args:
{{- range $arg := $deployment.spec.args }}
{{- range $arg := $deployment.args }}
{{- if $arg.name }}
- {{ $arg.name }}
{{- end }}
@@ -43,9 +43,9 @@ spec:
{{- end }}
{{- end }}
{{- if $deployment.spec.env }}
{{- if $deployment.env }}
env:
{{- range $env := $deployment.spec.env }}
{{- range $env := $deployment.env }}
- name: {{ $env.name }}
value: "{{ $env.value }}"
{{- end }}
@@ -55,20 +55,20 @@ spec:
imagePullPolicy: IfNotPresent
name: {{ $deployment.name }}
{{- if $deployment.spec.ports }}
{{- if $deployment.ports }}
ports:
{{- range $port := $deployment.spec.ports }}
{{- range $port := $deployment.ports }}
{{- range $port_name, $port_id := $port }}
- {{ $port_name }}: {{ $port_id }}
{{- end }}
{{- end }}
{{- end }}
{{- $resources := $deployment.spec.resources }}
{{- $resources := $deployment.resources }}
{{- range $podSpec := $global.podSpecs }}
{{- if eq $podSpec.name $deployment.name }}
{{- if $podSpec.spec.resources }}
{{- $resources = $podSpec.spec.resources }}
{{- if $podSpec.resources }}
{{- $resources = $podSpec.resources }}
{{- end }}
{{- end }}
{{- end }}
@@ -83,9 +83,9 @@ spec:
{{- end }}
{{- end }}
{{- if $deployment.spec.volumeMounts }}
{{- if $deployment.volumeMounts }}
volumeMounts:
{{- range $volumeMount := $deployment.spec.volumeMounts }}
{{- range $volumeMount := $deployment.volumeMounts }}
- mountPath: {{ $volumeMount.mountPath }}
name: {{ $volumeMount.name }}
{{- end }}
@@ -104,9 +104,9 @@ spec:
whenUnsatisfiable: ScheduleAnyway
{{- if $deployment.spec.volumes }}
{{- if $deployment.volumes }}
volumes:
{{- range $index, $volume := $deployment.spec.volumes }}
{{- range $index, $volume := $deployment.volumes }}
- name: {{ $volume.name }}
{{- if $volume.hostPath }}
hostPath:

View File

@@ -14,21 +14,18 @@ deployments:
- name: chatqna-backend-server-deploy
image: opea/chatqna:latest
replicas: 1
spec:
ports:
- containerPort: 8888
- name: dataprep-deploy
image: opea/dataprep-redis:latest
replicas: 1
spec:
ports:
- containerPort: 6007
- name: vector-db
image: redis/redis-stack:7.2.0-v9
replicas: 1
spec:
ports:
- containerPort: 6379
- containerPort: 8001
@@ -36,14 +33,12 @@ deployments:
- name: retriever-deploy
image: opea/retriever-redis:latest
replicas: 1
spec:
ports:
- containerPort: 7000
- name: embedding-dependency-deploy
image: ghcr.io/huggingface/text-embeddings-inference:cpu-1.5
replicas: 1
spec:
ports:
- containerPort: 80
args:
@@ -68,7 +63,6 @@ deployments:
- name: reranking-dependency-deploy
image: opea/tei-gaudi:latest
replicas: 1
spec:
args:
- name: "--model-id"
- value: $(RERANK_MODEL_ID)
@@ -104,7 +98,6 @@ deployments:
- name: llm-dependency-deploy
image: ghcr.io/huggingface/tgi-gaudi:2.0.4
replicas: 1
spec:
ports:
- containerPort: 80
resources: