284 lines
6.9 KiB
YAML
284 lines
6.9 KiB
YAML
---
|
|
# Source: codegen/charts/llm-uservice/charts/tgi/templates/service.yaml
|
|
# Copyright (C) 2024 Intel Corporation
|
|
# SPDX-License-Identifier: Apache-2.0
|
|
|
|
apiVersion: v1
|
|
kind: Service
|
|
metadata:
|
|
name: docsum-tgi
|
|
labels:
|
|
helm.sh/chart: tgi-0.1.0
|
|
app.kubernetes.io/name: tgi
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.4"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
type: ClusterIP
|
|
ports:
|
|
- port: 80
|
|
targetPort: 80
|
|
protocol: TCP
|
|
name: tgi
|
|
selector:
|
|
app.kubernetes.io/name: tgi
|
|
app.kubernetes.io/instance: docsum
|
|
---
|
|
apiVersion: v1
|
|
kind: Service
|
|
metadata:
|
|
name: docsum-llm-uservice
|
|
labels:
|
|
helm.sh/chart: llm-uservice-0.1.0
|
|
app.kubernetes.io/name: llm-uservice
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.0.0"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
type: ClusterIP
|
|
ports:
|
|
- port: 9000
|
|
targetPort: 9000
|
|
protocol: TCP
|
|
name: llm-uservice
|
|
selector:
|
|
app.kubernetes.io/name: llm-uservice
|
|
app.kubernetes.io/instance: docsum
|
|
---
|
|
apiVersion: v1
|
|
kind: Service
|
|
metadata:
|
|
name: docsum
|
|
labels:
|
|
helm.sh/chart: docsum-0.1.0
|
|
app.kubernetes.io/name: docsum
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.0.0"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
type: ClusterIP
|
|
ports:
|
|
- port: 8888
|
|
targetPort: 8888
|
|
protocol: TCP
|
|
name: docsum
|
|
selector:
|
|
app.kubernetes.io/name: docsum
|
|
app.kubernetes.io/instance: docsum
|
|
---
|
|
apiVersion: v1
|
|
kind: Service
|
|
metadata:
|
|
name: docsum-react-ui
|
|
labels:
|
|
helm.sh/chart: docsum-react-ui-0.1.0
|
|
app.kubernetes.io/name: react-ui
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.0.0"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
type: ClusterIP
|
|
ports:
|
|
- port: 80
|
|
targetPort: 80
|
|
protocol: TCP
|
|
name: react-ui
|
|
selector:
|
|
app.kubernetes.io/name: react-ui
|
|
app.kubernetes.io/instance: docsum
|
|
---
|
|
apiVersion: apps/v1
|
|
kind: Deployment
|
|
metadata:
|
|
name: docsum-tgi
|
|
labels:
|
|
helm.sh/chart: tgi-0.1.0
|
|
app.kubernetes.io/name: tgi
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.4"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
replicas: 1
|
|
selector:
|
|
matchLabels:
|
|
app.kubernetes.io/name: tgi
|
|
app.kubernetes.io/instance: docsum
|
|
template:
|
|
metadata:
|
|
labels:
|
|
app.kubernetes.io/name: tgi
|
|
app.kubernetes.io/instance: docsum
|
|
spec:
|
|
securityContext: {}
|
|
containers:
|
|
- name: tgi
|
|
env:
|
|
- name: MODEL_ID
|
|
value: Intel/neural-chat-7b-v3-3
|
|
- name: PORT
|
|
value: "80"
|
|
- name: CUDA_GRAPHS
|
|
value: "0"
|
|
- name: http_proxy
|
|
value:
|
|
- name: https_proxy
|
|
value:
|
|
- name: no_proxy
|
|
value:
|
|
securityContext: {}
|
|
image: "ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu"
|
|
imagePullPolicy: IfNotPresent
|
|
volumeMounts:
|
|
- mountPath: /data
|
|
name: model-volume
|
|
ports:
|
|
- name: http
|
|
containerPort: 80
|
|
protocol: TCP
|
|
resources: {}
|
|
volumes:
|
|
- name: model-volume
|
|
hostPath:
|
|
path: /mnt
|
|
type: Directory
|
|
---
|
|
apiVersion: apps/v1
|
|
kind: Deployment
|
|
metadata:
|
|
name: docsum-llm-uservice
|
|
labels:
|
|
helm.sh/chart: llm-uservice-0.1.0
|
|
app.kubernetes.io/name: llm-uservice
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.0.0"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
replicas: 1
|
|
selector:
|
|
matchLabels:
|
|
app.kubernetes.io/name: llm-uservice
|
|
app.kubernetes.io/instance: docsum
|
|
template:
|
|
metadata:
|
|
labels:
|
|
app.kubernetes.io/name: llm-uservice
|
|
app.kubernetes.io/instance: docsum
|
|
spec:
|
|
securityContext: {}
|
|
containers:
|
|
- name: docsum
|
|
env:
|
|
- name: TGI_LLM_ENDPOINT
|
|
value: "http://docsum-tgi:80"
|
|
- name: HUGGINGFACEHUB_API_TOKEN
|
|
value: "insert-your-huggingface-token-here"
|
|
- name: http_proxy
|
|
value:
|
|
- name: https_proxy
|
|
value:
|
|
- name: no_proxy
|
|
value:
|
|
|
|
securityContext: {}
|
|
image: "opea/llm-docsum-tgi:latest"
|
|
imagePullPolicy: IfNotPresent
|
|
ports:
|
|
- name: llm-uservice
|
|
containerPort: 9000
|
|
protocol: TCP
|
|
startupProbe:
|
|
exec:
|
|
command:
|
|
- curl
|
|
- http://docsum-tgi:80
|
|
initialDelaySeconds: 5
|
|
periodSeconds: 5
|
|
failureThreshold: 120
|
|
resources: {}
|
|
---
|
|
apiVersion: apps/v1
|
|
kind: Deployment
|
|
metadata:
|
|
name: docsum
|
|
labels:
|
|
helm.sh/chart: docsum-0.1.0
|
|
app.kubernetes.io/name: docsum
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.0.0"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
replicas: 1
|
|
selector:
|
|
matchLabels:
|
|
app.kubernetes.io/name: docsum
|
|
app.kubernetes.io/instance: docsum
|
|
template:
|
|
metadata:
|
|
labels:
|
|
app.kubernetes.io/name: docsum
|
|
app.kubernetes.io/instance: docsum
|
|
spec:
|
|
securityContext: null
|
|
containers:
|
|
- name: docsum
|
|
env:
|
|
- name: LLM_SERVICE_HOST_IP
|
|
value: docsum-llm-uservice
|
|
- name: http_proxy
|
|
value:
|
|
- name: https_proxy
|
|
value:
|
|
- name: no_proxy
|
|
value:
|
|
securityContext: null
|
|
image: "opea/docsum:latest"
|
|
imagePullPolicy: IfNotPresent
|
|
ports:
|
|
- name: docsum
|
|
containerPort: 8888
|
|
protocol: TCP
|
|
resources: null
|
|
---
|
|
apiVersion: apps/v1
|
|
kind: Deployment
|
|
metadata:
|
|
name: docsum-react-ui
|
|
labels:
|
|
helm.sh/chart: docsum-react-ui-0.1.0
|
|
app.kubernetes.io/name: react-ui
|
|
app.kubernetes.io/instance: docsum
|
|
app.kubernetes.io/version: "1.0.0"
|
|
app.kubernetes.io/managed-by: Helm
|
|
spec:
|
|
replicas: 1
|
|
selector:
|
|
matchLabels:
|
|
app.kubernetes.io/name: react-ui
|
|
app.kubernetes.io/instance: docsum
|
|
template:
|
|
metadata:
|
|
labels:
|
|
app.kubernetes.io/name: react-ui
|
|
app.kubernetes.io/instance: docsum
|
|
spec:
|
|
securityContext: null
|
|
containers:
|
|
- name: docsum-react-ui
|
|
env:
|
|
- name: DOC_BASE_URL
|
|
value: "http://docsum:8888/v1/docsum"
|
|
- name: http_proxy
|
|
value:
|
|
- name: https_proxy
|
|
value:
|
|
- name: no_proxy
|
|
value:
|
|
securityContext: null
|
|
image: "opea/docsum-react-ui:latest"
|
|
imagePullPolicy: IfNotPresent
|
|
ports:
|
|
- name: react-ui
|
|
containerPort: 80
|
|
protocol: TCP
|
|
resources: null
|