Files
GenAIExamples/VisualQnA/kubernetes/gmc/visualqna_gaudi.yaml
dolpher c795ef2203 Add helm deployment instructions for GenAIExamples (#1373)
Add helm deployment instructions for ChatQnA, AgentQnA, AudioQnA, CodeTrans, DocSum, FaqGen and VisualQnA

Signed-off-by: Dolpher Du <dolpher.du@intel.com>
2025-01-10 09:55:31 +08:00

35 lines
859 B
YAML

# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
# GMConnector resource "visualqna" (namespace "visualqna"): a router plus a
# two-step pipeline whose steps are declared under spec.nodes.root.
apiVersion: gmc.opea.io/v1alpha3
kind: GMConnector
metadata:
  labels:
    app.kubernetes.io/name: gmconnector
    app.kubernetes.io/managed-by: kustomize
    # Platform label for this variant of the manifest.
    gmc/platform: gaudi
  name: visualqna
  namespace: visualqna
spec:
  routerConfig:
    name: router
    serviceName: router-service
  nodes:
    root:
      # Steps are listed in order under a "Sequence" router type.
      routerType: Sequence
      steps:
        - name: Lvm
          # NOTE(review): presumably forwards the prior response as this
          # step's input -- confirm against the GMC documentation.
          data: $response
          internalService:
            serviceName: visualqna-service
            config:
              endpoint: /v1/lvm
              # Matches the serviceName of the TgiGaudi step below.
              LVM_ENDPOINT: visualqna-tgi-svc
        - name: TgiGaudi
          internalService:
            serviceName: visualqna-tgi-svc
            config:
              MODEL_ID: llava-hf/llava-v1.6-mistral-7b-hf
              endpoint: /generate
            # NOTE(review): assumed to sit beside serviceName/config under
            # internalService, per the GMConnector schema -- TODO confirm.
            isDownstreamService: true