Files
GenAIExamples/VisualQnA/kubernetes/visualqna_xeon.yaml
lvliang-intel 4f7fc39d66 Add kubernetes support for VisualQnA (#578)
* Add kubernetes support for VisualQnA

Signed-off-by: lvliang-intel <liang1.lv@intel.com>

* update gmc file

Signed-off-by: lvliang-intel <liang1.lv@intel.com>

* update pic

Signed-off-by: lvliang-intel <liang1.lv@intel.com>

---------

Signed-off-by: lvliang-intel <liang1.lv@intel.com>
2024-08-13 17:14:03 +08:00

35 lines
853 B
YAML

# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
# GMConnector custom resource describing the VisualQnA pipeline for the
# "xeon" platform (see the gmc/platform label below).
apiVersion: gmc.opea.io/v1alpha3
kind: GMConnector
metadata:
  labels:
    app.kubernetes.io/name: gmconnector
    app.kubernetes.io/managed-by: kustomize
    gmc/platform: xeon
  name: visualqna
  namespace: visualqna
spec:
  # Router that fronts the pipeline defined under `nodes`.
  routerConfig:
    name: router
    serviceName: router-service
  nodes:
    root:
      # Steps are listed in order under a Sequence router.
      routerType: Sequence
      steps:
        # LVM microservice step, served at /v1/lvm.
        - name: Lvm
          # NOTE(review): `$response` presumably tells the router to pass
          # the previous response as this step's input -- confirm against
          # the GMC router documentation.
          data: $response
          internalService:
            serviceName: visualqna-service
            config:
              endpoint: /v1/lvm
              # Same service name as the Tgi step's serviceName below.
              LVM_ENDPOINT: visualqna-tgi-svc
        # TGI model-serving backend referenced by LVM_ENDPOINT above.
        - name: Tgi
          internalService:
            serviceName: visualqna-tgi-svc
            config:
              MODEL_ID: llava-hf/llava-v1.6-mistral-7b-hf
              endpoint: /generate
            # NOTE(review): presumably marks Tgi as a dependency reached
            # through the Lvm service rather than a step the router calls
            # directly -- confirm against the GMConnector CRD.
            isDownstreamService: true