Files
GenAIExamples/DocSum/kubernetes/gmc/docsum_xeon.yaml
XinyaoWa ff1310b11a Refactor docsum (#1336)
Signed-off-by: Xinyao Wang <xinyao.wang@intel.com>
2025-01-13 15:49:48 +08:00

37 lines
900 B
YAML

# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
# GMConnector resource describing the DocSum pipeline for the "xeon" platform.
apiVersion: gmc.opea.io/v1alpha3
kind: GMConnector
metadata:
  labels:
    app.kubernetes.io/name: gmconnector
    app.kubernetes.io/managed-by: kustomize
    gmc/platform: xeon
  name: docsum
  namespace: docsum
spec:
  # Router that fronts the pipeline.
  routerConfig:
    name: router
    serviceName: router-service
  nodes:
    # Single graph node; its steps are declared with routerType "Sequence".
    root:
      routerType: Sequence
      steps:
        - name: DocSum
          # NOTE(review): presumably forwards the previous response as this
          # step's input -- confirm against the GMC router documentation.
          data: $response
          internalService:
            serviceName: docsum-llm-uservice
            config:
              endpoint: /v1/docsum
              # Kept as a quoted string so it is not parsed as an integer.
              PORT: "9009"
              # Same value as the serviceName of the "Tgi" step below.
              TGI_LLM_ENDPOINT: tgi-svc
        - name: Tgi
          internalService:
            serviceName: tgi-svc
            config:
              # Kept as a quoted string so it is not parsed as a boolean.
              LANGCHAIN_TRACING_V2: "false"
              LANGCHAIN_PROJECT: "opea-llm-service"
              endpoint: /generate
            # NOTE(review): presumably marks tgi-svc as a backing service that
            # another step calls rather than a routed step -- confirm.
            isDownstreamService: true