fixed visualqna image issues & tgi params issues
This commit is contained in:
@@ -69,7 +69,7 @@ def generate_yaml(num_nodes, mode="oob", with_rerank="True"):
|
|||||||
{
|
{
|
||||||
"name": "llm-dependency-deploy",
|
"name": "llm-dependency-deploy",
|
||||||
"args": [
|
"args": [
|
||||||
{"name": "--max-input-length", "values": 1280},
|
{"name": "--max-input-length", "value": 1280},
|
||||||
{"name": "--max-total-tokens", "value": 2048},
|
{"name": "--max-total-tokens", "value": 2048},
|
||||||
{"name": "--max-batch-total-tokens", "value": 35536},
|
{"name": "--max-batch-total-tokens", "value": 35536},
|
||||||
{"name": "--max-batch-prefill-tokens", "value": 4096},
|
{"name": "--max-batch-prefill-tokens", "value": 4096},
|
||||||
|
|||||||
@@ -30,7 +30,7 @@ microservices:
|
|||||||
- containerPort: 8399
|
- containerPort: 8399
|
||||||
|
|
||||||
- name: visualqna-tgi
|
- name: visualqna-tgi
|
||||||
image: opea/llava-tgi:latest
|
image: ghcr.io/huggingface/tgi-gaudi:2.0.5
|
||||||
replicas: 1
|
replicas: 1
|
||||||
ports:
|
ports:
|
||||||
- containerPort: 8399
|
- containerPort: 8399
|
||||||
|
|||||||
Reference in New Issue
Block a user