Update the default LLM model ID

Signed-off-by: chensuyue <suyue.chen@intel.com>
This commit is contained in:
chensuyue
2025-05-21 22:53:29 +08:00
parent d6255cf38c
commit 8fa1119850

View File

@@ -37,7 +37,7 @@ deploy:
llm:
engine: vllm # or tgi
-model_id: "meta-llama/Meta-Llama-3-8B-Instruct" # mandatory
+model_id: "meta-llama/Llama-3.1-8B-Instruct" # mandatory
replicaCount:
with_teirerank: [7, 15, 31, 63] # When teirerank.enabled is True
without_teirerank: [8, 16, 32, 64] # When teirerank.enabled is False