diff --git a/ChatQnA/benchmark_chatqna.yaml b/ChatQnA/benchmark_chatqna.yaml index ae74aa9b9..e528bb9d7 100644 --- a/ChatQnA/benchmark_chatqna.yaml +++ b/ChatQnA/benchmark_chatqna.yaml @@ -37,7 +37,7 @@ deploy: llm: engine: vllm # or tgi - model_id: "meta-llama/Meta-Llama-3-8B-Instruct" # mandatory + model_id: "meta-llama/Llama-3.1-8B-Instruct" # mandatory replicaCount: with_teirerank: [7, 15, 31, 63] # When teirerank.enabled is True without_teirerank: [8, 16, 32, 64] # When teirerank.enabled is False