Use model cache for docker compose test (#1582)
Signed-off-by: ZePan110 <ze.pan@intel.com>
This commit is contained in:
@@ -21,7 +21,7 @@ services:
|
||||
timeout: 10s
|
||||
retries: 100
|
||||
volumes:
|
||||
- - "./data:/data"
|
||||
+ - "${MODEL_CACHE}:/data"
|
||||
shm_size: 1g
|
||||
command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0
|
||||
llm:
|
||||
|
||||
@@ -30,7 +30,7 @@ services:
|
||||
- SYS_NICE
|
||||
ipc: host
|
||||
volumes:
|
||||
- - "./data:/data"
|
||||
+ - "${MODEL_CACHE}:/data"
|
||||
command: --model-id ${LLM_MODEL_ID} --max-input-length 1024 --max-total-tokens 2048
|
||||
llm:
|
||||
image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}
|
||||
|
||||
Reference in New Issue
Block a user