Update compose.yaml (#1619)
Update compose.yaml for CodeGen, CodeTrans and DocSum.

Signed-off-by: ZePan110 <ze.pan@intel.com>
This commit is contained in:
@@ -8,7 +8,7 @@ services:
|
||||
ports:
|
||||
- "8028:80"
|
||||
volumes:
|
||||
- "${MODEL_CACHE}:/data"
|
||||
- "${MODEL_CACHE:-./data}:/data"
|
||||
shm_size: 1g
|
||||
environment:
|
||||
no_proxy: ${no_proxy}
|
||||
|
||||
@@ -8,7 +8,7 @@ services:
|
||||
ports:
|
||||
- "8028:80"
|
||||
volumes:
|
||||
- "${MODEL_CACHE}:/data"
|
||||
- "${MODEL_CACHE:-./data}:/data"
|
||||
environment:
|
||||
no_proxy: ${no_proxy}
|
||||
http_proxy: ${http_proxy}
|
||||
|
||||
@@ -8,7 +8,7 @@ services:
|
||||
ports:
|
||||
- "8008:80"
|
||||
volumes:
|
||||
- "${MODEL_CACHE}:/data"
|
||||
- "${MODEL_CACHE:-./data}:/data"
|
||||
shm_size: 1g
|
||||
environment:
|
||||
no_proxy: ${no_proxy}
|
||||
|
||||
@@ -8,7 +8,7 @@ services:
|
||||
ports:
|
||||
- "8008:80"
|
||||
volumes:
|
||||
- "${MODEL_CACHE}:/data"
|
||||
- "${MODEL_CACHE:-./data}:/data"
|
||||
environment:
|
||||
no_proxy: ${no_proxy}
|
||||
http_proxy: ${http_proxy}
|
||||
|
||||
@@ -21,7 +21,7 @@ services:
|
||||
timeout: 10s
|
||||
retries: 100
|
||||
volumes:
|
||||
- "${MODEL_CACHE}:/data"
|
||||
- "${MODEL_CACHE:-./data}:/data"
|
||||
shm_size: 1g
|
||||
command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 --max-input-length ${MAX_INPUT_TOKENS} --max-total-tokens ${MAX_TOTAL_TOKENS}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user