Update compose.yaml (#1619)
Update compose.yaml for CodeGen, CodeTrans and DocSum

Signed-off-by: ZePan110 <ze.pan@intel.com>
This commit is contained in:
@@ -8,7 +8,7 @@ services:
|
|||||||
ports:
|
ports:
|
||||||
- "8028:80"
|
- "8028:80"
|
||||||
volumes:
|
volumes:
|
||||||
- "${MODEL_CACHE}:/data"
|
- "${MODEL_CACHE:-./data}:/data"
|
||||||
shm_size: 1g
|
shm_size: 1g
|
||||||
environment:
|
environment:
|
||||||
no_proxy: ${no_proxy}
|
no_proxy: ${no_proxy}
|
||||||
|
|||||||
@@ -8,7 +8,7 @@ services:
|
|||||||
ports:
|
ports:
|
||||||
- "8028:80"
|
- "8028:80"
|
||||||
volumes:
|
volumes:
|
||||||
- "${MODEL_CACHE}:/data"
|
- "${MODEL_CACHE:-./data}:/data"
|
||||||
environment:
|
environment:
|
||||||
no_proxy: ${no_proxy}
|
no_proxy: ${no_proxy}
|
||||||
http_proxy: ${http_proxy}
|
http_proxy: ${http_proxy}
|
||||||
|
|||||||
@@ -8,7 +8,7 @@ services:
|
|||||||
ports:
|
ports:
|
||||||
- "8008:80"
|
- "8008:80"
|
||||||
volumes:
|
volumes:
|
||||||
- "${MODEL_CACHE}:/data"
|
- "${MODEL_CACHE:-./data}:/data"
|
||||||
shm_size: 1g
|
shm_size: 1g
|
||||||
environment:
|
environment:
|
||||||
no_proxy: ${no_proxy}
|
no_proxy: ${no_proxy}
|
||||||
|
|||||||
@@ -8,7 +8,7 @@ services:
|
|||||||
ports:
|
ports:
|
||||||
- "8008:80"
|
- "8008:80"
|
||||||
volumes:
|
volumes:
|
||||||
- "${MODEL_CACHE}:/data"
|
- "${MODEL_CACHE:-./data}:/data"
|
||||||
environment:
|
environment:
|
||||||
no_proxy: ${no_proxy}
|
no_proxy: ${no_proxy}
|
||||||
http_proxy: ${http_proxy}
|
http_proxy: ${http_proxy}
|
||||||
|
|||||||
@@ -21,7 +21,7 @@ services:
|
|||||||
timeout: 10s
|
timeout: 10s
|
||||||
retries: 100
|
retries: 100
|
||||||
volumes:
|
volumes:
|
||||||
- "${MODEL_CACHE}:/data"
|
- "${MODEL_CACHE:-./data}:/data"
|
||||||
shm_size: 1g
|
shm_size: 1g
|
||||||
command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 --max-input-length ${MAX_INPUT_TOKENS} --max-total-tokens ${MAX_TOTAL_TOKENS}
|
command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 --max-input-length ${MAX_INPUT_TOKENS} --max-total-tokens ${MAX_TOTAL_TOKENS}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user