Enable vllm for CodeTrans (#1626)

Set vLLM as the default LLM serving backend, and add the related Docker Compose files, READMEs, and test scripts.

Issue: https://github.com/opea-project/GenAIExamples/issues/1436

Signed-off-by: letonghan <letong.han@intel.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Author: Letong Han
Date: 2025-03-07 10:56:21 +08:00
Committed by: GitHub
Parent: 5aecea8e47
Commit: 9180f1066d

12 changed files with 801 additions and 73 deletions
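
As a rough sketch, the two new image targets in the hunk below could be built like this. The build.yaml filename and the upstream clone URLs are assumptions inferred from the build contexts in the diff (vllm, vllm-fork); they are not stated in this commit:

    # Assumed workflow: clone the vLLM sources into the build contexts,
    # then build the two new services from the image-build compose file.
    git clone https://github.com/vllm-project/vllm.git vllm
    git clone https://github.com/HabanaAI/vllm-fork.git vllm-fork
    docker compose -f build.yaml build vllm vllm-gaudi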


@@ -23,6 +23,18 @@ services:
       dockerfile: comps/llms/src/text-generation/Dockerfile
     extends: codetrans
     image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}
+  vllm:
+    build:
+      context: vllm
+      dockerfile: Dockerfile.cpu
+    extends: codetrans
+    image: ${REGISTRY:-opea}/vllm:${TAG:-latest}
+  vllm-gaudi:
+    build:
+      context: vllm-fork
+      dockerfile: Dockerfile.hpu
+    extends: codetrans
+    image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
   nginx:
     build:
       context: GenAIComps
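
Downstream, a deployment compose file can point the CodeTrans LLM backend at the image built above. A minimal sketch, assuming a vllm-service service name and the standard vLLM OpenAI-compatible server entrypoint; the port mapping and environment variables are illustrative, not taken from this commit:

    services:
      vllm-service:
        image: ${REGISTRY:-opea}/vllm:${TAG:-latest}  # CPU image built above
        ports:
          - "9009:80"                                 # assumed host:container mapping
        environment:
          HF_TOKEN: ${HF_TOKEN}                       # needed for gated models
          LLM_MODEL_ID: ${LLM_MODEL_ID}
        command: --model ${LLM_MODEL_ID} --host 0.0.0.0 --port 80

On Gaudi, the ${REGISTRY:-opea}/vllm-gaudi image would be substituted instead, together with whatever HPU runtime and device options the Gaudi platform requires.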