Files
GenAIExamples/EdgeCraftRAG/tests/test_compose_vllm_on_arc.sh

181 lines
5.0 KiB
Bash
Executable File

#!/bin/bash
# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
# Abort as soon as any command exits with a non-zero status.
set -e

# common.sh is looked up relative to the current directory, so the script has
# to be started from the directory that contains it.
# NOTE(review): presumably shared test helpers - confirm against common.sh.
source ./common.sh

# Image coordinates: keep whatever the caller provided, otherwise fall back to
# the "opea" repository and the "latest" tag.
: "${IMAGE_REPO:=opea}"
: "${IMAGE_TAG:=latest}"
echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}"
echo "TAG=IMAGE_TAG=${IMAGE_TAG}"
export REGISTRY="${IMAGE_REPO}" TAG="${IMAGE_TAG}"

# WORKPATH is the parent of the current directory; logs, documents and UI
# temporary files all live in its tests/ sub-directory.
WORKPATH=$(dirname "$PWD")
LOG_PATH="${WORKPATH}/tests"
DOC_PATH="${WORKPATH}/tests"
UI_TMPFILE_PATH="${WORKPATH}/tests"

# First address reported by `hostname -I`; used to build service URLs.
ip_address=$(hostname -I | awk '{print $1}')
HOST_IP="${ip_address}"

# Compose file and port used to reach the EdgeCraftRAG server.
COMPOSE_FILE="compose_vllm.yaml"
EC_RAG_SERVICE_PORT=16010

# Model location. The commented line is an alternative inside the work tree.
MODEL_PATH="/home/media/models"
# MODEL_PATH="$WORKPATH/models"

# Optional Hugging Face mirror, disabled by default.
#HF_ENDPOINT=https://hf-mirror.com

# vLLM model and endpoint settings.
# NOTE(review): presumably consumed by set_env.sh / the compose file - confirm.
LLM_MODEL="Qwen/Qwen2-7B-Instruct"
VLLM_SERVICE_PORT=8008
vLLM_ENDPOINT="http://${HOST_IP}:${VLLM_SERVICE_PORT}"
#######################################
# Build the container images needed by the test from source.
#
# Steps:
#   1. Shallow-clone GenAIComps into $WORKPATH/docker_image_build and build
#      the comps-base image from its Dockerfile.
#   2. Build everything listed in build.yaml (output goes to
#      $LOG_PATH/docker_image_build.log).
#   3. Clone GenAIComps again into $WORKPATH and run its
#      build_docker_vllm_openvino.sh script with the "gpu" argument.
#
# Globals:
#   WORKPATH, LOG_PATH, REGISTRY, TAG  (read)
#   https_proxy, http_proxy            (read, may be unset)
#   opea_branch                        (read; defaulted to "main" and left set)
# Side effects: changes the current directory.
#######################################
function build_docker_images() {
  # Intentionally not local: the defaulted value stays visible to the rest of
  # the script, exactly as before.
  opea_branch=${opea_branch:-"main"}

  # All expansions are quoted so paths containing whitespace or glob
  # characters are passed through as a single word.
  cd "$WORKPATH/docker_image_build"
  git clone --depth 1 --branch "${opea_branch}" https://github.com/opea-project/GenAIComps.git
  pushd GenAIComps
  echo "GenAIComps test commit is $(git rev-parse HEAD)"
  docker build --no-cache -t "${REGISTRY}/comps-base:${TAG}" \
    --build-arg "https_proxy=${https_proxy:-}" \
    --build-arg "http_proxy=${http_proxy:-}" \
    -f Dockerfile .
  popd && sleep 1s

  echo "Build all the images with --no-cache, check docker_image_build.log for details..."
  docker compose -f build.yaml build --no-cache > "${LOG_PATH}/docker_image_build.log"

  echo "Build vllm_openvino image from GenAIComps..."
  # Second, separate checkout directly under $WORKPATH; the vLLM build script
  # is run from inside it.
  cd "$WORKPATH" && git clone --single-branch --branch "${opea_branch}" https://github.com/opea-project/GenAIComps.git
  cd GenAIComps/comps/third_parties/vllm/src/
  bash ./build_docker_vllm_openvino.sh gpu
  docker images && sleep 1s
}
#######################################
# Bring the compose stack up and wait for the vLLM container to log a line
# containing "metrics.py".
#
# The container log is re-dumped to $LOG_PATH/vllm_service_start.log every
# 5 seconds, for at most 100 attempts.
#
# Globals:
#   WORKPATH, COMPOSE_FILE, LOG_PATH (read)
# Side effects: changes the current directory and sources set_env.sh into the
#   current shell.
# Outputs: a warning on stderr when the marker never shows up.
#######################################
function start_services() {
  cd "$WORKPATH/docker_compose/intel/gpu/arc"
  source set_env.sh

  # Start Docker Containers
  docker compose -f "$COMPOSE_FILE" up -d > "${LOG_PATH}/start_services_with_compose.log"

  local n=0
  local ready=false
  until [[ "$n" -ge 100 ]]; do
    # `docker logs` replays the container's stderr on its own stderr, so both
    # streams are captured; otherwise a marker logged on stderr is never seen.
    docker logs vllm-openvino-server > "${LOG_PATH}/vllm_service_start.log" 2>&1
    if grep -q "metrics.py" "${LOG_PATH}/vllm_service_start.log"; then
      ready=true
      break
    fi
    sleep 5s
    n=$((n+1))
  done

  # Running out of attempts used to be silent. Only warn (do not abort): the
  # validation steps that follow decide whether the run really failed.
  if [[ "$ready" != true ]]; then
    echo "WARNING: vllm-openvino-server did not log \"metrics.py\" after ${n} checks; see ${LOG_PATH}/vllm_service_start.log" >&2
  fi
}
#######################################
# POST a payload to a service and verify both the HTTP status and the body.
#
# Arguments:
#   $1 - URL to POST to
#   $2 - pattern (grep basic regex) that must appear in the response body
#   $3 - service name; used in messages and as the log file name
#   $4 - container whose logs are appended to the log file on failure
#   $5 - request body passed to `curl -d` (a leading @ makes curl read a file)
# Globals:
#   LOG_PATH (read) - the response body is stored in $LOG_PATH/<service>.log
# Exits the whole script with status 1 when the status is not 200 or the body
# does not match.
#######################################
function validate_services() {
  local URL="$1"
  local EXPECTED_RESULT="$2"
  local SERVICE_NAME="$3"
  local DOCKER_NAME="$4"
  local INPUT_DATA="$5"
  local LOG_FILE="${LOG_PATH}/${SERVICE_NAME}.log"

  echo "[ $SERVICE_NAME ] Validating $SERVICE_NAME service..."

  # Drop any log left by an earlier call with the same service name, so the
  # file's presence afterwards reflects this request only.
  rm -f -- "$LOG_FILE"

  # curl is synchronous: once it returns, the body file either exists or never
  # will. The previous "wait until the file exists" loop therefore hung
  # forever when the connection failed. `|| true` keeps a curl failure from
  # aborting under `set -e` before the diagnostics below are written.
  local RESPONSE
  RESPONSE=$(curl -s -w "%{http_code}" -o "$LOG_FILE" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") || true

  # -w appends the status code to stdout, so it is the last three characters.
  local HTTP_STATUS="${RESPONSE: -3}"
  local CONTENT=""
  if [[ -f "$LOG_FILE" ]]; then
    CONTENT=$(<"$LOG_FILE")
  fi

  # String comparison: an empty or non-numeric status is simply "not 200".
  if [[ "$HTTP_STATUS" != "200" ]]; then
    echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS"
    docker logs "${DOCKER_NAME}" >> "$LOG_FILE"
    exit 1
  fi

  echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..."
  if ! grep -q -- "$EXPECTED_RESULT" <<< "$CONTENT"; then
    echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT"
    docker logs "${DOCKER_NAME}" >> "$LOG_FILE"
    exit 1
  fi

  echo "[ $SERVICE_NAME ] Content is as expected."
  sleep 1s
}
#######################################
# Exercise the EdgeCraftRAG server end to end: create the pipeline, upload
# the test data, then send a chat query.
#
# Runs from $WORKPATH/tests so the "@configs/..." payloads, which curl reads
# from disk, resolve relative to that directory.
#
# Globals:
#   WORKPATH, HOST_IP, EC_RAG_SERVICE_PORT (read)
# Side effects: changes the current directory; validate_services exits the
#   script on the first failed check.
#######################################
function validate_rag() {
  # Quoted so a work path containing whitespace is still a single argument.
  cd "$WORKPATH/tests"

  # setup pipeline
  validate_services \
    "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/settings/pipelines" \
    "active" \
    "pipeline" \
    "edgecraftrag-server" \
    '@configs/test_pipeline_vllm.json'

  # add data
  validate_services \
    "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/data" \
    "Done" \
    "data" \
    "edgecraftrag-server" \
    '@configs/test_data.json'

  # query
  validate_services \
    "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/chatqna" \
    "1234567890" \
    "query" \
    "vllm-openvino-server" \
    '{"messages":"What is the test id?"}'
}
#######################################
# Send the test question to the mega service on port 16011 and expect the
# answer to contain "1234567890".
#
# Globals:
#   HOST_IP (read)
# On failure validate_services appends the vllm-openvino-server container
# logs to the "query" log file.
#######################################
function validate_megaservice() {
  local endpoint="${HOST_IP}:16011/v1/chatqna"
  local question='{"messages":"What is the test id?"}'

  validate_services "$endpoint" "1234567890" "query" "vllm-openvino-server" "$question"
}
#######################################
# Tear down the compose stack described by $COMPOSE_FILE.
#
# Globals:
#   WORKPATH, COMPOSE_FILE (read)
# Side effects: changes the current directory.
#######################################
function stop_docker() {
  # Both expansions are quoted so whitespace in the work path or in the
  # compose file name does not split them into several arguments.
  cd "$WORKPATH/docker_compose/intel/gpu/arc"
  docker compose -f "$COMPOSE_FILE" down
}
#######################################
# Run the whole test flow, wrapping every phase in "::group::" /
# "::endgroup::" marker lines.
#
# Order: stop_docker, build_docker_images (only when IMAGE_REPO is "opea"),
# start_services, validate_rag, validate_megaservice, then a final
# stop_docker followed by `docker system prune`.
#
# Globals:
#   LOG_PATH, IMAGE_REPO (read)
#######################################
function main() {
  mkdir -p "$LOG_PATH"

  local phase
  for phase in stop_docker build_docker_images start_services validate_rag validate_megaservice; do
    printf '%s\n' "::group::${phase}"
    # Images are only built for the default "opea" repository; every other
    # phase always runs.
    if [[ "$phase" != "build_docker_images" || "$IMAGE_REPO" == "opea" ]]; then
      "$phase"
    fi
    printf '%s\n' "::endgroup::"
  done

  # Final cleanup; "y" answers the confirmation prompt of the prune command.
  printf '%s\n' "::group::stop_docker"
  stop_docker
  echo y | docker system prune
  printf '%s\n' "::endgroup::"
}
# Script entry point: run the full flow defined in main().
main