Files
GenAIExamples/EdgeCraftRAG/tests/test_compose_vllm_on_arc.sh
Mingyuan Qi edcd7c9d6a Fix code scanning alert no. 21: Uncontrolled data used in path expression (#1171)
Signed-off-by: Mingyuan Qi <mingyuan.qi@intel.com>
Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com>
2024-11-21 20:36:28 +08:00

166 lines
4.6 KiB
Bash
Executable File

#!/bin/bash
# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
# Abort on the first command that fails.
set -e
source ./common.sh

# Image registry and tag; both can be preset by the caller and are re-exported
# as REGISTRY / TAG.
: "${IMAGE_REPO:=opea}"
: "${IMAGE_TAG:=latest}"
printf '%s\n' "REGISTRY=IMAGE_REPO=${IMAGE_REPO}"
printf '%s\n' "TAG=IMAGE_TAG=${IMAGE_TAG}"
REGISTRY="${IMAGE_REPO}"
TAG="${IMAGE_TAG}"
export REGISTRY TAG

# WORKPATH is the parent of the current directory; logs go to its tests/ folder.
# NOTE(review): presumably the script is launched from that tests/ folder - confirm.
WORKPATH="$(dirname "$PWD")"
LOG_PATH="${WORKPATH}/tests"

# First address printed by `hostname -I`.
ip_address="$(hostname -I | awk '{print $1}')"
HOST_IP="${ip_address}"

# Compose file and service ports.
COMPOSE_FILE="compose_vllm.yaml"
EC_RAG_SERVICE_PORT=16010
VLLM_SERVICE_PORT=8008

# Model location and model served by vLLM. The commented-out lines are
# alternative settings kept for reference.
#MODEL_PATH="$WORKPATH/models"
MODEL_PATH="/home/media/models"
#HF_ENDPOINT=https://hf-mirror.com
LLM_MODEL="Qwen/Qwen2-7B-Instruct"
vLLM_ENDPOINT="http://${HOST_IP}:${VLLM_SERVICE_PORT}"
# Build every image the test needs: the images described by
# docker_image_build/build.yaml, then the vllm_openvino image from GenAIComps.
# Globals:
#   WORKPATH    (read) - root of the example; may contain whitespace
#   LOG_PATH    (read) - directory that receives docker_image_build.log
#   opea_branch (read) - GenAIComps ref to check out; "main" when unset
# Outputs:
#   Progress messages and the `docker images` listing on stdout.
# Returns:
#   Non-zero as soon as one step fails.
function build_docker_images() {
    cd "$WORKPATH/docker_image_build" || return 1
    echo "Build all the images with --no-cache, check docker_image_build.log for details..."
    docker compose -f build.yaml build --no-cache > "${LOG_PATH}/docker_image_build.log" || return 1

    echo "Build vllm_openvino image from GenAIComps..."
    # Every step is checked on its own: inside an && list, errexit ignores a
    # failure of any command but the last one.
    cd "$WORKPATH" || return 1
    # Reuse a checkout left behind by an earlier run; cloning over it would fail.
    if [[ ! -d GenAIComps ]]; then
        git clone https://github.com/opea-project/GenAIComps.git || return 1
    fi
    cd GenAIComps || return 1
    git checkout "${opea_branch:-"main"}" || return 1
    cd comps/llms/text-generation/vllm/langchain/dependency || return 1
    bash ./build_docker_vllm_openvino.sh gpu || return 1
    docker images && sleep 1s
}
# Export the settings read by the compose file, start the stack, then poll the
# vLLM container log until its readiness marker shows up.
# Globals:
#   MODEL_PATH, HOST_IP, LLM_MODEL, HF_ENDPOINT, vLLM_ENDPOINT,
#   HUGGINGFACEHUB_API_TOKEN - exported with their current value (empty if unset)
#   no_proxy                 - overwritten and exported
#   WORKPATH, COMPOSE_FILE, LOG_PATH - read
# Outputs:
#   start_services_with_compose.log and vllm_service_start.log under LOG_PATH;
#   a warning on stderr when the marker never appears.
# Returns:
#   Non-zero if the compose directory is missing or `docker compose up` fails.
#   A poll that runs out only warns, so validation still gets its chance.
function start_services() {
    # Assign-and-export on purpose: a plain `export NAME` would leave an unset
    # variable out of the environment instead of passing it as empty.
    export MODEL_PATH="${MODEL_PATH}"
    export HOST_IP="${HOST_IP}"
    export LLM_MODEL="${LLM_MODEL}"
    export HF_ENDPOINT="${HF_ENDPOINT}"
    export vLLM_ENDPOINT="${vLLM_ENDPOINT}"
    export HUGGINGFACEHUB_API_TOKEN="${HUGGINGFACEHUB_API_TOKEN}"
    export no_proxy="localhost, 127.0.0.1, 192.168.1.1"

    cd "$WORKPATH/docker_compose/intel/gpu/arc" || return 1

    # Start Docker Containers
    docker compose -f "$COMPOSE_FILE" up -d > "${LOG_PATH}/start_services_with_compose.log" || return 1

    local vllm_log="${LOG_PATH}/vllm_service_start.log"
    local attempt=0
    local ready=false
    # Up to 100 checks, 5 seconds apart.
    until [[ "$attempt" -ge 100 ]]; do
        # Capture stderr as well, and treat a failing `docker logs` as
        # "not ready yet" rather than letting errexit end the script.
        docker logs vllm-openvino-server > "$vllm_log" 2>&1 || true
        # NOTE(review): "metrics.py" is presumably logged by vLLM only once it
        # is serving - confirm against the vLLM version in use.
        if grep -q "metrics.py" "$vllm_log"; then
            ready=true
            break
        fi
        sleep 5s
        attempt=$((attempt + 1))
    done

    if [[ "$ready" != true ]]; then
        echo "[ start_services ] \"metrics.py\" never appeared in ${vllm_log} after 100 checks; continuing anyway" >&2
    fi
}
# POST a payload to a service endpoint and check both the HTTP status and the
# response body.
# Arguments:
#   $1 - URL to POST to
#   $2 - pattern (grep basic regular expression) the response body must contain
#   $3 - service name; used in messages and as the log file name under LOG_PATH
#   $4 - container whose `docker logs` output is appended to that log on failure
#   $5 - request body passed to `curl -d` (a leading @ makes curl read a file)
# Globals:
#   LOG_PATH (read)
# Outputs:
#   Progress and failure messages on stdout; response body in
#   ${LOG_PATH}/<service name>.log.
# Exits:
#   Ends the script with status 1 when the status is not 200 or the body does
#   not match.
function validate_services() {
    local URL="$1"
    local EXPECTED_RESULT="$2"
    local SERVICE_NAME="$3"
    local DOCKER_NAME="$4"
    local INPUT_DATA="$5"
    local log_file="${LOG_PATH}/${SERVICE_NAME}.log"

    echo "[ $SERVICE_NAME ] Validating $SERVICE_NAME service..."

    # Remove a log left by an earlier run so a failed request can never be
    # judged against stale content.
    rm -f -- "$log_file"

    # curl is synchronous, so there is nothing to wait for afterwards. Its exit
    # code is kept (not fatal) so the failure path below can still collect the
    # container logs.
    local RESPONSE
    local curl_status=0
    RESPONSE=$(curl -s -w "%{http_code}" -o "$log_file" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") || curl_status=$?
    if [[ "$curl_status" -ne 0 ]]; then
        echo "[ $SERVICE_NAME ] curl failed with exit code $curl_status"
    fi

    # -w "%{http_code}" puts the status code at the end of curl's stdout.
    local HTTP_STATUS="${RESPONSE: -3}"

    # curl may not create the output file at all (e.g. connection refused).
    local CONTENT=""
    if [[ -f "$log_file" ]]; then
        CONTENT=$(cat "$log_file")
    fi

    if [[ "$HTTP_STATUS" != "200" ]]; then
        echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS"
        docker logs "${DOCKER_NAME}" >> "$log_file" 2>&1 || true
        exit 1
    fi

    echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..."
    if ! grep -q -e "$EXPECTED_RESULT" <<< "$CONTENT"; then
        echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT"
        docker logs "${DOCKER_NAME}" >> "$log_file" 2>&1 || true
        exit 1
    fi

    echo "[ $SERVICE_NAME ] Content is as expected."
    sleep 1s
}
# Exercise the EdgeCraftRAG server in three steps: create the pipeline, add
# data, then ask a question whose answer must contain the test id.
# Globals:
#   WORKPATH, HOST_IP, EC_RAG_SERVICE_PORT (read)
# Returns:
#   Non-zero if the tests directory cannot be entered; each check itself goes
#   through validate_services.
function validate_rag() {
    # The '@configs/...' payloads are relative paths, so the requests have to
    # be issued from the tests directory.
    cd "$WORKPATH/tests" || return 1

    local base_url="${HOST_IP}:${EC_RAG_SERVICE_PORT}"

    # setup pipeline
    validate_services \
        "${base_url}/v1/settings/pipelines" \
        "active" \
        "pipeline" \
        "edgecraftrag-server" \
        '@configs/test_pipeline_vllm.json'

    # add data
    validate_services \
        "${base_url}/v1/data" \
        "Done" \
        "data" \
        "edgecraftrag-server" \
        '@configs/test_data.json'

    # query
    validate_services \
        "${base_url}/v1/chatqna" \
        "1234567890" \
        "query" \
        "vllm-openvino-server" \
        '{"messages":"What is the test id?"}'
}
# Send the test question to the mega service on port 16011 and require the
# test id in the answer.
# Globals:
#   HOST_IP (read)
# Returns:
#   Whatever validate_services returns.
function validate_megaservice() {
    local -a check=(
        "${HOST_IP}:16011/v1/chatqna"          # URL
        "1234567890"                           # expected text
        "query"                                # service / log name
        "vllm-openvino-server"                 # container to dump on failure
        '{"messages":"What is the test id?"}'  # request body
    )

    # Curl the Mega Service
    validate_services "${check[@]}"
}
# Tear down the compose stack.
# Globals:
#   WORKPATH, COMPOSE_FILE (read) - either may contain whitespace
# Returns:
#   Non-zero if the compose directory cannot be entered (docker is then not
#   invoked), otherwise the status of `docker compose down`.
function stop_docker() {
    cd "$WORKPATH/docker_compose/intel/gpu/arc" || return 1
    docker compose -f "$COMPOSE_FILE" down
}
# Run the whole test: clean start, optional image build, timed service start,
# validation, teardown and a docker prune.
# Globals:
#   LOG_PATH, IMAGE_REPO (read); start_time, end_time, duration (written)
# Outputs:
#   One line on stdout reporting how long start_services took.
function main() {
    mkdir -p "$LOG_PATH"

    # Tear the stack down before doing anything else.
    stop_docker

    # Images are built locally only for the "opea" repository name.
    case "$IMAGE_REPO" in
        opea) build_docker_images ;;
    esac

    # Time the service start with whole-second timestamps.
    start_time=$(date +%s)
    start_services
    end_time=$(date +%s)
    duration=$(( end_time - start_time ))
    printf '%s\n' "EC_RAG service start duration is $duration s"
    sleep 1s

    local check
    for check in validate_rag validate_megaservice; do
        "$check"
    done

    stop_docker
    # Answer the prune confirmation prompt with "y".
    printf 'y\n' | docker system prune
}
# Script entry point: run the full test sequence defined in main().
main