Files
GenAIExamples/tests/retrievers/test_retrievers_pgvector_langchain.sh
Letong Han bea9bb0242 [Reorg] Reorg Folder to Support Different Vendors (#625)
Signed-off-by: letonghan <letong.han@intel.com>
Signed-off-by: chensuyue <suyue.chen@intel.com>
2024-09-10 23:24:09 +08:00

86 lines
3.0 KiB
Bash

#!/bin/bash
# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
set -x
WORKPATH=$(dirname "$PWD")
LOG_PATH="$WORKPATH/tests"
ip_address=$(hostname -I | awk '{print $1}')
function build_docker_images() {
cd $WORKPATH
docker build --no-cache -t opea/retriever-pgvector:comps --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/retrievers/pgvector/langchain/Dockerfile .
if [ $? -ne 0 ]; then
echo "opea/retriever-pgvector built fail"
exit 1
else
echo "opea/retriever-pgvector built successful"
fi
}
function start_service() {
# pgvector
export POSTGRES_USER=testuser
export POSTGRES_PASSWORD=testpwd
export POSTGRES_DB=vectordb
pgvector_port=5079
docker run --name test-comps-retriever-pgvector-vectorstore -e POSTGRES_USER=${POSTGRES_USER} -e POSTGRES_HOST_AUTH_METHOD=trust -e POSTGRES_DB=${POSTGRES_DB} -e POSTGRES_PASSWORD=${POSTGRES_PASSWORD} -d -v $WORKPATH/comps/vectorstores/pgvector/init.sql:/docker-entrypoint-initdb.d/init.sql -p $pgvector_port:5432 pgvector/pgvector:0.7.0-pg16
sleep 10s
# tei endpoint
tei_endpoint=5431
model="BAAI/bge-base-en-v1.5"
docker run -d --name="test-comps-retriever-pgvector-tei-endpoint" -p $tei_endpoint:80 -v ./data:/data --pull always ghcr.io/huggingface/text-embeddings-inference:cpu-1.5 --model-id $model
sleep 30s
export TEI_EMBEDDING_ENDPOINT="http://${ip_address}:${tei_endpoint}"
# pgvector retriever
docker run -d --name="test-comps-retriever-pgvector-ms" -p 5003:7000 --ipc=host -e http_proxy=$http_proxy -e https_proxy=$https_proxy -e PG_CONNECTION_STRING=postgresql+psycopg2://${POSTGRES_USER}:${POSTGRES_PASSWORD}@$ip_address:$pgvector_port/${POSTGRES_DB} -e INDEX_NAME=$INDEX_NAME -e TEI_ENDPOINT=$TEI_ENDPOINT opea/retriever-pgvector:comps
sleep 3m
}
function validate_microservice() {
retriever_port=5003
test_embedding=$(python -c "import random; embedding = [random.uniform(-1, 1) for _ in range(768)]; print(embedding)")
result=$(http_proxy=''
curl http://${ip_address}:$retriever_port/v1/retrieval \
-X POST \
-d "{\"text\":\"test\",\"embedding\":${test_embedding}}" \
-H 'Content-Type: application/json')
if [[ $result == *"retrieved_docs"* ]]; then
echo "Result correct."
else
echo "Result wrong. Received was $result"
docker logs test-comps-retriever-pgvector-vectorstore >> ${LOG_PATH}/vectorstore.log
docker logs test-comps-retriever-pgvector-tei-endpoint >> ${LOG_PATH}/tei-endpoint.log
docker logs test-comps-retriever-pgvector-ms >> ${LOG_PATH}/retriever-pgvector.log
exit 1
fi
}
function stop_docker() {
cid_retrievers=$(docker ps -aq --filter "name=test-comps-retriever-pgvector*")
if [[ ! -z "$cid_retrievers" ]]; then
docker stop $cid_retrievers && docker rm $cid_retrievers && sleep 1s
fi
}
function main() {
stop_docker
build_docker_images
start_service
validate_microservice
stop_docker
echo y | docker system prune
}
main