# Copyright (C) 2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0

# Load the shared environment file located five directory levels above the
# current working directory, then return to where we started.
# NOTE(review): the path is relative to $PWD, not to this script's location,
# so this presumably expects to be run from the script's own directory - confirm.
# Only source and popd when pushd succeeded; otherwise .set_env.sh would be
# looked up in the wrong directory and popd would hit an empty directory stack.
if pushd "../../../../../" > /dev/null; then
  # shellcheck source=/dev/null
  source .set_env.sh
  popd > /dev/null
fi
# Grandparent of the current working directory (parent of $PWD, then "..").
# Only referenced by the commented-out WORKDIR default below in this file.
WORKPATH=$(dirname "$PWD")/..
# export WORKDIR=$WORKPATH/../../

# WORKDIR must be supplied by the caller; the tool and database paths set
# further down are derived from it.
if [[ -z "${WORKDIR}" ]]; then
  # Report on stderr and stop with a failure status so callers can detect
  # the missing configuration (previously this exited with status 0).
  # NOTE(review): when this file is sourced, `exit` ends the sourcing shell.
  echo "Please set WORKDIR environment variable" >&2
  exit 1
fi
echo "WORKDIR=${WORKDIR}"
# First address printed by `hostname -I`; used below to build service URLs.
# Assigned and exported in two steps so the export does not mask the
# status of the command substitution.
ip_address=$(hostname -I | awk '{print $1}')
export ip_address

# LLM related environment variables
# Re-export caller-provided values so child processes see them.
export HF_CACHE_DIR="${HF_CACHE_DIR}"
# List the cache directory as a quick sanity check. Quoted and guarded so an
# empty value no longer silently lists the current directory instead.
if [[ -n "${HF_CACHE_DIR}" ]]; then
  ls -- "${HF_CACHE_DIR}"
else
  echo "HF_CACHE_DIR is not set" >&2
fi
export HUGGINGFACEHUB_API_TOKEN="${HUGGINGFACEHUB_API_TOKEN}"
# HF_TOKEN mirrors HUGGINGFACEHUB_API_TOKEN.
export HF_TOKEN="${HUGGINGFACEHUB_API_TOKEN}"
export LLM_MODEL_ID="meta-llama/Llama-3.3-70B-Instruct"
export NUM_SHARDS=4
export LLM_ENDPOINT_URL="http://${ip_address}:8086"
export temperature=0
export max_new_tokens=4096

# agent related environment variables
# Tool definitions live under the GenAIExamples checkout inside WORKDIR.
export TOOLSET_PATH="${WORKDIR}/GenAIExamples/AgentQnA/tools/"
echo "TOOLSET_PATH=${TOOLSET_PATH}"
export recursion_limit_worker=12
export recursion_limit_supervisor=10
# Agent and tool endpoints, all addressed through ip_address.
export WORKER_AGENT_URL="http://${ip_address}:9095/v1/chat/completions"
export SQL_AGENT_URL="http://${ip_address}:9096/v1/chat/completions"
export RETRIEVAL_TOOL_URL="http://${ip_address}:8889/v1/retrievaltool"
export CRAG_SERVER="http://${ip_address}:8080"

export db_name=Chinook
# NOTE(review): absolute path under /home/user - presumably the location as
# seen inside the agent container rather than on the host; confirm.
export db_path="sqlite:////home/user/chinook-db/Chinook_Sqlite.sqlite"

# Fetch the Chinook sample database once. The download goes to a ".part" file
# and is moved into place only on success, so a failed transfer cannot leave
# an empty or truncated database that would suppress future downloads.
_chinook_db_file="${WORKDIR}/GenAIExamples/AgentQnA/tests/Chinook_Sqlite.sqlite"
_chinook_db_url="https://github.com/lerocha/chinook-database/releases/download/v1.4.5/Chinook_Sqlite.sqlite"
if [[ ! -f "${_chinook_db_file}" ]]; then
  echo "Download Chinook_Sqlite!"
  if wget -O "${_chinook_db_file}.part" "${_chinook_db_url}"; then
    mv -- "${_chinook_db_file}.part" "${_chinook_db_file}"
  else
    echo "Failed to download ${_chinook_db_url}" >&2
    rm -f -- "${_chinook_db_file}.part"
  fi
fi
# Helper variables are not part of the exported environment; drop them so a
# sourcing shell is not left with stray names.
unset _chinook_db_file _chinook_db_url

# Configure agent UI (currently disabled; uncomment to write the UI .env file)
# echo "AGENT_URL = 'http://$ip_address:9090/v1/chat/completions'" | tee ${WORKDIR}/GenAIExamples/AgentQnA/ui/svelte/.env

# retriever
# First address printed by `hostname -I`. Assigned and exported in two steps
# so the export does not mask the status of the command substitution.
host_ip=$(hostname -I | awk '{print $1}')
export host_ip

# Re-export caller-provided proxy settings so child processes see them.
export no_proxy="${no_proxy}"
export http_proxy="${http_proxy}"
export https_proxy="${https_proxy}"

# Embedding / reranking models and their endpoints.
export EMBEDDING_MODEL_ID="BAAI/bge-base-en-v1.5"
export RERANK_MODEL_ID="BAAI/bge-reranker-base"
export TEI_EMBEDDING_ENDPOINT="http://${host_ip}:6006"
export TEI_RERANKING_ENDPOINT="http://${host_ip}:8808"

# Vector store settings.
export REDIS_URL="redis://${host_ip}:6379"
export INDEX_NAME="rag-redis"
export RERANK_TYPE="tei"

# Every service host resolves to the same address.
export MEGA_SERVICE_HOST_IP="${host_ip}"
export EMBEDDING_SERVICE_HOST_IP="${host_ip}"
export RETRIEVER_SERVICE_HOST_IP="${host_ip}"
export RERANK_SERVICE_HOST_IP="${host_ip}"

# Retrieval tool and data-preparation endpoints.
export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:8889/v1/retrievaltool"
export DATAPREP_SERVICE_ENDPOINT="http://${host_ip}:6007/v1/dataprep/ingest"
export DATAPREP_GET_FILE_ENDPOINT="http://${host_ip}:6008/v1/dataprep/get"
export DATAPREP_DELETE_FILE_ENDPOINT="http://${host_ip}:6009/v1/dataprep/delete"

# Set OpenTelemetry Tracing Endpoint
# JAEGER_IP is the "src" address reported by `ip route get 8.8.8.8`, i.e. the
# local address the routing table selects for reaching that destination.
# Assigned and exported in two steps so the export does not mask the status
# of the command substitution.
JAEGER_IP=$(ip route get 8.8.8.8 | grep -oP 'src \K[^ ]+')
export JAEGER_IP
export OTEL_EXPORTER_OTLP_TRACES_ENDPOINT="grpc://${JAEGER_IP}:4317"
export TELEMETRY_ENDPOINT="http://${JAEGER_IP}:4318/v1/traces"

# Extend no_proxy with the service names and local addresses that must bypass
# the proxy (the names are presumably compose service names - confirm).
# The list is assembled entry by entry and empty entries are skipped, so an
# unset no_proxy / host_ip / JAEGER_IP no longer yields a leading comma or a
# ",," gap in the result.
IFS=',' read -r -a _no_proxy_entries <<< "${no_proxy}"
_no_proxy_entries+=(
  rag-agent-endpoint
  sql-agent-endpoint
  react-agent-endpoint
  agent-ui
  vllm-gaudi-server
  jaeger
  grafana
  prometheus
  node-exporter
  gaudi-exporter
  127.0.0.1
  localhost
  0.0.0.0
  "${host_ip}"
  "${JAEGER_IP}"
)
_no_proxy_joined=""
for _no_proxy_entry in "${_no_proxy_entries[@]}"; do
  if [[ -n "${_no_proxy_entry}" ]]; then
    _no_proxy_joined+="${_no_proxy_joined:+,}${_no_proxy_entry}"
  fi
done
export no_proxy="${_no_proxy_joined}"
# Helper variables are not part of the exported environment; drop them so a
# sourcing shell is not left with stray names.
unset _no_proxy_entries _no_proxy_joined _no_proxy_entry