Update GraphRAG to be compatible with latest component changes (#1427)
- Updated environment variables to align with recent changes in the neo4j dataprep and retriever components. - Upgraded the tgi-gaudi image version. Related to GenAIComps repo issue #1025 (opea-project/GenAIComps#1025). Original PR: #1384. Original contributor: @rbrugaro. Signed-off-by: Xinyao Wang <xinyao.wang@intel.com> Co-authored-by: Liang Lv <liang1.lv@intel.com>
This commit is contained in:
@@ -60,6 +60,7 @@ services:
|
||||
LIMIT_HPU_GRAPH: true
|
||||
USE_FLASH_ATTENTION: true
|
||||
FLASH_ATTENTION_RECOMPUTE: true
|
||||
TEXT_GENERATION_SERVER_IGNORE_EOS_TOKEN: false
|
||||
runtime: habana
|
||||
cap_add:
|
||||
- SYS_NICE
|
||||
@@ -93,6 +94,7 @@ services:
|
||||
OPENAI_LLM_MODEL: ${OPENAI_LLM_MODEL}
|
||||
EMBEDDING_MODEL_ID: ${EMBEDDING_MODEL_ID}
|
||||
LLM_MODEL_ID: ${LLM_MODEL_ID}
|
||||
MAX_OUTPUT_TOKENS: ${MAX_OUTPUT_TOKENS}
|
||||
LOGFLAG: ${LOGFLAG}
|
||||
restart: unless-stopped
|
||||
retriever-neo4j-llamaindex:
|
||||
@@ -122,6 +124,7 @@ services:
|
||||
OPENAI_LLM_MODEL: ${OPENAI_LLM_MODEL}
|
||||
EMBEDDING_MODEL_ID: ${EMBEDDING_MODEL_ID}
|
||||
LLM_MODEL_ID: ${LLM_MODEL_ID}
|
||||
MAX_OUTPUT_TOKENS: ${MAX_OUTPUT_TOKENS}
|
||||
LOGFLAG: ${LOGFLAG}
|
||||
RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_NEO4J"
|
||||
restart: unless-stopped
|
||||
@@ -144,6 +147,7 @@ services:
|
||||
- RETRIEVER_SERVICE_PORT=7000
|
||||
- LLM_SERVER_HOST_IP=tgi-gaudi-service
|
||||
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
|
||||
- LLM_MODEL_ID=${LLM_MODEL_ID}
|
||||
- LOGFLAG=${LOGFLAG}
|
||||
ipc: host
|
||||
restart: always
|
||||
|
||||
@@ -12,7 +12,7 @@ popd > /dev/null
|
||||
|
||||
export EMBEDDING_MODEL_ID="BAAI/bge-base-en-v1.5"
|
||||
export OPENAI_EMBEDDING_MODEL="text-embedding-3-small"
|
||||
export LLM_MODEL_ID="meta-llama/Meta-Llama-3-8B-Instruct"
|
||||
export LLM_MODEL_ID="meta-llama/Meta-Llama-3.1-8B-Instruct"
|
||||
export OPENAI_LLM_MODEL="gpt-4o"
|
||||
export TEI_EMBEDDING_ENDPOINT="http://${host_ip}:6006"
|
||||
export TGI_LLM_ENDPOINT="http://${host_ip}:6005"
|
||||
@@ -21,3 +21,5 @@ export NEO4J_USERNAME=neo4j
|
||||
export DATAPREP_SERVICE_ENDPOINT="http://${host_ip}:5000/v1/dataprep/ingest"
|
||||
export LOGFLAG=True
|
||||
export RETRIEVER_SERVICE_PORT=80
|
||||
export LLM_SERVER_PORT=80
|
||||
export MAX_OUTPUT_TOKENS=1024
|
||||
|
||||
Reference in New Issue
Block a user