diff --git a/ChatQnA/microservice/gaudi/README.md b/ChatQnA/microservice/gaudi/README.md
index 50fe8124d..e9183c471 100644
--- a/ChatQnA/microservice/gaudi/README.md
+++ b/ChatQnA/microservice/gaudi/README.md
@@ -95,8 +95,6 @@ export INDEX_NAME="rag-redis"
 export HUGGINGFACEHUB_API_TOKEN=${your_hf_api_token}
 ```
 
-Note: Please replace with `your_ip` with you external IP address, do not use localhost.
-
 Note: Please replace with `host_ip` with you external IP address, do not use localhost.
 
 ### Start Microservice Docker Containers
@@ -185,10 +183,21 @@ Following the validation of all aforementioned microservices, we are now prepare
 
 ## 🚀 Construct Mega Service
 
-Modify the `initial_inputs` of line 34 in `chatqna.py`, then you will get the ChatQnA result of this mega service.
+To construct the Mega Service, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `chatqna.py` Python script. Upon executing the script, each microservice's intermediate results will be displayed, allowing users to verify the accuracy of the outcomes and make targeted modifications if necessary.
 
-All of the intermediate results will be printed for each microservice. Users can check the accuracy of the results to make targeted modifications.
+To launch the Mega Service, simply run the following command:
 
 ```bash
 python chatqna.py
 ```
+
+## 🚀 Access the Mega Service
+
+Once the script is executed, a FastAPI server will be initiated. Users can interact with the service through the `/v1/chatqna` endpoint. Here's an example using `curl`:
+
+```bash
+curl http://127.0.0.1:8888/v1/chatqna -H "Content-Type: application/json" -d '{
+     "model": "Intel/neural-chat-7b-v3-3",
+     "messages": "What is the revenue of Nike in 2023?"
+     }'
+```
diff --git a/ChatQnA/microservice/gaudi/chatqna.py b/ChatQnA/microservice/gaudi/chatqna.py
index 61598a0c1..ea82c098a 100644
--- a/ChatQnA/microservice/gaudi/chatqna.py
+++ b/ChatQnA/microservice/gaudi/chatqna.py
@@ -37,6 +37,7 @@ class ChatQnAService:
         self.service_builder.flow_to(embedding, retriever)
         self.service_builder.flow_to(retriever, rerank)
         self.service_builder.flow_to(rerank, llm)
+        self.service_builder.start_server()
 
     def schedule(self):
         self.service_builder.schedule(initial_inputs={"text": "What is the revenue of Nike in 2023?"})
diff --git a/ChatQnA/microservice/xeon/README.md b/ChatQnA/microservice/xeon/README.md
index 1663368bf..0d2fad967 100644
--- a/ChatQnA/microservice/xeon/README.md
+++ b/ChatQnA/microservice/xeon/README.md
@@ -70,6 +70,8 @@ export INDEX_NAME="rag-redis"
 export HUGGINGFACEHUB_API_TOKEN=${your_hf_api_token}
 ```
 
+Note: Please replace `host_ip` with your external IP address, do not use localhost.
+
 ### Start Microservice Docker Containers
 
 ```bash
@@ -154,9 +156,9 @@ Following the validation of all aforementioned microservices, we are now prepare
 
 ## 🚀 Construct Mega Service
 
-Modify the `initial_inputs` of line 34 in `chatqna.py`, then you will get the ChatQnA result of this mega service.
+To construct the Mega Service, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `chatqna.py` Python script. Upon executing the script, each microservice's intermediate results will be displayed, allowing users to verify the accuracy of the outcomes and make targeted modifications if necessary.
 
-All of the intermediate results will be printed for each microservices. Users can check the accuracy of the results to make targeted modifications.
+To launch the Mega Service, simply run the following command:
 
 ### Run Mega Service with Python
 
@@ -184,3 +186,14 @@ Then you can check the result of your chatqna service with the command below.
 ```bash
 docker logs chatqna-xeon-server
 ```
+
+## 🚀 Access the Mega Service
+
+Once the mega service Docker container is launched, a FastAPI server will be initiated. Users can interact with the service through the `/v1/chatqna` endpoint. Here's an example using `curl`:
+
+```bash
+curl http://127.0.0.1:8888/v1/chatqna -H "Content-Type: application/json" -d '{
+     "model": "Intel/neural-chat-7b-v3-3",
+     "messages": "What is the revenue of Nike in 2023?"
+     }'
+```
diff --git a/ChatQnA/microservice/xeon/chatqna.py b/ChatQnA/microservice/xeon/chatqna.py
index 52851ce64..a673e5af1 100644
--- a/ChatQnA/microservice/xeon/chatqna.py
+++ b/ChatQnA/microservice/xeon/chatqna.py
@@ -41,6 +41,7 @@ class ChatQnAService:
         self.service_builder.flow_to(embedding, retriever)
         self.service_builder.flow_to(retriever, rerank)
         self.service_builder.flow_to(rerank, llm)
+        self.service_builder.start_server()
 
     def schedule(self):
         self.service_builder.schedule(initial_inputs={"text": "What is the revenue of Nike in 2023?"})
diff --git a/ChatQnA/tests/test_chatqna_on_gaudi.sh b/ChatQnA/tests/test_chatqna_on_gaudi.sh
index e5317ca2d..ab7ebe789 100644
--- a/ChatQnA/tests/test_chatqna_on_gaudi.sh
+++ b/ChatQnA/tests/test_chatqna_on_gaudi.sh
@@ -115,7 +115,12 @@ function check_microservices() {
 }
 
 function run_megaservice() {
+    # Construct Mega Service
     python chatqna.py > ${LOG_PATH}/run_megaservice.log
+    # Access the Mega Service
+    curl http://127.0.0.1:8888/v1/chatqna -H "Content-Type: application/json" -d '{
+        "model": "Intel/neural-chat-7b-v3-3",
+        "messages": "What is the revenue of Nike in 2023?"}' > ${LOG_PATH}/curl_megaservice.log
 }
 
 function check_results() {
@@ -125,6 +130,10 @@ function check_results() {
         status=true
     fi
 
+    if [[ -f $LOG_PATH/curl_megaservice.log ]] && [[ $(grep -c "\$51.2 billion" $LOG_PATH/curl_megaservice.log) == 0 ]]; then
+        status=false
+    fi
+
     if [ $status == false ]; then
         echo "Response check failed, please check the logs in artifacts!"
         exit 1
diff --git a/ChatQnA/tests/test_chatqna_on_xeon.sh b/ChatQnA/tests/test_chatqna_on_xeon.sh
index b50e70aea..71a2930be 100644
--- a/ChatQnA/tests/test_chatqna_on_xeon.sh
+++ b/ChatQnA/tests/test_chatqna_on_xeon.sh
@@ -108,16 +108,26 @@ function check_microservices() {
 }
 
 function run_megaservice() {
+    # Construct Mega Service
     python chatqna.py > ${LOG_PATH}/run_megaservice.log
+    # Access the Mega Service
+    curl http://127.0.0.1:8888/v1/chatqna -H "Content-Type: application/json" -d '{
+        "model": "Intel/neural-chat-7b-v3-3",
+        "messages": "What is the revenue of Nike in 2023?"}' > ${LOG_PATH}/curl_megaservice.log
 }
 
 function check_results() {
+    echo "Checking response results, make sure the output is reasonable."
     local status=false
     if [[ -f $LOG_PATH/run_megaservice.log ]] && [[ $(grep -c "\$51.2 billion" $LOG_PATH/run_megaservice.log) != 0 ]]; then
         status=true
     fi
 
+    if [[ -f $LOG_PATH/curl_megaservice.log ]] && [[ $(grep -c "\$51.2 billion" $LOG_PATH/curl_megaservice.log) == 0 ]]; then
+        status=false
+    fi
+
     if [ $status == false ]; then
         echo "Response check failed, please check the logs in artifacts!"
         exit 1
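
For reference, the `/v1/chatqna` request that the READMEs and test scripts issue with `curl` can also be sent from Python. This is a minimal sketch, not part of the diff above: it assumes the mega service started by `chatqna.py` is already listening on `127.0.0.1:8888` as configured in the READMEs and that the `requests` package is installed.

```python
# Minimal client sketch for the ChatQnA mega service (assumes the server
# started by chatqna.py is running and listening on 127.0.0.1:8888).
import requests

url = "http://127.0.0.1:8888/v1/chatqna"
payload = {
    "model": "Intel/neural-chat-7b-v3-3",
    "messages": "What is the revenue of Nike in 2023?",
}

# Equivalent to the curl command used in the READMEs and test scripts.
response = requests.post(url, json=payload, timeout=300)
response.raise_for_status()
# The response schema is not shown in the diff, so just print the raw body.
print(response.text)
```

Searching the printed body for the expected answer mirrors the `"\$51.2 billion"` grep check in the test scripts.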