remove examples gateway. (#1250)
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
This commit is contained in:
@@ -4,7 +4,8 @@
|
||||
import asyncio
|
||||
import os
|
||||
|
||||
from comps import Gateway, MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceType
|
||||
from comps import MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceRoleType, ServiceType
|
||||
from comps.cores.mega.utils import handle_message
|
||||
from comps.cores.proto.api_protocol import (
|
||||
ChatCompletionRequest,
|
||||
ChatCompletionResponse,
|
||||
@@ -21,11 +22,12 @@ LLM_SERVICE_HOST_IP = os.getenv("LLM_SERVICE_HOST_IP", "0.0.0.0")
|
||||
LLM_SERVICE_PORT = int(os.getenv("LLM_SERVICE_PORT", 9000))
|
||||
|
||||
|
||||
class CodeGenService(Gateway):
|
||||
class CodeGenService:
|
||||
def __init__(self, host="0.0.0.0", port=8000):
|
||||
self.host = host
|
||||
self.port = port
|
||||
self.megaservice = ServiceOrchestrator()
|
||||
self.endpoint = str(MegaServiceEndpoint.CODE_GEN)
|
||||
|
||||
def add_remote_service(self):
|
||||
llm = MicroService(
|
||||
@@ -42,7 +44,7 @@ class CodeGenService(Gateway):
|
||||
data = await request.json()
|
||||
stream_opt = data.get("stream", True)
|
||||
chat_request = ChatCompletionRequest.parse_obj(data)
|
||||
prompt = self._handle_message(chat_request.messages)
|
||||
prompt = handle_message(chat_request.messages)
|
||||
parameters = LLMParams(
|
||||
max_tokens=chat_request.max_tokens if chat_request.max_tokens else 1024,
|
||||
top_k=chat_request.top_k if chat_request.top_k else 10,
|
||||
@@ -78,14 +80,17 @@ class CodeGenService(Gateway):
|
||||
return ChatCompletionResponse(model="codegen", choices=choices, usage=usage)
|
||||
|
||||
def start(self):
|
||||
super().__init__(
|
||||
megaservice=self.megaservice,
|
||||
self.service = MicroService(
|
||||
self.__class__.__name__,
|
||||
service_role=ServiceRoleType.MEGASERVICE,
|
||||
host=self.host,
|
||||
port=self.port,
|
||||
endpoint=str(MegaServiceEndpoint.CODE_GEN),
|
||||
endpoint=self.endpoint,
|
||||
input_datatype=ChatCompletionRequest,
|
||||
output_datatype=ChatCompletionResponse,
|
||||
)
|
||||
self.service.add_route(self.endpoint, self.handle_request, methods=["POST"])
|
||||
self.service.start()
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
|
||||
Reference in New Issue
Block a user