Revert max_new_tokens to 1024 (#479)

Signed-off-by: lvliang-intel <liang1.lv@intel.com>
Author:    lvliang-intel
Date:      2024-08-14 01:05:17 +08:00
Committed: GitHub
Parent:    62ca5bcf55
Commit:    f2497c5638


@@ -160,7 +160,7 @@ class ChatCompletionRequest(BaseModel):
     logit_bias: Optional[Dict[str, float]] = None
     logprobs: Optional[bool] = False
     top_logprobs: Optional[int] = 0
-    max_tokens: Optional[int] = 16 # use https://platform.openai.com/docs/api-reference/completions/create
+    max_tokens: Optional[int] = 1024 # use https://platform.openai.com/docs/api-reference/completions/create
     n: Optional[int] = 1
     presence_penalty: Optional[float] = 0.0
     response_format: Optional[ResponseFormat] = None
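
The sketch below is a trimmed reconstruction, not the project's actual module: it keeps only the fields visible in this hunk (response_format is dropped because its ResponseFormat type is defined elsewhere in the file) to illustrate the effect of the reverted default, namely that a request omitting max_tokens now allows up to 1024 generated tokens instead of OpenAI's completions default of 16.

from typing import Dict, Optional

from pydantic import BaseModel


class ChatCompletionRequest(BaseModel):
    # Trimmed reconstruction of the fields shown in the hunk above.
    logit_bias: Optional[Dict[str, float]] = None
    logprobs: Optional[bool] = False
    top_logprobs: Optional[int] = 0
    max_tokens: Optional[int] = 1024  # reverted default
    n: Optional[int] = 1
    presence_penalty: Optional[float] = 0.0


# A request that omits max_tokens picks up the new default of 1024.
req = ChatCompletionRequest()
assert req.max_tokens == 1024

# An explicit value still overrides the default.
assert ChatCompletionRequest(max_tokens=256).max_tokens == 256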