@@ -107,16 +107,15 @@ class ChatCompletionRequest(BaseModel):
107107 """Chat completion request."""
108108 model : str
109109
110- messages : Union [str , List [Dict [str , Any ]]] = Field (examples = [[{'role' : 'user' , 'content' : 'hi' }]]) # noqa
110+ messages : Union [str , List [Dict [str , Any ]]] = Field (examples = [[{'role' : 'user' , 'content' : 'hi' }]])
111111 temperature : Optional [float ] = 0.7
112112 top_p : Optional [float ] = 1.0
113113 tools : Optional [List [Tool ]] = Field (default = None , examples = [None ])
114- tool_choice : Union [ToolChoice , Literal ['auto' , 'required' , 'none' ]] = Field (default = 'auto' ,
115- examples = ['none' ]) # noqa
114+ tool_choice : Union [ToolChoice , Literal ['auto' , 'required' , 'none' ]] = Field (default = 'auto' , examples = ['none' ])
116115 logprobs : Optional [bool ] = False
117116 top_logprobs : Optional [int ] = None
118117 n : Optional [int ] = 1
119- logit_bias : Optional [Dict [str , float ]] = Field (default = None , examples = [None ]) # noqa
118+ logit_bias : Optional [Dict [str , float ]] = Field (default = None , examples = [None ])
120119 max_completion_tokens : Optional [int ] = Field (
121120 default = None ,
122121 examples = [None ],
@@ -128,15 +127,15 @@ class ChatCompletionRequest(BaseModel):
128127 examples = [None ],
129128 deprecated = 'max_tokens is deprecated in favor of the max_completion_tokens field' ,
130129 )
131- stop : Optional [Union [str , List [str ]]] = Field (default = None , examples = [None ]) # noqa
130+ stop : Optional [Union [str , List [str ]]] = Field (default = None , examples = [None ])
132131
133132 stream : Optional [bool ] = False
134133 stream_options : Optional [StreamOptions ] = Field (default = None , examples = [None ])
135134 presence_penalty : Optional [float ] = 0.0
136135 frequency_penalty : Optional [float ] = 0.0
137136 user : Optional [str ] = None
138137 reasoning_effort : Optional [Literal ['low' , 'medium' , 'high' ]] = None
139- response_format : Optional [ResponseFormat ] = Field (default = None , examples = [None ]) # noqa
138+ response_format : Optional [ResponseFormat ] = Field (default = None , examples = [None ])
140139 # additional argument of lmdeploy
141140 do_preprocess : Optional [bool ] = True
142141 repetition_penalty : Optional [float ] = 1.0
@@ -150,6 +149,7 @@ class ChatCompletionRequest(BaseModel):
150149 min_p : float = 0.0
151150 enable_thinking : Optional [bool ] = None
152151 return_token_ids : Optional [bool ] = False
152+ include_stop_str_in_output : Optional [bool ] = False
153153
154154
155155class FunctionCall (BaseModel ):
0 commit comments