File tree 1 file changed +5
-0
lines changed
1 file changed +5
-0
lines changed Original file line number Diff line number Diff line change @@ -275,6 +275,11 @@ type ChatCompletionRequest struct {
275
275
Metadata map [string ]string `json:"metadata,omitempty"`
276
276
// Configuration for a predicted output.
277
277
Prediction * Prediction `json:"prediction,omitempty"`
278
+ // ChatTemplateKwargs provides a way to add non-standard parameters to the request body.
279
+ // https://github.com/vllm-project/vllm/blob/05a4324f8e3932c25554791ff248e3e0200eef92/vllm/entrypoints/openai/protocol.py#L320
280
+ // Additional kwargs to pass to the template renderer; they are accessible from within the chat template.
281
+ // For example, this field can toggle thinking mode for Qwen3; see https://qwen.readthedocs.io/en/latest/deployment/vllm.html#thinking-non-thinking-modes
282
+ ChatTemplateKwargs map [string ]any `json:"chat_template_kwargs,omitempty"`
278
283
}
279
284
280
285
type StreamOptions struct {
You can’t perform that action at this time.
0 commit comments