@@ -390,6 +390,8 @@ public Function(String description, String name, String jsonSchema) {
390
390
* @param maxTokens The maximum number of tokens to generate in the chat completion.
391
391
* The total length of input tokens and generated tokens is limited by the model's
392
392
* context length.
393
+ * @param maxCompletionTokens An upper bound for the number of tokens that can be
394
+ * generated for a completion, including visible output tokens and reasoning tokens.
393
395
* @param n How many chat completion choices to generate for each input message. Note
394
396
* that you will be charged based on the number of generated tokens across all the
395
397
* choices. Keep n as 1 to minimize costs.
@@ -442,6 +444,7 @@ public record ChatCompletionRequest(// @formatter:off
442
444
@ JsonProperty ("logprobs" ) Boolean logprobs ,
443
445
@ JsonProperty ("top_logprobs" ) Integer topLogprobs ,
444
446
@ JsonProperty ("max_tokens" ) Integer maxTokens ,
447
+ @ JsonProperty ("max_completion_tokens" ) Integer maxCompletionTokens ,
445
448
@ JsonProperty ("n" ) Integer n ,
446
449
@ JsonProperty ("presence_penalty" ) Double presencePenalty ,
447
450
@ JsonProperty ("response_format" ) ResponseFormat responseFormat ,
@@ -464,7 +467,7 @@ public record ChatCompletionRequest(// @formatter:off
464
467
* @param temperature What sampling temperature to use, between 0 and 2.
465
468
*/
466
469
public ChatCompletionRequest (List <ChatCompletionMessage > messages , String model , Double temperature ) {
467
- this (messages , model , null , null , null , null , null , null , null ,
470
+ this (messages , model , null , null , null , null , null , null , null , null ,
468
471
null , null , null , false , null , temperature , null ,
469
472
null , null , null , null );
470
473
}
@@ -479,7 +482,7 @@ public ChatCompletionRequest(List<ChatCompletionMessage> messages, String model,
479
482
* as they become available, with the stream terminated by a data: [DONE] message.
480
483
*/
481
484
public ChatCompletionRequest (List <ChatCompletionMessage > messages , String model , Double temperature , boolean stream ) {
482
- this (messages , model , null , null , null , null , null , null , null ,
485
+ this (messages , model , null , null , null , null , null , null , null , null ,
483
486
null , null , null , stream , null , temperature , null ,
484
487
null , null , null , null );
485
488
}
@@ -495,7 +498,7 @@ public ChatCompletionRequest(List<ChatCompletionMessage> messages, String model,
495
498
*/
496
499
public ChatCompletionRequest (List <ChatCompletionMessage > messages , String model ,
497
500
List <FunctionTool > tools , Object toolChoice ) {
498
- this (messages , model , null , null , null , null , null , null , null ,
501
+ this (messages , model , null , null , null , null , null , null , null , null ,
499
502
null , null , null , false , null , 0.8 , null ,
500
503
tools , toolChoice , null , null );
501
504
}
@@ -509,7 +512,7 @@ public ChatCompletionRequest(List<ChatCompletionMessage> messages, String model,
509
512
*/
510
513
public ChatCompletionRequest (List <ChatCompletionMessage > messages , Boolean stream ) {
511
514
this (messages , null , null , null , null , null , null , null , null ,
512
- null , null , null , stream , null , null , null ,
515
+ null , null , null , null , stream , null , null , null ,
513
516
null , null , null , null );
514
517
}
515
518
@@ -520,7 +523,7 @@ public ChatCompletionRequest(List<ChatCompletionMessage> messages, Boolean strea
520
523
* @return A new {@link ChatCompletionRequest} with the specified stream options.
521
524
*/
522
525
public ChatCompletionRequest withStreamOptions (StreamOptions streamOptions ) {
523
- return new ChatCompletionRequest (messages , model , frequencyPenalty , logitBias , logprobs , topLogprobs , maxTokens , n , presencePenalty ,
526
+ return new ChatCompletionRequest (messages , model , frequencyPenalty , logitBias , logprobs , topLogprobs , maxTokens , maxCompletionTokens , n , presencePenalty ,
524
527
responseFormat , seed , stop , stream , streamOptions , temperature , topP ,
525
528
tools , toolChoice , parallelToolCalls , user );
526
529
}
0 commit comments