Skip to content

Commit ff4460d

Browse files
fix: resolve the OpenAI frontend's missing-argument error (#8121)
1 parent f27c0aa commit ff4460d

File tree

2 files changed

+4
-2
lines changed

2 files changed

+4
-2
lines changed

src/python/tritonfrontend/_api/_kservegrpc.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
1+
# Copyright 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
22
#
33
# Redistribution and use in source and binary forms, with or without
44
# modification, are permitted provided that the following conditions
@@ -80,6 +80,7 @@ class Options:
8080
int, Grpc_compression_level
8181
] = Grpc_compression_level.NONE
8282
infer_allocation_pool_size: int = Field(8, ge=0)
83+
max_response_pool_size: int = Field(2_147_483_647, ge=0)
8384
forward_header_pattern: str = ""
8485
# DLIS-7215: Add restricted protocol support
8586
# restricted_protocols: str = ""

src/python/tritonfrontend/_api/_kservegrpc.pyi

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
1+
# Copyright 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
22
#
33
# Redistribution and use in source and binary forms, with or without
44
# modification, are permitted provided that the following conditions
@@ -57,6 +57,7 @@ class KServeGrpc:
5757
max_connection_age_grace_ms: int
5858
infer_compression_level: int | Grpc_compression_level
5959
infer_allocation_pool_size: int
60+
max_response_pool_size: int
6061
forward_header_pattern: str
6162
def __post_init__(self) -> None: ...
6263
triton_frontend: Incomplete

0 commit comments

Comments
 (0)