We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1c7aaaa commit 402f574 · Copy full SHA for 402f574
src/python/tritonfrontend/_api/_kservegrpc.py
@@ -79,6 +79,7 @@ class Options:
79
infer_compression_level: Union[
80
int, Grpc_compression_level
81
] = Grpc_compression_level.NONE
82
+ infer_thread_count: int = Field(2, ge=0)
83
infer_allocation_pool_size: int = Field(8, ge=0)
84
max_response_pool_size: int = Field(2_147_483_647, ge=0)
85
forward_header_pattern: str = ""
src/python/tritonfrontend/_api/_kservegrpc.pyi
@@ -56,6 +56,7 @@ class KServeGrpc:
56
max_connection_age_ms: int
57
max_connection_age_grace_ms: int
58
infer_compression_level: int | Grpc_compression_level
59
+ infer_thread_count: int
60
infer_allocation_pool_size: int
61
max_response_pool_size: int
62
forward_header_pattern: str
0 commit comments