We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 749b2e9 commit e9e8443 Copy full SHA for e9e8443
fastdeploy/worker/worker_process.py
@@ -360,11 +360,11 @@ def determine_num_available_blocks(self) -> None:
360
model_block_memory_used)
361
# NOTE(liuzichang): Too many blocks will lead to illegal memory access.
362
# We will develop dynamic limits in the future.
363
- if num_blocks_local > 20000:
+ if num_blocks_local > 40000:
364
logger.info(
365
- f"------- Reset num_blocks_local {num_blocks_local} to 20000"
+ f"------- Reset num_blocks_local {num_blocks_local} to 40000"
366
)
367
- num_blocks_local = min(20000, num_blocks_local)
+ num_blocks_local = min(40000, num_blocks_local)
368
369
f"------- model_block_memory_used:{model_block_memory_used} --------"
370
0 commit comments