From 7295bae71aad02c6f17b08c9dedfdbf2038655cb Mon Sep 17 00:00:00 2001 From: liuyumoye Date: Mon, 23 Jun 2025 15:54:01 +0800 Subject: [PATCH] support --no-enable-chunked-prefill for V1 Signed-off-by: liuyumoye --- vllm/engine/arg_utils.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py index dd09f514906d..d50d55de3feb 100644 --- a/vllm/engine/arg_utils.py +++ b/vllm/engine/arg_utils.py @@ -1545,7 +1545,8 @@ def _set_default_args_v1(self, usage_context: UsageContext, # for non-pooling tasks. # For pooling tasks the default is False if model_config.runner_type != "pooling": - self.enable_chunked_prefill = True + if self.enable_chunked_prefill is None: + self.enable_chunked_prefill = True if self.enable_prefix_caching is None: self.enable_prefix_caching = True else: