diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py index dd09f514906d..d50d55de3feb 100644 --- a/vllm/engine/arg_utils.py +++ b/vllm/engine/arg_utils.py @@ -1545,7 +1545,8 @@ def _set_default_args_v1(self, usage_context: UsageContext, # for non-pooling tasks. # For pooling tasks the default is False if model_config.runner_type != "pooling": - self.enable_chunked_prefill = True + if self.enable_chunked_prefill is None: + self.enable_chunked_prefill = True if self.enable_prefix_caching is None: self.enable_prefix_caching = True else: