We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 99c8489 · commit c1feccd · Copy full SHA for c1feccd
vllm_ascend/worker/worker_v1.py
@@ -247,9 +247,10 @@ def pin_lora(self, lora_id: int) -> bool:

     def execute_dummy_batch(self) -> None:
         runner = self.model_runner
-        assert runner.dp_size > 1, "Dummy batch execution should only be " \
-            "performed with data parallelism enabled, but got " \
-            f"dp_size={runner.dp_size}."
+        if runner.dp_size <= 1:
+            raise ValueError("Dummy batch execution should only be "
+                             "performed with data parallelism enabled, but got "
+                             f"dp_size={runner.dp_size}.")

         # If torchair graph is enabled, notify the other DP ranks that this is a
         # dummy run by using '-1' as a flag for num_tokens. This will be
0 commit comments