fix: change _dummy_run's num_tokens_across_dp annotation from Optional[int] to Optional[torch.Tensor]

jianzs · jianzs · commit fe1f5c0741cd · 2025-07-08T14:51:21.000+08:00
Signed-off-by: Jade Zheng <zheng.shoujian@outlook.com>
diff --git a/vllm_ascend/worker/model_runner_v1.py b/vllm_ascend/worker/model_runner_v1.py
@@ -1823,7 +1823,7 @@ def _dummy_run(
         is_compile: bool = False,
         with_prefill: bool = True,
         skip_attn: bool = True,
-        num_tokens_across_dp: Optional[int] = None,
+        num_tokens_across_dp: Optional[torch.Tensor] = None,
     ) -> torch.Tensor:
         # Set num_scheduled_tokens based on num_tokens and max_num_seqs
         # for dummy run with LoRA so that the num_reqs collectively