Commit bfec114 (1 parent: 6100e0d)
vllm_ascend/worker/model_runner_v1.py
@@ -625,9 +625,9 @@ def _get_forward_metadata_across_dp(
             with_prefill: bool) -> tuple[torch.Tensor, bool]:
         local_forward_metadata = torch.tensor([num_tokens, with_prefill],
                                               device="npu",
-                                              dtype=torch.int32)
+                                              dtype=torch.int32).unsqueeze(0)
         global_forward_metadata = get_dp_group().all_gather(
-            local_forward_metadata)
+            local_forward_metadata, dim=0)
         num_tokens_across_dp = global_forward_metadata[:, 0].cpu()
         with_prefill = bool(global_forward_metadata[:, 1].any())
         return num_tokens_across_dp, with_prefill
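The change makes each data-parallel rank contribute a [1, 2] row (via .unsqueeze(0)) and gathers explicitly along dim=0, so the gathered result is a [dp_size, 2] matrix whose first column holds per-rank token counts and whose second column holds the prefill flags. The sketch below (not the vllm-ascend code itself) illustrates that shape logic: the collective is simulated with torch.cat on CPU, the per-rank inputs are hypothetical, and in the real code the gather is get_dp_group().all_gather on NPU tensors.

import torch

def simulated_all_gather(local_rows: list[torch.Tensor], dim: int = 0) -> torch.Tensor:
    # Stand-in for the DP all_gather collective: every rank ends up with the
    # concatenation of all ranks' local tensors along `dim`.
    return torch.cat(local_rows, dim=dim)

# Hypothetical per-rank inputs: (num_tokens, with_prefill) for 3 DP ranks.
per_rank = [(128, False), (64, True), (256, False)]

local_rows = [
    torch.tensor([num_tokens, with_prefill], dtype=torch.int32).unsqueeze(0)  # shape [1, 2]
    for num_tokens, with_prefill in per_rank
]

global_forward_metadata = simulated_all_gather(local_rows, dim=0)  # shape [3, 2]

num_tokens_across_dp = global_forward_metadata[:, 0].cpu()  # tensor([128,  64, 256], dtype=torch.int32)
with_prefill = bool(global_forward_metadata[:, 1].any())    # True, since rank 1 has prefill

print(num_tokens_across_dp, with_prefill)

Without the unsqueeze, each rank would send a 1-D [2] tensor and the gathered result would be a flat [dp_size * 2] vector, so the [:, 0] and [:, 1] column slices used afterwards would not work; gathering explicit rows along dim=0 keeps the per-rank structure intact.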