Update vllm_ascend/worker/model_runner_v1.py

jianzs · jianzs · commit 7b605f89847b · 2025-07-17T20:46:06.000+08:00
Co-authored-by: Angazenn <92204292+Angazenn@users.noreply.github.com>

Signed-off-by: Jade Zheng <zheng.shoujian@outlook.com>
diff --git a/vllm_ascend/worker/model_runner_v1.py b/vllm_ascend/worker/model_runner_v1.py
@@ -550,9 +550,9 @@ def _get_forward_metadata_across_dp(
             with_prefill: bool) -> tuple[torch.Tensor, bool]:
         local_forward_metadata = torch.tensor([num_tokens, with_prefill],
                                               device="npu",
-                                              dtype=torch.int32)
+                                              dtype=torch.int32).unsqueeze(0)
         global_forward_metadata = get_dp_group().all_gather(
-            local_forward_metadata)
+            local_forward_metadata, dim=0)
         num_tokens_across_dp = global_forward_metadata[:, 0].cpu()
         with_prefill = bool(global_forward_metadata[:, 1].any())
         return num_tokens_across_dp, with_prefill