Skip to content

Commit c2318fe

Browse files
committed
fix: resolve import issue when running with vllm 0.8.4
Signed-off-by: Jade Zheng <zheng.shoujian@outlook.com>
1 parent 720407f commit c2318fe

File tree

1 file changed

+11
-2
lines changed

1 file changed

+11
-2
lines changed

vllm_ascend/worker/model_runner_v1.py

Lines changed: 11 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -32,8 +32,6 @@
3232
from vllm.attention import AttentionType, get_attn_backend
3333
from vllm.attention.layer import Attention
3434
from vllm.config import CompilationLevel, VllmConfig
35-
from vllm.distributed.kv_transfer import (get_kv_transfer_group,
36-
has_kv_transfer_group)
3735
from vllm.distributed.parallel_state import get_pp_group
3836
from vllm.forward_context import set_forward_context
3937
from vllm.inputs import INPUT_REGISTRY
@@ -57,6 +55,17 @@
5755
from vllm_ascend.attention.attention_v1 import AscendAttentionState
5856
from vllm_ascend.platform import NPUPlatform
5957

58+
if vllm_version_is("0.8.4"):
59+
from vllm.distributed import get_kv_transfer_group
60+
61+
def has_kv_transfer_group() -> bool:
62+
# vLLM 0.8.4 does not support disaggregated prefill. This function is
63+
# added to ensure compatibility with vLLM 0.8.4.
64+
return False
65+
else:
66+
from vllm.distributed.kv_transfer import ( # type: ignore
67+
get_kv_transfer_group, has_kv_transfer_group)
68+
6069
if TYPE_CHECKING:
6170
import xgrammar as xgr # type: ignore[import-untyped]
6271
from vllm.v1.core.sched.output import SchedulerOutput

0 commit comments

Comments
 (0)