File tree
1 file changed: +11 -2 lines changed
Original file line number | Diff line number | Diff line change
32
32
from vllm .attention import AttentionType , get_attn_backend
33
33
from vllm .attention .layer import Attention
34
34
from vllm .config import CompilationLevel , VllmConfig
35
- from vllm .distributed .kv_transfer import (get_kv_transfer_group ,
36
- has_kv_transfer_group )
37
35
from vllm .distributed .parallel_state import get_pp_group
38
36
from vllm .forward_context import set_forward_context
39
37
from vllm .inputs import INPUT_REGISTRY
57
55
from vllm_ascend .attention .attention_v1 import AscendAttentionState
58
56
from vllm_ascend .platform import NPUPlatform
59
57
58
+ if vllm_version_is ("0.8.4" ):
59
+ from vllm .distributed import get_kv_transfer_group
60
+
61
+ def has_kv_transfer_group () -> bool :
62
+ # vLLM 0.8.4 does not support disaggregated prefill, so this stub
63
+ # always returns False to stay compatible with vLLM 0.8.4.
64
+ return False
65
+ else :
66
+ from vllm .distributed .kv_transfer import ( # type: ignore
67
+ get_kv_transfer_group , has_kv_transfer_group )
68
+
60
69
if TYPE_CHECKING :
61
70
import xgrammar as xgr # type: ignore[import-untyped]
62
71
from vllm .v1 .core .sched .output import SchedulerOutput
You can’t perform that action at this time.
0 commit comments