File tree Expand file tree Collapse file tree 1 file changed +2
-11
lines changed Expand file tree Collapse file tree 1 file changed +2
-11
lines changed Original file line number Diff line number Diff line change 32
32
from vllm .attention import AttentionType , get_attn_backend
33
33
from vllm .attention .layer import Attention
34
34
from vllm .config import CompilationLevel , VllmConfig
35
+ from vllm .distributed .kv_transfer import (get_kv_transfer_group ,
36
+ has_kv_transfer_group )
35
37
from vllm .distributed .parallel_state import get_pp_group
36
38
from vllm .forward_context import set_forward_context
37
39
from vllm .inputs import INPUT_REGISTRY
55
57
from vllm_ascend .attention .attention_v1 import AscendAttentionState
56
58
from vllm_ascend .platform import NPUPlatform
57
59
58
- if vllm_version_is ("0.8.4" ):
59
- from vllm .distributed import get_kv_transfer_group
60
-
61
- def has_kv_transfer_group () -> bool :
62
- # vLLM 0.8.4 does not support disaggregated prefill. This function is
63
- # added to ensure compatibility with vLLM 0.8.4.
64
- return False
65
- else :
66
- from vllm .distributed .kv_transfer import ( # type: ignore
67
- get_kv_transfer_group , has_kv_transfer_group )
68
-
69
60
if TYPE_CHECKING :
70
61
import xgrammar as xgr # type: ignore[import-untyped]
71
62
from vllm .v1 .core .sched .output import SchedulerOutput
You can’t perform that action at this time.
0 commit comments