We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 29f8881, commit 49dd290 (Copy full SHA for 49dd290)
vllm/model_executor/layers/quantization/bitsandbytes.py
@@ -5,7 +5,6 @@
5
6
import torch
7
8
-from vllm.model_executor.layers.fused_moe import fused_experts
9
from vllm.model_executor.layers.fused_moe.layer import (FusedMoE,
10
FusedMoEMethodBase)
11
from vllm.model_executor.layers.linear import (LinearBase, LinearMethodBase,
@@ -467,6 +466,7 @@ def apply(
467
466
logical_to_physical_map: Optional[torch.Tensor] = None,
468
logical_replica_count: Optional[torch.Tensor] = None,
469
) -> torch.Tensor:
+ from vllm.model_executor.layers.fused_moe import fused_experts
470
471
if enable_eplb:
472
raise NotImplementedError(
0 commit comments