We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cd4cfee, commit 1567180 (Copy full SHA for 1567180)
vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe.py
@@ -621,8 +621,7 @@ def apply(
 num_expert_group=num_expert_group,
 custom_routing_function=custom_routing_function,
 scoring_func=scoring_func,
-e_score_correction_bias=e_score_correction_bias,
-indices_type=torch.uint32)
+e_score_correction_bias=e_score_correction_bias)
 
 return self.fused_experts(
 x,
0 commit comments