1 file changed: +1 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -968,7 +968,6 @@ def apply(
968
968
topk_ids = torch .randint_like (topk_ids , 0 , global_num_experts )
969
969
970
970
fused_moe_state = get_forward_context ().fused_moe_state
971
-
972
971
if fused_moe_state == FusedMoEState .MC2 :
973
972
mc2_mask = kwargs .get ("mc2_mask" , None )
974
973
return fused_experts_with_mc2 (
@@ -1209,7 +1208,7 @@ def forward(self,
1209
1208
shared_hidden_states = shared_experts (hidden_states )
1210
1209
1211
1210
attn_metadata = get_forward_context ().attn_metadata
1212
- mc2_mask = attn_metadata .decode .mc2_mask if attn_metadata is not None and attn_metadata . decode is not None else None
1211
+ mc2_mask = attn_metadata .decode .mc2_mask if attn_metadata is not None and getattr (attn_metadata , "decode" , None ) is not None else None
1213
1212
1214
1213
tp_size = get_tensor_model_parallel_world_size ()
1215
1214
if tp_size > 1 and fused_moe_state != FusedMoEState .AllGather :
You can’t perform that action at this time.
0 commit comments