Fix type annotation of `replace()` parameter in deepseek_v3.py

dsikka · dsikka · commit f8c0b98fd413 · 2025-07-09T19:35:19.000Z
diff --git a/src/llmcompressor/modeling/deepseek_v3.py b/src/llmcompressor/modeling/deepseek_v3.py
@@ -1,4 +1,7 @@
 import torch
+from transformers.models.deepseek_v3.modeling_deepseek_v3 import (
+    DeepseekV3MoE as OriginalDeepseekV3MoE,
+)
 
 
 class DeepseekV3MoE(torch.nn.Module):
@@ -45,7 +48,7 @@ def forward(self, hidden_states):
         return hidden_states
 
 
-def replace(module: "DeepseekV3MoE") -> DeepseekV3MoE:
+def replace(module: OriginalDeepseekV3MoE) -> DeepseekV3MoE:
     return DeepseekV3MoE(
         module.config, module.experts, module.gate, module.shared_experts
     )
diff --git a/src/llmcompressor/modeling/prepare.py b/src/llmcompressor/modeling/prepare.py
@@ -30,6 +30,7 @@ def update_qwen3_moe(model, stack):
     for module in model.modules():
         cls_name = module.__class__.__name__
         if cls_name == "Qwen3MoeDecoderLayer":
+            # Optionally update the model.config to pass in other arguments
             stack.enter_context(
                 patch_attr(module, "mlp", replace_Qwen3MoE(model.config, module.mlp))
             )

Original file line number	Diff line number	Diff line change
`@@ -30,6 +30,7 @@ def update_qwen3_moe(model, stack):`
`30`	`30`	`for module in model.modules():`
`31`	`31`	`cls_name = module.__class__.__name__`
`32`	`32`	`if cls_name == "Qwen3MoeDecoderLayer":`
	`33`	`+ # Optionally update the model.config to pass in other arguments`
`33`	`34`	`stack.enter_context(`
`34`	`35`	`patch_attr(module, "mlp", replace_Qwen3MoE(model.config, module.mlp))`
`35`	`36`	`)`