remove qconfig, fix typo

kylesayrs · kylesayrs · commit d8e8213f7489 · 2025-06-23T16:22:45.000-04:00
Signed-off-by: Kyle Sayers <kylesayrs@gmail.com>
diff --git a/examples/quantizing_moe/deepseek_r1_example.py b/examples/quantizing_moe/deepseek_r1_example.py
@@ -1,5 +1,5 @@
 from datasets import load_dataset
-from transformers import AutoModelForCausalLM, AutoTokenizer
+from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
 
 from llmcompressor.modeling import prepare_for_calibration
 from llmcompressor.modifiers.quantization import GPTQModifier
@@ -9,7 +9,11 @@
 # For DeepSeek-R1, we require a full precision model in order to properly calibrate
 # `DeepSeek-R1-0528-BF16` is a DeepSeek-V3 FP8 model which has been converted to BF16
 model_id = "unsloth/DeepSeek-R1-0528-BF16"
-model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype="auto")
+config = AutoConfig.from_pretrained(model_id)
+del config.quantization_config  # fp8 qconfig no longer applies to bf16 model
+model = AutoModelForCausalLM.from_pretrained(
+    model_id, torch_dtype="auto", config=config
+)
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = prepare_for_calibration(model)
 
diff --git a/src/llmcompressor/modeling/prepare.py b/src/llmcompressor/modeling/prepare.py
@@ -13,8 +13,9 @@
 
 def prepare_for_calibration(model: PreTrainedModel) -> PreTrainedModel:
     def replace(module: torch.nn.Module) -> torch.nn.Module:
-        if module.__class__.__name__ in replacements:
-            return replacements[module.__class__](module)
+        cls_name = module.__class__.__name__
+        if cls_name in replacements:
+            return replacements[cls_name](module)
         else:
             return module