
Commit 82dfe9d

revert unrelated change
Signed-off-by: Kyle Sayers <kylesayrs@gmail.com>
1 parent d955b5e commit 82dfe9d

File tree

3 files changed (+16 additions, -8 deletions)

src/compressed_tensors/compressors/model_compressors/model_compressor.py

Lines changed: 14 additions & 2 deletions
@@ -370,14 +370,20 @@ def get_unexpected_file_keys(self, model: Module) -> List[str]:
     # ----- model memory compression/decompression pathways ----- #

     def compress_model(self, model: Module):
+        """
+        Compress a model in memory. Because the model structure is modified in place,
+        this method is more memory-efficient than `self.compress`
+
+        :param model: model containing parameters to compress
+        """
         module_to_scheme = map_module_to_scheme(model)
         sparse_compression_targets: Set[str] = expand_target_names(
             model=model,
             targets=self.sparsity_config.targets if self.sparsity_config else [],
             ignore=self.sparsity_config.ignore if self.sparsity_config else [],
         )

-        for prefix, module in model.named_modules():
+        for prefix, module in tqdm(model.named_modules(), desc="Compressing model"):
             if prefix in module_to_scheme or prefix in sparse_compression_targets:
                 state_dict = module.state_dict(prefix=f"{prefix}.")
                 # quantization first
@@ -409,14 +415,20 @@ def compress_model(self, model: Module):
                 module.quantization_status = QuantizationStatus.COMPRESSED

     def decompress_model(self, model: Module):
+        """
+        Decompress a model in memory. Because the model structure is modified in place,
+        this method does not require loading some compression parameters from disk
+
+        :param model: model containing parameters to decompress
+        """
         module_to_scheme = map_module_to_scheme(model)
         sparse_compression_targets: Set[str] = expand_target_names(
             model=model,
             targets=self.sparsity_config.targets if self.sparsity_config else [],
             ignore=self.sparsity_config.ignore if self.sparsity_config else [],
         )

-        for prefix, module in model.named_modules():
+        for prefix, module in tqdm(model.named_modules(), desc="Decompressing model"):
             if prefix in module_to_scheme or prefix in sparse_compression_targets:
                 state_dict = module.state_dict(prefix=f"{prefix}.")
                 # sparsity first
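
For context, a minimal usage sketch of the in-place pathways touched here, assuming the library's `ModelCompressor.from_pretrained` entry point; the checkpoint path and model choice are illustrative, not from this commit:

# Hedged sketch: round-tripping a model through the in-memory pathways.
# The checkpoint path is hypothetical; ModelCompressor.from_pretrained is
# assumed to resolve the compression config stored with the checkpoint.
from transformers import AutoModelForCausalLM
from compressed_tensors.compressors import ModelCompressor

ckpt = "path/to/checkpoint"  # hypothetical path
model = AutoModelForCausalLM.from_pretrained(ckpt)
compressor = ModelCompressor.from_pretrained(ckpt)

if compressor is not None:
    compressor.compress_model(model)    # modifies modules in place, now with a tqdm bar
    compressor.decompress_model(model)  # in place, without reloading params from disk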

src/compressed_tensors/quantization/lifecycle/forward.py

Lines changed: 0 additions & 5 deletions
@@ -37,7 +37,6 @@
     "dequantize",
     "fake_quantize",
     "wrap_module_forward_quantized",
-    "unwrap_module_forward_quantized",
     "forward_quantize",
 ]

@@ -313,10 +312,6 @@ def wrapped_forward(self, *args, **kwargs):
     setattr(module, "forward", bound_wrapped_forward)


-def unwrap_module_forward_quantized(module: Module):
-    delattr(module, "forward")  # revert to class implementation
-
-
 def forward_quantize(
     module: Module, value: torch.Tensor, base_name: str, args: "QuantizationArgs"
 ) -> torch.Tensor:
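
The deleted helper relied on a standard Python mechanic rather than anything library-specific: `setattr` on an instance shadows the class-level `forward`, and `delattr` falls back to it. A standalone sketch of that mechanic (class and variable names are illustrative, not from this repo):

# Illustration of the mechanic behind the removed
# unwrap_module_forward_quantized: deleting an instance-level "forward"
# attribute reverts calls to the class implementation.
import torch.nn as nn

class Passthrough(nn.Module):
    def forward(self, x):
        return x

m = Passthrough()
setattr(m, "forward", lambda x: x * 2)  # instance attribute shadows the class method
assert m.forward(3) == 6                # wrapped behavior
delattr(m, "forward")                   # revert to class implementation
assert m.forward(3) == 3                # original behavior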

src/compressed_tensors/utils/safetensors_load.py

Lines changed: 2 additions & 1 deletion
@@ -269,7 +269,8 @@ def get_nested_mappings_from_state_dict(
     :param state_dict: state dict of the model
     :param params_to_nest: Iterable of parameter names to nest.
     :return: Nested mapping of parameterized layer names to the value of
-        each layer's compression parameters.
+        each layer's compression parameters. If `return_unmatched_params`, then
+        also return a dictionary mapping unused parameter names to their values
     """
     nested_weight_mappings = {}
     unmatched_params = {}
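
A hedged sketch of the behavior the amended docstring describes, assuming a `return_unmatched_params` keyword as implied by the diff; the state-dict contents and parameter names are invented for illustration:

# Sketch of the documented return shape; the signature is inferred from
# the docstring above, and the tensors are placeholders.
import torch
from compressed_tensors.utils.safetensors_load import (
    get_nested_mappings_from_state_dict,
)

state_dict = {
    "model.layers.0.weight": torch.zeros(4, 4),
    "model.layers.0.weight_scale": torch.ones(1),
    "lm_head.bias": torch.zeros(4),
}

nested, unmatched = get_nested_mappings_from_state_dict(
    state_dict,
    params_to_nest=["weight", "weight_scale"],
    return_unmatched_params=True,
)
# nested    -> {"model.layers.0": {"weight": ..., "weight_scale": ...}}
# unmatched -> {"lm_head.bias": ...}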
