Skip to content

Commit 7eb461e

Browse files
authored
Remove compression_ratio calculation (#293)
* src/compressed_tensors/quantization/quant_config.py * fix tests
1 parent 4574747 commit 7eb461e

File tree

2 files changed

+4
-7
lines changed

2 files changed

+4
-7
lines changed

src/compressed_tensors/quantization/quant_config.py

Lines changed: 1 addition & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -230,10 +230,6 @@ def from_pretrained(
230230
group_name = "group_" + str(idx)
231231
config_groups[group_name] = scheme
232232

233-
# TODO: this is incorrect in compressed mode, since we are overwriting the
234-
# original weight we lose the uncompressed bit_depth info
235-
compression_ratio = calculate_compression_ratio(model)
236-
237233
if format is None:
238234
if quantization_status == QuantizationStatus.COMPRESSED:
239235
format = CompressionFormat.int_quantized.value
@@ -244,7 +240,7 @@ def from_pretrained(
244240
config_groups=config_groups,
245241
quantization_status=quantization_status,
246242
kv_cache_scheme=kv_cache_scheme,
247-
global_compression_ratio=compression_ratio,
243+
global_compression_ratio=None,
248244
format=format,
249245
ignore=consolidated_ignore,
250246
)

tests/test_quantization/lifecycle/test_apply.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -184,8 +184,9 @@ def test_serialize_config_tinyllama():
184184
assert serialized_config.format == CompressionFormat.dense.value
185185
assert serialized_config.quant_method == DEFAULT_QUANTIZATION_METHOD
186186
assert serialized_config.ignore == ["model.layers.1.mlp.down_proj"]
187-
assert serialized_config.global_compression_ratio > 1.0
188-
assert serialized_config.global_compression_ratio < 8.0
187+
if serialized_config.global_compression_ratio is not None:
188+
assert serialized_config.global_compression_ratio > 1.0
189+
assert serialized_config.global_compression_ratio < 8.0
189190

190191

191192
def _test_layer_quantization_status(

0 commit comments

Comments
 (0)