Skip to content

Commit d4affd4

Browse files
committed
Merge branch 'kylesayrs/map_module_to_scheme' into kylesayrs/reduce-quantized-compression-memory
2 parents 43736a9 + f324af7 commit d4affd4

File tree

3 files changed

+9
-24
lines changed

3 files changed

+9
-24
lines changed

src/compressed_tensors/compressors/model_compressors/model_compressor.py

Lines changed: 1 addition & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -19,18 +19,7 @@
1919
import re
2020
from contextlib import contextmanager
2121
from copy import deepcopy
22-
from typing import (
23-
TYPE_CHECKING,
24-
Any,
25-
Callable,
26-
Dict,
27-
List,
28-
Optional,
29-
Set,
30-
Tuple,
31-
TypeVar,
32-
Union,
33-
)
22+
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Set, TypeVar, Union
3423

3524
import compressed_tensors
3625
import torch
@@ -44,7 +33,6 @@
4433
from compressed_tensors.compressors.base import BaseCompressor
4534
from compressed_tensors.compressors.sparse_compressors import DenseCompressor
4635
from compressed_tensors.config import CompressionFormat, SparsityCompressionConfig
47-
from compressed_tensors.linear.compressed_linear import CompressedLinear
4836
from compressed_tensors.quantization import (
4937
DEFAULT_QUANTIZATION_METHOD,
5038
QuantizationConfig,

src/compressed_tensors/compressors/quantized_compressors/base.py

Lines changed: 7 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@
1414

1515
import logging
1616
from pathlib import Path
17-
from typing import Any, Dict, Generator, Optional, Tuple, Union
17+
from typing import Any, Dict, Generator, Tuple, Union
1818

1919
import torch
2020
from compressed_tensors.compressors.base import BaseCompressor
@@ -119,10 +119,8 @@ def compress(
119119
compressed_dict[prefix + key] = value.to(save_device)
120120

121121
else:
122-
# omit saving zero points for symmetric quantization
123-
if name.endswith("zero_point") and not self._should_save_zp(
124-
name, names_to_scheme
125-
):
122+
# omit saving zero points for symmetric or packed quantization
123+
if name.endswith("zero_point") and self._skip_zp(name, names_to_scheme):
126124
continue
127125

128126
# omit saving for g_idx if uninitialized
@@ -134,7 +132,7 @@ def compress(
134132

135133
return compressed_dict
136134

137-
def _should_save_zp(
135+
def _skip_zp(
138136
self, name: str, names_to_scheme: Dict[str, QuantizationScheme]
139137
) -> bool:
140138
from compressed_tensors.compressors import PackedQuantizationCompressor
@@ -150,16 +148,16 @@ def _should_save_zp(
150148
args = scheme.output_activations
151149

152150
symmetric = args.symmetric
153-
packable_strats = [
151+
packable_strategies = [
154152
QuantizationStrategy.GROUP.value,
155153
QuantizationStrategy.CHANNEL.value,
156154
]
157155
packed = (
158156
isinstance(self, PackedQuantizationCompressor)
159-
and args.strategy in packable_strats
157+
and args.strategy in packable_strategies
160158
)
161159

162-
return not symmetric and not packed
160+
return symmetric or packed
163161

164162
def decompress(
165163
self,

src/compressed_tensors/utils/helpers.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -14,11 +14,10 @@
1414

1515
import warnings
1616
from functools import wraps
17-
from typing import TYPE_CHECKING, Any, Callable, Dict, List, Optional, Union
17+
from typing import TYPE_CHECKING, Any, Callable, Dict, List, Optional
1818

1919
import numpy
2020
import torch
21-
import tqdm
2221
from transformers import AutoConfig
2322

2423

0 commit comments

Comments
 (0)