File tree Expand file tree Collapse file tree 2 files changed +42
-10
lines changed Expand file tree Collapse file tree 2 files changed +42
-10
lines changed Original file line number Diff line number Diff line change @@ -6,24 +6,43 @@ torchao.quantization
6
6
7
7
.. currentmodule:: torchao.quantization
8
8
9
+ Main Quantization APIs
10
+ ----------------------
11
+
9
12
.. autosummary::
10
13
:toctree: generated/
11
14
:nosignatures:
12
15
13
- autoquant
14
16
quantize_
15
- int8_dynamic_activation_int4_weight
16
- int8_dynamic_activation_int8_weight
17
+ autoquant
18
+
19
+ Quantization APIs for ``quantize_``
20
+ -----------------------------------
21
+
22
+ .. autosummary::
23
+ :toctree: generated/
24
+ :nosignatures:
25
+
17
26
int4_weight_only
18
27
int8_weight_only
28
+ int8_dynamic_activation_int4_weight
29
+ int8_dynamic_activation_int8_weight
30
+ uintx_weight_only
31
+ gemlite_uintx_weight_only
32
+ intx_quantization_aware_training
33
+ from_intx_quantization_aware_training
19
34
float8_weight_only
20
35
float8_dynamic_activation_float8_weight
21
36
float8_static_activation_float8_weight
22
- uintx_weight_only
23
37
fpx_weight_only
24
- to_linear_activation_quantized
25
- swap_linear_with_smooth_fq_linear
26
- smooth_fq_linear_to_inference
38
+
39
+ Quantization Primitives
40
+ -----------------------
41
+
42
+ .. autosummary::
43
+ :toctree: generated/
44
+ :nosignatures:
45
+
27
46
choose_qparams_affine
28
47
choose_qparams_affine_with_min_max
29
48
choose_qparams_affine_floatx
@@ -40,3 +59,16 @@ torchao.quantization
40
59
ZeroPointDomain
41
60
TorchAODType
42
61
62
+ ..
63
+ TODO: delete these?
64
+
65
+ Other
66
+ -----
67
+
68
+ .. autosummary::
69
+ :toctree: generated/
70
+ :nosignatures:
71
+
72
+ to_linear_activation_quantized
73
+ swap_linear_with_smooth_fq_linear
74
+ smooth_fq_linear_to_inference
Original file line number Diff line number Diff line change @@ -10,9 +10,9 @@ torchao.sparsity
10
10
:toctree: generated/
11
11
:nosignatures:
12
12
13
- WandaSparsifier
14
- PerChannelNormObserver
15
- apply_fake_sparsity
16
13
sparsify_
17
14
semi_sparse_weight
18
15
int8_dynamic_activation_int8_semi_sparse_weight
16
+ apply_fake_sparsity
17
+ WandaSparsifier
18
+ PerChannelNormObserver
You can’t perform that action at this time.
0 commit comments