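Fix tutorials: pass a 2-D float8 weight scale in awq_like.py and import `_fake_quantize_affine` from `quant_primitives` in gptq_like.py (#2516)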

drisspg · web-flow · commit fe997580a6c5 · 2025-07-10T19:01:02.000-07:00
stack-info: PR: #2516, branch: drisspg/stack/83
diff --git a/tutorials/calibration_flow/awq_like.py b/tutorials/calibration_flow/awq_like.py
@@ -121,9 +121,12 @@ def weight_quant_func(weight):
                 weight, weight_scale, weight_zero_point, block_size, target_dtype
             )
         elif target_dtype == torch.float8_e4m3fn:
+            scale_2d = (
+                weight_scale.view(1, -1) if weight_scale.dim() == 1 else weight_scale
+            )
             return to_affine_quantized_floatx_static(
                 weight,
-                weight_scale,
+                scale_2d,
                 block_size,
                 target_dtype,
                 Float8Layout(mm_config=None),
diff --git a/tutorials/calibration_flow/gptq_like.py b/tutorials/calibration_flow/gptq_like.py
@@ -48,11 +48,11 @@
     LinearActivationQuantizedTensor,
     MappingType,
     PerTensor,
-    _fake_quantize_affine,
     quantize_,
     to_linear_activation_quantized,
 )
 from torchao.quantization.quant_api import _replace_with_custom_fn_if_matches_filter
+from torchao.quantization.quant_primitives import _fake_quantize_affine
 from torchao.quantization.transform_module import (
     register_quantize_module_handler,
 )

Original file line number	Diff line number	Diff line change
`@@ -48,11 +48,11 @@`
`48`	`48`	`LinearActivationQuantizedTensor,`
`49`	`49`	`MappingType,`
`50`	`50`	`PerTensor,`
`51`		`- _fake_quantize_affine,`
`52`	`51`	`quantize_,`
`53`	`52`	`to_linear_activation_quantized,`
`54`	`53`	`)`
`55`	`54`	`from torchao.quantization.quant_api import _replace_with_custom_fn_if_matches_filter`
	`55`	`+from torchao.quantization.quant_primitives import _fake_quantize_affine`
`56`	`56`	`from torchao.quantization.transform_module import (`
`57`	`57`	`register_quantize_module_handler,`
`58`	`58`	`)`