pytorch · drisspg · Jul 11, 2025 · Jul 10, 2025
diff --git a/tutorials/calibration_flow/awq_like.py b/tutorials/calibration_flow/awq_like.py
@@ -121,9 +121,12 @@ def weight_quant_func(weight):
                 weight, weight_scale, weight_zero_point, block_size, target_dtype
             )
         elif target_dtype == torch.float8_e4m3fn:
+            scale_2d = (
+                weight_scale.view(1, -1) if weight_scale.dim() == 1 else weight_scale
+            )
             return to_affine_quantized_floatx_static(
                 weight,
-                weight_scale,
+                scale_2d,
                 block_size,
                 target_dtype,
                 Float8Layout(mm_config=None),

diff --git a/tutorials/calibration_flow/gptq_like.py b/tutorials/calibration_flow/gptq_like.py
@@ -48,11 +48,11 @@
     LinearActivationQuantizedTensor,
     MappingType,
     PerTensor,
-    _fake_quantize_affine,
     quantize_,
     to_linear_activation_quantized,
 )
 from torchao.quantization.quant_api import _replace_with_custom_fn_if_matches_filter
+from torchao.quantization.quant_primitives import _fake_quantize_affine
 from torchao.quantization.transform_module import (
     register_quantize_module_handler,
 )