diff --git a/torchao/quantization/quant_api.py b/torchao/quantization/quant_api.py index 7991383e16..56a2251fc4 100644 --- a/torchao/quantization/quant_api.py +++ b/torchao/quantization/quant_api.py @@ -884,11 +884,11 @@ def _int4_weight_only_transform( return module +@dataclass class Int8WeightOnlyConfig(AOBaseConfig): """ Configuration for applying int8 weight-only symmetric per-channel quantization to linear layers. """ - group_size: Optional[int] = None