diff --git a/torchao/quantization/__init__.py b/torchao/quantization/__init__.py index 67a70c5a35..739bd90909 100644 --- a/torchao/quantization/__init__.py +++ b/torchao/quantization/__init__.py @@ -39,6 +39,7 @@ AffineQuantizedObserverBase, ) from .quant_api import ( + AOPerModuleConfig, CutlassInt4PackedLayout, Float8DynamicActivationFloat8SemiSparseWeightConfig, Float8DynamicActivationFloat8WeightConfig, @@ -140,6 +141,7 @@ "UIntXWeightOnlyConfig", "FPXWeightOnlyConfig", "GemliteUIntXWeightOnlyConfig", + "AOPerModuleConfig", # smooth quant - subject to change "get_scale", "SmoothFakeDynQuantMixin",