Skip to content

Commit cd062f2

Browse files
authored
Add parameter_name support to _intx_weight_only_transform (#3905)
1 parent 1efc5d0 commit cd062f2

2 files changed

Lines changed: 19 additions & 11 deletions

File tree

test/quantization/test_quant_api.py

Lines changed: 1 addition & 0 deletions
```diff
@@ -1046,6 +1046,7 @@ def test_fqn_to_config_non_weight_param(self):
             Int8DynamicActivationInt8WeightConfig(),
             Int8DynamicActivationIntxWeightConfig(),
             Int8StaticActivationInt8WeightConfig(),
+            IntxWeightOnlyConfig(),
             Float8WeightOnlyConfig(),
             Float8DynamicActivationFloat8WeightConfig(granularity=PerTensor()),
         ]
```

torchao/quantization/quant_api.py

Lines changed: 18 additions & 11 deletions
```diff
@@ -1813,26 +1813,33 @@ def _intx_weight_only_transform(
     module: torch.nn.Module,
     config: IntxWeightOnlyConfig,
     *,
+    parameter_name: str = "weight",
     custom_scale: Optional[torch.Tensor] = None,
     custom_zero_point: Optional[torch.Tensor] = None,
 ) -> torch.nn.Module:
-    assert hasattr(module, "weight"), (
-        "applying intx weight only quant requires module to have weight attribute"
-        + " but {module} does not have one"
+    assert hasattr(module, parameter_name), (
+        f"applying intx weight only quant requires module to have {parameter_name} attribute"
+        + f" but {module} does not have one"
     )
     new_weight = _intx_weight_only_quantize_tensor(
-        module.weight,
+        getattr(module, parameter_name),
         config,
         custom_scale=custom_scale,
         custom_zero_point=custom_zero_point,
     )
-    module.weight = torch.nn.Parameter(new_weight, requires_grad=False)
-
-    if isinstance(module, nn.Linear):
-        module.extra_repr = types.MethodType(_linear_extra_repr, module)
-    elif isinstance(module, nn.Embedding):
-        module.extra_repr = types.MethodType(_embedding_extra_repr, module)
-
+    setattr(
+        module,
+        parameter_name,
+        torch.nn.Parameter(new_weight, requires_grad=False),
+    )
+    module.extra_repr = types.MethodType(
+        partial(
+            _module_extra_repr,
+            original_extra_repr=module.extra_repr,
+            parameter_name=parameter_name,
+        ),
+        module,
+    )
     return module
```

18381845

0 commit comments

Comments
 (0)