
Commit ecb6c4b (1 parent: b10876b)

Remove compute target from intx_opaque_tensor (#2960)

* Remove compute target from intx_opaque_tensor
* up
* up
* up
* up
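For downstream users, this commit collapses the old `packing_format` + `compute_target` pair into a single `intx_packing_format` enum value. A minimal before/after sketch (the model and the `IntxPackingFormat` import path are illustrative assumptions, not taken from this commit):

```python
import torch
from torchao.quantization import quantize_
from torchao.quantization.quant_api import Int8DynamicActivationIntxWeightConfig
from torchao.quantization.granularity import PerGroup
# Import path assumed: IntxPackingFormat is defined in the quantization
# workflows package and re-exported from torchao.quantization.
from torchao.quantization import IntxPackingFormat

model = torch.nn.Sequential(torch.nn.Linear(512, 256))

# Before this commit (two knobs):
#   Int8DynamicActivationIntxWeightConfig(
#       ...,
#       packing_format=IntxPackingFormat.OPAQUE,
#       compute_target="torchao_auto",
#       version=2,
#   )

# After this commit (one knob):
config = Int8DynamicActivationIntxWeightConfig(
    weight_dtype=torch.int4,
    weight_granularity=PerGroup(64),
    intx_packing_format=IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
    version=2,
)
quantize_(model, config)
```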

File tree: 5 files changed (+112, −112 lines)


test/quantization/quantize_/workflows/intx/test_intx_opaque_tensor.py (19 additions, 29 deletions)

```diff
@@ -35,11 +35,11 @@ def _get_accuracy_test_cases():
     ]

     PACKING_FORMATS = [
-        (IntxPackingFormat.UNPACKED_TO_INT8, None),
-        (IntxPackingFormat.OPAQUE, "aten"),
-        (IntxPackingFormat.OPAQUE, "torchao_auto"),
-        (IntxPackingFormat.OPAQUE, "torchao_lowbit"),
-        (IntxPackingFormat.OPAQUE, "torchao_kleidiai"),
+        IntxPackingFormat.UNPACKED_TO_INT8,
+        IntxPackingFormat.OPAQUE_ATEN_KLEIDIAI,
+        IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
+        IntxPackingFormat.OPAQUE_TORCHAO_KLEIDIAI,
+        IntxPackingFormat.OPAQUE_TORCHAO_LOWBIT,
     ]

     WEIGHT_DTYPES = [
@@ -64,13 +64,12 @@ def _get_accuracy_test_cases():
     def _is_valid_test_combination(
         model_dtype,
         packing_format,
-        compute_target,
         weight_dtype,
         weight_mapping_type,
         weight_granularity,
     ):
         # ATEN restrictions
-        if (packing_format == IntxPackingFormat.OPAQUE) and (compute_target == "aten"):
+        if packing_format == IntxPackingFormat.OPAQUE_ATEN_KLEIDIAI:
             if weight_dtype != torch.int4:
                 return False
             if weight_mapping_type == MappingType.ASYMMETRIC:
@@ -79,9 +78,7 @@ def _is_valid_test_combination(
                 return False

         # TORCHAO_KLEIDIAI restrictions
-        if (packing_format == IntxPackingFormat.OPAQUE) and (
-            compute_target == "torchao_kleidiai"
-        ):
+        if packing_format == IntxPackingFormat.OPAQUE_TORCHAO_KLEIDIAI:
             if weight_dtype != torch.int4:
                 return False
             if weight_mapping_type == MappingType.ASYMMETRIC:
@@ -100,17 +97,16 @@ def _is_valid_test_combination(
         param(
             model_dtype=mdt,
             packing_format=pf,
-            compute_target=ct,
             weight_dtype=dt,
             weight_mapping_type=mt,
             weight_granularity=gr,
         )
         for mdt in MODEL_DTYPES
-        for pf, ct in PACKING_FORMATS
+        for pf in PACKING_FORMATS
         for dt in WEIGHT_DTYPES
         for mt in MAPPING_TYPES
         for gr in GRANULARITIES
-        if _is_valid_test_combination(dt, pf, ct, dt, mt, gr)
+        if _is_valid_test_combination(dt, pf, dt, mt, gr)
     ]

     return test_cases
@@ -126,7 +122,6 @@ def test_accuracy(
         self,
         model_dtype,
         packing_format,
-        compute_target,
         weight_dtype,
         weight_mapping_type,
         weight_granularity,
@@ -149,8 +144,7 @@ def test_accuracy(
                 weight_dtype=weight_dtype,
                 weight_granularity=weight_granularity,
                 weight_mapping_type=weight_mapping_type,
-                packing_format=packing_format,
-                compute_target=compute_target,
+                intx_packing_format=packing_format,
                 version=2,
             ),
         )
@@ -162,8 +156,7 @@ def test_accuracy(
                 weight_dtype=weight_dtype,
                 weight_granularity=weight_granularity,
                 weight_mapping_type=weight_mapping_type,
-                packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
-                compute_target=None,
+                intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
                 version=2,
             ),
         )
@@ -209,8 +202,7 @@ def test_export_compile_aoti(
                 weight_dtype=weight_dtype,
                 weight_granularity=weight_granularity,
                 weight_mapping_type=weight_mapping_type,
-                packing_format=IntxPackingFormat.OPAQUE,
-                compute_target="torchao_auto",
+                intx_packing_format=IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
                 version=2,
             ),
         )
@@ -241,15 +233,15 @@ def test_export_compile_aoti(

     @parameterized.expand(
         [
-            param(packing_format=pf, compute_target=ct)
-            for (pf, ct) in [
-                (IntxPackingFormat.OPAQUE, "torchao_auto"),
-                (IntxPackingFormat.OPAQUE, "aten"),
+            param(packing_format=pf)
+            for pf in [
+                IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
+                IntxPackingFormat.OPAQUE_ATEN_KLEIDIAI,
             ]
         ],
         name_func=lambda f, _, params: f.__name__ + f"_{params.kwargs}",
     )
-    def test_serialization(self, packing_format, compute_target):
+    def test_serialization(self, packing_format):
         layers = [
             torch.nn.Linear(512, 256),
         ]
@@ -262,8 +254,7 @@ def test_serialization(self, packing_format, compute_target):
             Int8DynamicActivationIntxWeightConfig(
                 weight_dtype=torch.int4,
                 weight_granularity=PerGroup(64),
-                packing_format=packing_format,
-                compute_target=compute_target,
+                intx_packing_format=packing_format,
                 version=2,
             ),
         )
@@ -305,8 +296,7 @@ def test_moe_quant_intx(self):
         out = model(x).clone()

         base_config = Int8DynamicActivationIntxWeightConfig(
-            packing_format=IntxPackingFormat.OPAQUE,
-            compute_target="torchao_auto",
+            intx_packing_format=IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
             version=2,
         )
         moe_config = MoEQuantConfig(
```
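The tuples removed from PACKING_FORMATS map one-to-one onto the new enum members. A small reference sketch of that correspondence (the dict itself is illustrative; only the names come from the diff above):

```python
# Old (packing_format, compute_target) pair -> new IntxPackingFormat member,
# as implied by the PACKING_FORMATS change above. Spelled as strings here
# purely for illustration.
OLD_TO_NEW = {
    ("UNPACKED_TO_INT8", None): "UNPACKED_TO_INT8",
    ("OPAQUE", "aten"): "OPAQUE_ATEN_KLEIDIAI",
    ("OPAQUE", "torchao_auto"): "OPAQUE_TORCHAO_AUTO",
    ("OPAQUE", "torchao_kleidiai"): "OPAQUE_TORCHAO_KLEIDIAI",
    ("OPAQUE", "torchao_lowbit"): "OPAQUE_TORCHAO_LOWBIT",
}
```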

test/quantization/quantize_/workflows/intx/test_intx_unpacked_to_int8_tensor.py (6 additions, 6 deletions)

```diff
@@ -158,7 +158,7 @@ def test_export_int8_dyn_act_intx_weight_config(self):
                 weight_dtype=torch.int4,
                 weight_granularity=PerAxis(0),
                 weight_mapping_type=MappingType.SYMMETRIC,
-                packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
+                intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
                 version=2,
             ),
         )
@@ -194,7 +194,7 @@ def test_export_int8_dyn_act_intx_weight_config_with_unwrap(self):
                 weight_dtype=torch.int4,
                 weight_granularity=PerGroup(64),
                 weight_mapping_type=MappingType.SYMMETRIC,
-                packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
+                intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
                 version=2,
             ),
         )
@@ -232,7 +232,7 @@ def test_serialization_int8_dyn_act_intx_weight_config(self):
             Int8DynamicActivationIntxWeightConfig(
                 weight_dtype=torch.int4,
                 weight_granularity=PerGroup(64),
-                packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
+                intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
                 version=2,
             ),
         )
@@ -262,7 +262,7 @@ def test_serialization_intx_weight_only_config(self):
             IntxWeightOnlyConfig(
                 weight_dtype=torch.int4,
                 granularity=PerGroup(64),
-                packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
+                intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
                 version=2,
             ),
         )
@@ -321,7 +321,7 @@ def test_qat_int8_dyn_act_intx_weight_config(
             weight_granularity=PerGroup(group_size),
             weight_mapping_type=mapping_type,
             weight_scale_dtype=scale_dtype,
-            packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
+            intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
             version=2,
         )

@@ -429,7 +429,7 @@ def test_intx_unpacked_v2_is_close_to_qdq_v1(
                 weight_mapping_type=mapping_type,
                 weight_scale_dtype=scale_dtype,
                 act_mapping_type=act_mapping_type,
-                packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
+                intx_packing_format=IntxPackingFormat.UNPACKED_TO_INT8,
                 version=2,
             ),
         )
```

torchao/quantization/quant_api.py (18 additions, 18 deletions)

```diff
@@ -745,10 +745,8 @@ class Int8DynamicActivationIntxWeightConfig(AOBaseConfig):
     weight_scale_dtype: Optional[torch.dtype] = None
     act_mapping_type: MappingType = MappingType.ASYMMETRIC
     layout: Layout = QDQLayout()
-    packing_format: IntxPackingFormat = IntxPackingFormat.UNPACKED_TO_INT8
+    intx_packing_format: IntxPackingFormat = IntxPackingFormat.UNPACKED_TO_INT8

-    # Used with IntxPackingFormat.OPAQUE
-    compute_target: Optional[str] = None
     version: int = 1

     def __post_init__(self):
@@ -804,8 +802,7 @@ def _int8_dynamic_activation_intx_weight_quantize_tensor(weight, bias, config):
     weight_scale_dtype = config.weight_scale_dtype
     act_mapping_type = config.act_mapping_type
     layout = config.layout
-    packing_format = config.packing_format
-    compute_target = config.compute_target
+    intx_packing_format = config.intx_packing_format

     assert weight.dim() == 2, (
         f"Int8DynamicActivationIntxWeightConfig only works for 2-d Tensor, got: {weight.dim()}"
@@ -826,10 +823,16 @@ def _int8_dynamic_activation_intx_weight_quantize_tensor(weight, bias, config):

     if config.version == 2:
         assert act_mapping_type == MappingType.ASYMMETRIC
-        assert packing_format in [
-            IntxPackingFormat.UNPACKED_TO_INT8,
-            IntxPackingFormat.OPAQUE,
-        ], f"Unsupported packing format: {packing_format}"
+        opaque_formats = [
+            IntxPackingFormat.OPAQUE_ATEN_KLEIDIAI,
+            IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
+            IntxPackingFormat.OPAQUE_TORCHAO_KLEIDIAI,
+            IntxPackingFormat.OPAQUE_TORCHAO_LOWBIT,
+        ]
+        assert (
+            intx_packing_format == IntxPackingFormat.UNPACKED_TO_INT8
+            or intx_packing_format in opaque_formats
+        ), f"Unsupported packing format: {intx_packing_format}"
         new_weight = IntxUnpackedToInt8Tensor.from_hp(
             weight,
             block_size,
@@ -845,12 +848,9 @@ def _int8_dynamic_activation_intx_weight_quantize_tensor(weight, bias, config):
             new_bias = bias

         # Create packed tensor
-        if packing_format == IntxPackingFormat.OPAQUE:
-            assert compute_target is not None, (
-                "Must specify a compute target for IntxPackingFormat.OPAQUE"
-            )
+        if intx_packing_format in opaque_formats:
             new_weight = IntxOpaqueTensor.from_intx_unpacked_to_int8_tensor(
-                new_weight, bias=new_bias, compute_target=compute_target
+                new_weight, bias=new_bias, intx_packing_format=intx_packing_format
             )
             new_bias = None  # bias is packed with weights

@@ -2113,7 +2113,7 @@ class IntxWeightOnlyConfig(AOBaseConfig):
     mapping_type: MappingType = MappingType.SYMMETRIC
     scale_dtype: Optional[torch.dtype] = None
     layout: Layout = QDQLayout()
-    packing_format: IntxPackingFormat = IntxPackingFormat.UNPACKED_TO_INT8
+    intx_packing_format: IntxPackingFormat = IntxPackingFormat.UNPACKED_TO_INT8
     version: int = 1

     def __post_init__(self):
@@ -2142,7 +2142,7 @@ def _intx_weight_only_quantize_tensor(weight, config):
     mapping_type = config.mapping_type
     scale_dtype = config.scale_dtype
     layout = config.layout
-    packing_format = config.packing_format
+    intx_packing_format = config.intx_packing_format

     assert weight.dim() == 2, (
         f"IntxWeightOnlyConfig only works for 2-d Tensor, got: {weight.dim()}"
@@ -2160,7 +2160,7 @@ def _intx_weight_only_quantize_tensor(weight, config):
     block_size = (1, group_size)

     if config.version == 2:
-        if config.packing_format == IntxPackingFormat.UNPACKED_TO_INT8:
+        if config.intx_packing_format == IntxPackingFormat.UNPACKED_TO_INT8:
             new_weight = IntxUnpackedToInt8Tensor.from_hp(
                 weight,
                 block_size,
@@ -2174,7 +2174,7 @@ def _intx_weight_only_quantize_tensor(weight, config):

             return new_weight
         else:
-            raise ValueError(f"Unsupported packing format: {intx_packing_format}")
+            raise ValueError(f"Unsupported packing format: {intx_packing_format}")

     # Version 1
     quant_min, quant_max = _DTYPE_TO_QVALUE_BOUNDS[weight_dtype]
```
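Distilled, the new version-2 path in quant_api.py becomes a single membership test: UNPACKED_TO_INT8 keeps the IntxUnpackedToInt8Tensor, and any of the four opaque variants is repacked into an IntxOpaqueTensor. A self-contained sketch of that control flow (member names come from the diff; the enum string values and helper are assumptions for illustration):

```python
from enum import Enum

class IntxPackingFormat(str, Enum):
    # Member names come from the diff; the string values are assumed.
    UNPACKED_TO_INT8 = "unpacked_to_int8"
    OPAQUE_ATEN_KLEIDIAI = "opaque_aten_kleidiai"
    OPAQUE_TORCHAO_AUTO = "opaque_torchao_auto"
    OPAQUE_TORCHAO_KLEIDIAI = "opaque_torchao_kleidiai"
    OPAQUE_TORCHAO_LOWBIT = "opaque_torchao_lowbit"

OPAQUE_FORMATS = {
    IntxPackingFormat.OPAQUE_ATEN_KLEIDIAI,
    IntxPackingFormat.OPAQUE_TORCHAO_AUTO,
    IntxPackingFormat.OPAQUE_TORCHAO_KLEIDIAI,
    IntxPackingFormat.OPAQUE_TORCHAO_LOWBIT,
}

def choose_tensor_subclass(fmt: IntxPackingFormat) -> str:
    """Illustrative stand-in for the dispatch in
    _int8_dynamic_activation_intx_weight_quantize_tensor."""
    if fmt == IntxPackingFormat.UNPACKED_TO_INT8:
        return "IntxUnpackedToInt8Tensor"  # weight stays unpacked
    if fmt in OPAQUE_FORMATS:
        return "IntxOpaqueTensor"  # repacked; bias is folded into the weights
    raise ValueError(f"Unsupported packing format: {fmt}")

assert choose_tensor_subclass(IntxPackingFormat.OPAQUE_TORCHAO_AUTO) == "IntxOpaqueTensor"
```

Folding the compute target into the format name also removes an invalid region of the config space (OPAQUE with no compute target) that previously had to be guarded by an explicit assert.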
