@@ -7,26 +7,36 @@
 # pyre-strict

 import unittest
+from typing import Callable

 import torch
 from executorch.backends.cadence.aot.graph_builder import GraphBuilder
 from executorch.backends.cadence.aot.quantizer.patterns import AddmmPattern
-from executorch.exir.pass_base import NodeMetadata

 from executorch.backends.cadence.aot.quantizer.quantizer import (
     CadenceAtenQuantizer,
     CadenceDefaultQuantizer,
+    CadenceQuantizer,
     CadenceW8A32MixedQuantizer,
     CadenceWith16BitLinearActivationsQuantizer,
     CadenceWith16BitMatmulActivationsQuantizer,
     qconfig_A16,
     qconfig_A8W8,
 )
+from executorch.exir.pass_base import NodeMetadata
+from parameterized import parameterized
+from torch._ops import OpOverload
 from torchao.quantization.pt2e.quantizer.quantizer import (
     Q_ANNOTATION_KEY,
     QuantizationAnnotation,
+    QuantizationSpec,
 )

+# Type alias for graph builder functions
+GraphBuilderFn = Callable[
+    ["QuantizerAnnotationTest"], tuple[torch.fx.GraphModule, torch.fx.Node]
+]
+

 class QuantizerAnnotationTest(unittest.TestCase):
     """Unit tests for verifying quantizer annotations are correctly applied."""
@@ -53,22 +63,6 @@ def _build_matmul_graph(self) -> tuple[torch.fx.GraphModule, torch.fx.Node]:
         self.assertEqual(len(matmul_nodes), 1, "Should find exactly one matmul node")
         return gm, matmul_nodes[0]

-    def test_matmul_16bit_quantizer_annotation(self) -> None:
-        """Test that CadenceWith16BitMatmulActivationsQuantizer correctly annotates matmul."""
-        gm, matmul_node = self._build_matmul_graph()
-
-        quantizer = CadenceWith16BitMatmulActivationsQuantizer()
-        quantizer.annotate(gm)
-
-        annotation: QuantizationAnnotation = matmul_node.meta[Q_ANNOTATION_KEY]
-        self.assertTrue(annotation._annotated)
-
-        self.assertEqual(annotation.output_qspec, qconfig_A16.output_activation)
-
-        self.assertEqual(len(annotation.input_qspec_map), 2)
-        for _, input_qspec in annotation.input_qspec_map.items():
-            self.assertEqual(input_qspec, qconfig_A16.input_activation)
-
     def _build_linear_graph(self) -> tuple[torch.fx.GraphModule, torch.fx.Node]:
         """Build a simple graph with a linear operation (no bias)."""
         builder = GraphBuilder()
@@ -91,28 +85,65 @@ def _build_linear_graph(self) -> tuple[torch.fx.GraphModule, torch.fx.Node]:
         self.assertEqual(len(linear_nodes), 1, "Should find exactly one linear node")
         return gm, linear_nodes[0]

-    def test_linear_16bit_quantizer_annotation(self) -> None:
-        """Test that CadenceWith16BitLinearActivationsQuantizer correctly annotates linear."""
-        gm, linear_node = self._build_linear_graph()
+    @parameterized.expand(
+        [
+            (
+                "matmul_A16",
+                lambda self: self._build_matmul_graph(),
+                CadenceWith16BitMatmulActivationsQuantizer(),
+                torch.ops.aten.matmul.default,
+                qconfig_A16.output_activation,
+                # For matmul, both inputs are activations
+                [qconfig_A16.input_activation, qconfig_A16.input_activation],
+            ),
+            (
+                "linear_A16",
+                lambda self: self._build_linear_graph(),
+                CadenceWith16BitLinearActivationsQuantizer(),
+                torch.ops.aten.linear.default,
+                qconfig_A16.output_activation,
+                # For linear: [input_activation, weight]
+                [qconfig_A16.input_activation, qconfig_A16.weight],
+            ),
+        ]
+    )
+    def test_quantizer_annotation(
+        self,
+        name: str,
+        graph_builder_fn: GraphBuilderFn,
+        quantizer: CadenceQuantizer,
+        target: OpOverload,
+        expected_output_qspec: QuantizationSpec,
+        expected_input_qspecs: list[QuantizationSpec],
+    ) -> None:
+        """Parameterized test for quantizer annotations."""
+        gm, op_node = graph_builder_fn(self)

-        quantizer = CadenceWith16BitLinearActivationsQuantizer()
         quantizer.annotate(gm)

-        annotation: QuantizationAnnotation = linear_node.meta[Q_ANNOTATION_KEY]
+        annotation: QuantizationAnnotation = op_node.meta[Q_ANNOTATION_KEY]
         self.assertTrue(annotation._annotated)

-        # Verify output is annotated with qconfig_A16.output_activation (INT16)
-        self.assertEqual(annotation.output_qspec, qconfig_A16.output_activation)
-
-        # Verify inputs: activation (INT16) and weight (INT8)
-        self.assertEqual(len(annotation.input_qspec_map), 2)
-        for input_node, input_qspec in annotation.input_qspec_map.items():
-            if input_node == linear_node.args[0]:
-                # Activation input - should be INT16
-                self.assertEqual(input_qspec, qconfig_A16.input_activation)
-            elif input_node == linear_node.args[1]:
-                # Weight - should be INT8
-                self.assertEqual(input_qspec, qconfig_A16.weight)
+        # Verify output annotation
+        self.assertEqual(annotation.output_qspec, expected_output_qspec)
+
+        # Verify input annotations
+        # Build actual_specs in the fixed order defined by op_node.args
+        self.assertEqual(len(annotation.input_qspec_map), len(expected_input_qspecs))
+        actual_specs = [
+            annotation.input_qspec_map[op_node.args[i]]
+            for i in range(len(expected_input_qspecs))
+        ]
+
+        # Compare expected vs actual specs
+        for i, (expected, actual) in enumerate(
+            zip(expected_input_qspecs, actual_specs)
+        ):
+            self.assertEqual(
+                actual,
+                expected,
+                f"Input qspec mismatch at index {i}",
+            )


 class QuantizerOpsPreserveTest(unittest.TestCase):