Add expected-value tolerance check (atol/rtol) to QuantizedInputWrapper

ethansfng · web-flow · commit eabe49eaa2bc · 2026-03-09T22:03:45.000Z
Differential Revision: D95822313
Pull Request resolved: pytorch#18019
diff --git a/backends/cadence/aot/compiler_funcs.py b/backends/cadence/aot/compiler_funcs.py
@@ -258,29 +258,42 @@ class QuantizedInputWrapper(torch.nn.Module):
             If provided, extracts quant params from graph.
         quant_args: Optional dict mapping input index to (scale, zero_point, qmin, qmax, dtype).
             If provided, uses these directly instead of extracting from graph.
+        expected_inputs: Optional dict mapping input index to the expected
+            dequantized tensor. After dequantization, the result is compared
+            against these values using atol/rtol. Raises ValueError if exceeded.
+        atol: Absolute tolerance for the expected-value check (default 1e-4).
+        rtol: Relative tolerance for the expected-value check (default 1e-4).
 
     Example:
         # Extract from graph
         wrapper = QuantizedInputWrapper(quantized_module, input_names=["x"])
 
-        # Explicit quant args
+        # Explicit quant args with expected-value validation
         wrapper = QuantizedInputWrapper(
             quantized_module,
             quant_args={0: (1/255, 0, 0, 255, torch.uint8)},
+            expected_inputs={0: reference_float_tensor},
+            atol=1e-3,
         )
     """
 
     def __init__(
         self,
         module: GraphModule,
         input_args: Optional[Union[list[str], dict[int, QuantArgs]]] = None,
+        expected_inputs: Optional[dict[int, torch.Tensor]] = None,
+        atol: float = 1e-4,
+        rtol: float = 1e-4,
     ) -> None:
         super().__init__()
         self.module: GraphModule = module
         self.quant_args: dict[int, QuantArgs] = {}
         self.expected_shapes: dict[int, tuple[int, ...]] = (
             extract_input_shapes_from_graph(module)
         )
+        self.expected_inputs: Optional[dict[int, torch.Tensor]] = expected_inputs
+        self.atol: float = atol
+        self.rtol: float = rtol
 
         if input_args is not None:
             logger.warning(
@@ -317,6 +330,23 @@ def forward(self, *args: torch.Tensor) -> Any:
                 )
             dequantized_args.append(node)
 
+        # Check dequantized values against expected inputs
+        expected_inputs = self.expected_inputs
+        if expected_inputs is not None:
+            for index, expected in expected_inputs.items():
+                if index >= len(dequantized_args):
+                    continue
+                actual = dequantized_args[index]
+                if not torch.allclose(actual, expected, atol=self.atol, rtol=self.rtol):
+                    max_abs_diff = (actual - expected).abs().max().item()
+                    mean_abs_diff = (actual - expected).abs().mean().item()
+                    msg = (
+                        f"Dequantized input at index {index} differs from expected value: "
+                        f"max_abs_diff={max_abs_diff:.6g}, mean_abs_diff={mean_abs_diff:.6g} "
+                        f"(atol={self.atol}, rtol={self.rtol})"
+                    )
+                    raise ValueError(msg)
+
         return self.module(*dequantized_args)