[Rewriter]: introduce fuse_pad_into_conv (#2301)

Johansmm · Johansmm · commit e8660102c653 · 2025-06-24T20:14:22.000+02:00
diff --git a/onnxscript/rewriter/__init__.py b/onnxscript/rewriter/__init__.py
@@ -21,6 +21,7 @@
     collapse_slices,
     no_op,
     pattern,
+    fuse_pad_into_conv,
 )
 
 _ModelProtoOrIr = TypeVar("_ModelProtoOrIr", onnx.ModelProto, ir.Model)
@@ -30,6 +31,7 @@
     *cast_constant_of_shape.rules.rules,
     *collapse_slices.rules.rules,
     *basic_rules.basic_optimization_rules().rules,
+    *fuse_pad_into_conv.fuse_pad_into_conv_rule_set().rules,
 )
 
 
diff --git a/onnxscript/rewriter/fuse_pad_into_conv.py b/onnxscript/rewriter/fuse_pad_into_conv.py
@@ -0,0 +1,143 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+"""Fuses Pad nodes into the nodes that consume them. Supported fusion patterns:
+- Conv ∘ Pad          -> Conv
+"""
+
+import typing
+
+import numpy as np
+import onnx_ir as ir
+
+from onnxscript.rewriter import pattern as orp
+
+
+def fill_pads_with_axes(
+    pads: typing.Sequence[int], axes: typing.Sequence[int], rank: int
+) -> typing.List[int]:
+    """Expand ``pads`` given for ``axes`` only into pads covering all ``rank`` axes.
+
+    Args:
+        pads: Pad amounts laid out as all start values followed by all end
+            values, one start and one end per entry of ``axes``.
+        axes: Axes that ``pads`` refers to; must support ``in`` and ``.index``.
+        rank: Number of axes of the padded tensor.
+
+    Returns:
+        A list of ``2 * rank`` values: the start pads for axes ``0..rank-1``
+        followed by the end pads, with 0 for every axis missing from ``axes``.
+    """
+    begins = []
+    ends = []
+    count = len(axes)
+    for axis in range(rank):
+        if axis in axes:
+            # The end value of an axis sits ``count`` entries after its start.
+            position = axes.index(axis)
+            begins.append(pads[position])
+            ends.append(pads[position + count])
+        else:
+            begins.append(0)
+            ends.append(0)
+    return begins + ends
+
+
+class _FusePadConvBase(orp.RewriteRuleClassBase):
+    """Shared check/rewrite logic for rules fusing a ``Pad`` into its consumer.
+
+    Subclasses provide ``pattern`` (binding ``x``, ``pad`` and ``conv``) and may
+    extend ``check`` with constraints on the consuming node.
+    """
+
+    def __init__(self, name: str, as_function: bool = False):
+        # remove_nodes=False is forwarded to the base rule.
+        # NOTE(review): presumably this keeps a Pad that still has other
+        # consumers and leaves the cleanup of unused nodes to a later step --
+        # confirm against RewriteRuleClassBase.
+        super().__init__(name=name, remove_nodes=False, as_function=as_function)
+
+    @staticmethod
+    def _padded_axes(pnode: ir.Node, x_rank: int) -> typing.List[int]:
+        """Return the non-negative axes padded by ``pnode``.
+
+        Reads the optional ``axes`` input (index 3), mapping negative values to
+        ``x_rank + axis``. When that input is absent every axis of the input is
+        returned. The ``axes`` input must be a constant when it is present.
+        """
+        if len(pnode.inputs) > 3 and (axes := pnode.inputs[3]) is not None:
+            return [
+                int(axis) if axis >= 0 else x_rank + int(axis)
+                for axis in axes.const_value.numpy()
+            ]
+        return list(range(x_rank))
+
+    def rewrite(
+        self, op: ir.tape.Tape, x: ir.Value, pad: ir.Value, conv: ir.Value
+    ) -> ir.Value:
+        """Emit a copy of the consumer node reading ``x`` with the Pad folded in.
+
+        Args:
+            op: Builder used to create the replacement node.
+            x: Input of the matched Pad node.
+            pad: Output of the matched Pad node.
+            conv: Output of the matched consumer node.
+
+        Returns:
+            The output of the new node, whose ``pads`` attribute is the sum of
+            the consumer's existing ``pads`` (if any) and the spatial Pad values.
+        """
+        pnode = pad.producer()
+        cnode = conv.producer()
+
+        # Retrieve the padding and axes
+        x_rank = len(x.shape)
+        pad_pads = pnode.inputs[1].const_value.numpy().tolist()
+        axes = self._padded_axes(pnode, x_rank)
+
+        # Fulfill pad_pads in every dimension (filling with zero the other ones)
+        pad_pads = fill_pads_with_axes(pad_pads, axes, x_rank)
+
+        # Get only spatial pads: drop the first two axes from both the start
+        # half and the end half of the list.
+        new_pads = pad_pads[2:x_rank] + pad_pads[x_rank + 2 :]
+
+        # Replace conv pads = new + old
+        conv_attr: typing.MutableMapping[str, ir.Attr] = cnode.attributes.copy()
+        if "pads" in conv_attr:
+            new_pads = [
+                old + new for old, new in zip(conv_attr["pads"].as_ints(), new_pads)
+            ]
+        conv_attr["pads"] = ir.convenience.convert_attribute("pads", new_pads)
+
+        return op.op(
+            cnode.op_type,
+            inputs=(x, *cnode.inputs[1:]),
+            attributes=conv_attr,
+            domain=cnode.domain,
+            name=cnode.name,
+        )
+
+    def check(self, context, x: ir.Value, pad: ir.Value, conv: ir.Value) -> orp.MatchResult:
+        """Verify that the matched Pad can be folded into its consumer.
+
+        The match is rejected when the input shape is unknown, the Pad mode is
+        not ``constant``, the ``pads``/``constant_value``/``axes`` inputs are not
+        constants, the constant value is not 0, the number of pad values does
+        not match the padded axes, or any of the first two axes is padded.
+
+        Args:
+            context: Unused.
+            x: Input of the matched Pad node.
+            pad: Output of the matched Pad node.
+            conv: Output of the matched consumer node (unused here).
+
+        Returns:
+            A MatchResult, marked as failed with a reason when a constraint is
+            violated.
+        """
+        del context  # Unused
+        check_result = orp.MatchResult()
+        pnode = pad.producer()
+
+        # The rank is required to resolve negative axes; fail the match instead
+        # of raising on len(None) when the shape is not known.
+        if x.shape is None:
+            return check_result.fail(f"Input shape of {pnode.name} is unknown.")
+        x_rank = len(x.shape)
+
+        # Pad constraints: attributes
+        if (mode := pnode.attributes.get("mode", None)) and mode.as_string() != "constant":
+            return check_result.fail(f"{pnode.name} mode must be 'constant'.")
+
+        # Pad constraints: inputs
+        if len(pnode.inputs) < 2 or (pads := pnode.inputs[1]) is None:
+            return check_result.fail(f"{pnode.name} has no pads input.")
+        if pads.const_value is None:
+            return check_result.fail(f"{pads.name} is not a constant/initializer.")
+        if len(pnode.inputs) > 2 and (constant_value := pnode.inputs[2]) is not None:
+            if constant_value.const_value is None:
+                return check_result.fail(
+                    f"{constant_value.name} is not a constant/initializer."
+                )
+            elif constant_value.const_value.numpy().item() != 0:
+                return check_result.fail(f"{constant_value.name} must be equal to 0.")
+        if (
+            len(pnode.inputs) > 3
+            and (axes := pnode.inputs[3]) is not None
+            and axes.const_value is None
+        ):
+            return check_result.fail(f"{axes.name} is not a constant/initializer.")
+        axes_list = self._padded_axes(pnode, x_rank)
+
+        # Pad constraints: values
+        pads_values = pads.const_value.numpy().tolist()
+        if len(pads_values) != 2 * len(axes_list):
+            # Guards the indexing done by fill_pads_with_axes.
+            return check_result.fail(
+                f"{pads.name} must hold one start and one end value per padded axis."
+            )
+        pads_list = fill_pads_with_axes(pads_values, axes_list, x_rank)
+        if np.any(pads_list[:2] + pads_list[x_rank : x_rank + 2]):
+            return check_result.fail(f"{pads.name} must be zero in non-spatial dimensions.")
+
+        return check_result
+
+
+class FusePadConv(_FusePadConvBase):
+    """Replaces ``Conv(Pad(x))`` with ``Conv(x)``."""
+
+    def __init__(self, as_function: bool = False):
+        super().__init__(name="FusePadConv", as_function=as_function)
+
+    def pattern(self, op: ir.tape.Tape, x: ir.Value) -> ir.Value:
+        # Match a Conv whose first input is produced by a Pad applied to ``x``.
+        # The Pad and Conv outputs are bound to the names "pad" and "conv",
+        # which are the parameters received by ``check`` and ``rewrite``.
+        return op.Conv(
+            op.Pad(x, _allow_other_inputs=True, _outputs=["pad"]),
+            _allow_other_inputs=True,
+            _outputs=["conv"],
+        )
+
+    def check(self, context, x: ir.Value, pad: ir.Value, conv: ir.Value) -> orp.MatchResult:
+        # Run the shared Pad constraints first and stop if they produced a
+        # failure reason.
+        check_result = super().check(context, x, pad, conv)
+        if check_result.reason:
+            return check_result
+
+        # Conv constraints: attributes
+        # An absent ``auto_pad`` attribute is accepted; a present one must be
+        # the string "NOTSET".
+        cnode = conv.producer()
+        if (apad := cnode.attributes.get("auto_pad", None)) and apad.as_string() != "NOTSET":
+            return check_result.fail(f"{cnode.name} auto_pad must be 'NOTSET'.")
+        return check_result
+
+
+# Rule instance created from FusePadConv; returned inside the rule set built
+# by fuse_pad_into_conv_rule_set().
+fuse_pad_into_conv = FusePadConv.rule()
+
+
+def fuse_pad_into_conv_rule_set() -> orp.RewriteRuleSet:
+    """Build the rule set that fuses Pad nodes into the node consuming them.
+
+    Supported consumers:
+    - Conv
+
+    Returns:
+        RewriteRuleSet
+    """
+    rules = [fuse_pad_into_conv]
+    return orp.RewriteRuleSet(rules)
diff --git a/onnxscript/rewriter/fuse_pad_into_conv_test.py b/onnxscript/rewriter/fuse_pad_into_conv_test.py
@@ -0,0 +1,212 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+import typing
+import unittest
+
+import numpy as np
+import onnx_ir as ir
+import parameterized
+from onnx_ir.passes.common import onnx_checker
+
+from onnxscript.rewriter import pattern as orp
+from onnxscript.rewriter import testing
+from onnxscript.rewriter.fuse_pad_into_conv import (
+    fuse_pad_into_conv,
+    fuse_pad_into_conv_rule_set,
+)
+
+
+def _clone_model(model: ir.Model) -> ir.Model:
+    """Return a copy of ``model`` made by a round trip through its proto form."""
+    proto = ir.to_proto(model)
+    return ir.from_proto(proto)
+
+
+class FusePadConvBaseTest(unittest.TestCase):
+    """Common helpers to build ``Pad -> Conv`` models for the fusion tests."""
+
+    @property
+    def rng(self):
+        # A new generator with the same fixed seed is created on every access,
+        # so every use restarts the same random sequence.
+        return np.random.default_rng(20250522)
+
+    def get_conv_weights(
+        self, shape: typing.Sequence[int], tape: ir.tape.Tape | None = None
+    ):
+        """Create random float32 weights named "W".
+
+        Args:
+            shape: Shape of the weight tensor.
+            tape: When given, the tensor is registered as an initializer on it
+                and the value returned by ``tape.initializer`` is returned.
+
+        Returns:
+            The weight tensor, or its initializer value when ``tape`` is given.
+        """
+        w = ir.tensor(self.rng.uniform(-0.5, 0.5, shape).astype("float32"), name="W")
+        if tape is not None:
+            w = tape.initializer(w)
+        return w
+
+    def build_model(
+        self,
+        input_shape: ir.Shape,
+        weight_shape: typing.Sequence[int],
+        pad_inputs: typing.Sequence[ir.TensorProtocol | ir.Value | None],
+        pad_attributes: typing.Mapping[str, ir.Attr] | None = None,
+        conv_attributes: typing.Mapping[str, ir.Attr] | None = None,
+        opset_imports: typing.Mapping[str, int] | None = None,
+    ) -> ir.Model:
+        """Build and validate a model computing ``Y = Conv(Pad(X, ...), W)``.
+
+        Args:
+            input_shape: Shape of the graph input ``X``.
+            weight_shape: Shape of the random Conv weights.
+            pad_inputs: Inputs of Pad after ``X``. Tensors become initializers,
+                ``ir.Value`` entries become extra graph inputs, floats become
+                Constant nodes and ``None`` is passed through unchanged.
+            pad_attributes: Attributes of the Pad node.
+            conv_attributes: Attributes of the Conv node.
+            opset_imports: Opset imports of the graph; defaults to ``{"": 20}``.
+
+        Returns:
+            The model, after running the ONNX checker pass on it.
+
+        Raises:
+            ValueError: If an entry of ``pad_inputs`` has an unsupported type.
+        """
+        # Build a fresh mapping per call so that models never share (and cannot
+        # mutate) a single default dictionary.
+        opset_imports = {"": 20} if opset_imports is None else dict(opset_imports)
+
+        tape = ir.tape.Tape()
+        inputs = []
+        # Keep the first dimension and mark every other output dimension "?".
+        output_shape = ir.Shape((input_shape[0],) + ("?",) * (len(input_shape) - 1))
+
+        # Convert pad_inputs to initializers (if needed)
+        pad_inputs = list(pad_inputs)
+        for idx, pad_input in enumerate(pad_inputs):
+            if isinstance(pad_input, ir.TensorProtocol):
+                pad_inputs[idx] = tape.initializer(pad_input)
+            elif isinstance(pad_input, ir.Value):
+                inputs.append(pad_input)
+            elif isinstance(pad_input, float):
+                pad_inputs[idx] = tape.op(
+                    "Constant", inputs=[], attributes={"value_float": pad_input}
+                )
+            elif pad_input is not None:
+                raise ValueError(
+                    f"Unsupported type for pad input ({pad_input}): {type(pad_input)}."
+                )
+
+        # Register operations in the tape
+        x = ir.Input("X", shape=input_shape, type=ir.TensorType(ir.DataType.FLOAT))
+        y = tape.op("Pad", inputs=[x, *pad_inputs], attributes=pad_attributes)
+        y = tape.op(
+            "Conv",
+            inputs=[y, self.get_conv_weights(weight_shape, tape)],
+            attributes=conv_attributes,
+            output=ir.Input("Y", shape=output_shape, type=ir.TensorType(x.dtype)),
+        )
+
+        # Build the model
+        ir_model = ir.Model(
+            ir.Graph(
+                inputs=[x, *inputs],
+                outputs=[y],
+                nodes=tape.nodes,
+                initializers=tape.initializers,
+                opset_imports=opset_imports,
+                name="model",
+            ),
+            ir_version=9,
+        )
+        onnx_checker.CheckerPass(True)(ir_model)
+        return ir_model
+
+
+class FusePadConvTest(FusePadConvBaseTest):
+    # Tests for the Pad -> Conv fusion rule: one parameterized test for cases
+    # where the fusion applies and one for cases where it must be rejected.
+
+    # Each case is (Pad pads, Pad axes, existing Conv pads); every case is run
+    # once without a constant_value input and once with constant_value 0.0.
+    @parameterized.parameterized.expand(
+        [
+            (pad_pads, const_value, axes, conv_pads)
+            for pad_pads, axes, conv_pads in [
+                ([0, 0, 2, 2, 0, 0, 2, 2], None, None),
+                ([0, 2, 2, 0, 2, 2], ir.tensor([1, -2, -1], name="axes"), [2, 0, 2, 0]),
+                ([1, 1, 1, 1], ir.tensor([-2, 3], name="axes"), [0, 1, 0, 1]),
+            ]
+            for const_value in [None, 0.0]
+        ]
+    )
+    def test_fuse_pad_into_conv(self, pad_pads, const_value, axes, conv_pads):
+        """The rule fuses the Pad and the fused model gives identical outputs."""
+        pad_inputs = [ir.tensor(pad_pads, name="pads")]
+        # constant_value is appended (possibly as None) whenever axes follows,
+        # so that axes lands at input index 3.
+        if const_value is not None or axes is not None:
+            pad_inputs.append(const_value)
+        if axes is not None:
+            pad_inputs.append(axes)
+        base_model = self.build_model(
+            input_shape=ir.Shape(("N", 32, 14, 16)),
+            weight_shape=(10, 32, 3, 3),
+            pad_inputs=pad_inputs,
+            conv_attributes={"pads": conv_pads},
+        )
+        updated_model = _clone_model(base_model)
+
+        # Apply rule
+        count = fuse_pad_into_conv_rule_set().apply_to_model(updated_model)
+
+        # Check that Pad was fused
+        self.assertEqual(count, 1)
+        self.assertEqual(updated_model.graph.num_nodes(), 1)
+        onnx_checker.CheckerPass(True)(updated_model)
+
+        # Check inference
+        # atol=0 and rtol=0: the outputs of both models must match exactly.
+        inputs = self.rng.random((1, 32, 14, 16), dtype="float32")
+        testing.assert_numerically_equal(base_model, updated_model, (inputs,), atol=0, rtol=0)
+
+    # Each case is (Pad mode, pads, constant_value, axes, Conv auto_pad,
+    # expected failure reason), where the reason is used as a regex.
+    @parameterized.parameterized.expand(
+        [
+            (
+                "constant",
+                ir.tensor([1] * 10, name="pads"),
+                ir.tensor([0.0], name="const_value"),
+                None,
+                "NOTSET",
+                "must be zero in non-spatial dimensions",
+            ),
+            (
+                "constant",
+                ir.tensor([0, 0, 0, 0], name="pads"),
+                ir.tensor([1.0], name="const_value"),
+                ir.tensor([0, -1], name="axes"),
+                "NOTSET",
+                "must be equal to 0.",
+            ),
+            (
+                "edge",
+                ir.tensor([0, 0, 0, 0], name="pads"),
+                ir.tensor([0.0], name="const_value"),
+                ir.tensor([0, -1], name="axes"),
+                "NOTSET",
+                "mode must be 'constant'.",
+            ),
+            (
+                "constant",
+                ir.Value(
+                    name="pads", shape=ir.Shape([4]), type=ir.TensorType(ir.DataType.INT64)
+                ),
+                None,
+                ir.tensor([0, -1], name="axes"),
+                "NOTSET",
+                "pads is not a constant/initializer.",
+            ),
+            (
+                "constant",
+                ir.tensor([0] * 10, name="pads"),
+                ir.Value(
+                    name="cval", shape=ir.Shape([1]), type=ir.TensorType(ir.DataType.FLOAT)
+                ),
+                None,
+                "NOTSET",
+                "cval is not a constant",
+            ),
+            (
+                "constant",
+                ir.tensor([0, 0, 0, 0], name="pads"),
+                None,
+                ir.Value(
+                    name="axes", shape=ir.Shape([2]), type=ir.TensorType(ir.DataType.INT64)
+                ),
+                "NOTSET",
+                "axes is not a constant",
+            ),
+            (
+                "constant",
+                ir.tensor([0, 0, 0, 0], name="pads"),
+                ir.tensor([0.0], name="const_value"),
+                ir.tensor([0, -1], name="axes"),
+                "VALID",
+                "auto_pad must be 'NOTSET'.",
+            ),
+        ]
+    )
+    def test_unsupported_fuse_pad_into_conv(
+        self, mode, pads, const_value, axes, auto_pad, err_msg
+    ):
+        """The rule is not applied and the tracer reports the expected reason."""
+        base_model = self.build_model(
+            input_shape=ir.Shape(("N", 32, 14, 16, 12)),
+            weight_shape=(10, 32, 3, 4, 5),
+            pad_inputs=[pads, const_value, axes],
+            pad_attributes={"mode": mode},
+            conv_attributes={"auto_pad": auto_pad},
+        )
+
+        # Apply rule and check it was not applied
+        tracer = orp.MatchingTracer()
+        count = fuse_pad_into_conv.apply_to_model(base_model, tracer=tracer)
+        self.assertEqual(count, 0)
+
+        # Check that the error message is the expected one
+        tracer_match = tracer.best_matches_map[fuse_pad_into_conv][0]
+        self.assertEqual(tracer_match.status.value, orp.MatchStatus.CONDITION_FAILED)
+        self.assertRegex(tracer_match.match_result.reason, err_msg)
+
+
+# Run the tests of this module when the file is executed as a script.
+if __name__ == "__main__":
+    unittest.main()

Original file line number	Diff line number	Diff line change
`@@ -21,6 +21,7 @@`
`21`	`21`	`collapse_slices,`
`22`	`22`	`no_op,`
`23`	`23`	`pattern,`
	`24`	`+ fuse_pad_into_conv,`
`24`	`25`	`)`
`25`	`26`
`26`	`27`	`_ModelProtoOrIr = TypeVar("_ModelProtoOrIr", onnx.ModelProto, ir.Model)`
`@@ -30,6 +31,7 @@`
`30`	`31`	`*cast_constant_of_shape.rules.rules,`
`31`	`32`	`*collapse_slices.rules.rules,`
`32`	`33`	`*basic_rules.basic_optimization_rules().rules,`
	`34`	`+ *fuse_pad_into_conv.fuse_pad_into_conv_rule_set().rules,`
`33`	`35`	`)`
`34`	`36`
`35`	`37`