Fix broken Conv-BN-ReLU fusion from new Convert1DConvTo2D pass

JakeStevens · facebook-github-bot · commit d56fca110bf2 · 2026-05-13T09:57:58.000-07:00
Summary:
The pass checked for a batch norm following the conv, so that the squeeze it inserts would be placed after the batch norm and not break its fusion with the conv.

However, it did not support Conv -> Batch Norm -> ReLU or Conv -> ReLU.

This commit adds that support, along with support for the other fusable activations defined by the NeutronTargetSpec.

Reviewed By: rascani

Differential Revision: D105017469
diff --git a/backends/nxp/aten_passes/convert_1d_conv_to_2d.py b/backends/nxp/aten_passes/convert_1d_conv_to_2d.py
@@ -8,6 +8,7 @@
     try_get_tensor_constant_from_node,
 )
 from executorch.backends.nxp.backend.graph_utils import is_batch_norm
+from executorch.backends.nxp.backend.neutron_target_spec import NeutronTargetSpec
 from torch._subclasses import FakeTensor, FakeTensorMode
 from torch.ao.quantization.fx.utils import get_new_attr_name_with_prefix
 from torch.export.unflatten import _assign_attr, _AttrKind
@@ -26,9 +27,10 @@ class ConvertConv1dToConv2dPass(PassBase):
     r"""
     The NXP backend supports only 2D convolutions. Rewrite 1D convolutions into an equivalent 2D form by
     inserting a singleton spatial dimension and then remove it again.
-    If batch norm is present after the convolution, it is also converted from 1D to 2D.
+    If batch norm and/or a fusable activation (as defined by the NeutronTargetSpec) follow the convolution,
+    they are also kept in 2D (before the squeeze) so the partitioner can fuse them with the convolution.
 
-    Without batch norm:
+    Without batch norm or activation:
 
            x                         W                                x                           W
       [N, C1, H]               [I/O, I/O, k]                     [N, C1, H]                [I/O, I/O, 1, k]
@@ -90,8 +92,86 @@ class ConvertConv1dToConv2dPass(PassBase):
                         ▼                                                           ▼
                     [N, C3, H]                                                  [N, C3, H]
                         y                                                           y
+
+    With activation (e.g. relu):
+
+           x                         W                                x                           W
+      [N, C1, H]               [I/O, I/O, k]                     [N, C1, H]                [I/O, I/O, 1, k]
+           │                         │                                │                           │
+           │                         │                      ┌─────────▼──────────┐                │
+           │                         │                      │  unsqueeze(x, -2)  │                │
+           │                         │                      └─────────▼──────────┘                │
+           │                         │                                │                           │
+           │                         │                          [N, C1, 1, H]                     │
+           │                         │                                │                           │
+           └────────┐       ┌────────┘                                └──────────┐     ┌──────────┘
+                    │       │                                                    │     │
+           ┌────────▼───────▼───────┐                                   ┌────────▼─────▼────────┐
+           │       convolution      ◄──B [O]        replace             │      convolution      ◄──B [O]
+           │   (1D/transposed 1D)   │          ────────────────►        │   (2D/transposed 2D)  │
+           └────────────┬───────────┘                with               └───────────┬───────────┘
+                        │                                                           │
+                    [N, C2, H]                                                [N, C2, 1, H]
+                        │                                                           │
+                ┌───────▼───────┐                                           ┌───────▼───────┐
+                │     relu      │                                           │     relu      │
+                └───────┬───────┘                                           └───────┬───────┘
+                        │                                                           │
+                        │                                                     [N, C2, 1, H]
+                        │                                                           │
+                        │                                                   ┌───────▼────────┐
+                        │                                                   │   squeeze(-2)  │
+                        │                                                   └───────┬────────┘
+                        │                                                           │
+                        ▼                                                           ▼
+                    [N, C2, H]                                                  [N, C2, H]
+                        y                                                           y
+
+    With batch norm and activation:
+
+           x                         W                                x                           W
+      [N, C1, H]               [I/O, I/O, k]                     [N, C1, H]                [I/O, I/O, 1, k]
+           │                         │                                │                           │
+           │                         │                      ┌─────────▼──────────┐                │
+           │                         │                      │  unsqueeze(x, -2)  │                │
+           │                         │                      └─────────▼──────────┘                │
+           │                         │                                │                           │
+           │                         │                         [N, C1, 1, H]                      │
+           │                         │                                │                           │
+           └────────┐       ┌────────┘                                └──────────┐     ┌──────────┘
+                    │       │                                                    │     │
+           ┌────────▼───────▼───────┐                                   ┌────────▼─────▼────────┐
+           │       convolution      ◄──B [O]        replace             │      convolution      ◄──B [O]
+           │   (1D/transposed 1D)   │          ────────────────►        │   (2D/transposed 2D)  │
+           └────────────┬───────────┘                with               └───────────┬───────────┘
+                        │                                                           │
+                    [N, C2, H]                                                [N, C2, 1, H]
+                        │                                                           │
+                ┌───────▼───────┐                                           ┌───────▼───────┐
+                │   batch_norm  │                                           │   batch_norm  │
+                │      (1D)     │                                           │      (2D)     │
+                └───────┬───────┘                                           └───────┬───────┘
+                        │                                                           │
+                    [N, C3, H]                                                [N, C3, 1, H]
+                        │                                                           │
+                ┌───────▼───────┐                                           ┌───────▼───────┐
+                │     relu      │                                           │     relu      │
+                └───────┬───────┘                                           └───────┬───────┘
+                        │                                                           │
+                        │                                                     [N, C3, 1, H]
+                        │                                                           │
+                        │                                                   ┌───────▼────────┐
+                        │                                                   │   squeeze(-2)  │
+                        │                                                   └───────┬────────┘
+                        │                                                           │
+                        ▼                                                           ▼
+                    [N, C3, H]                                                  [N, C3, H]
+                        y                                                           y
     """
 
+    def __init__(self, neutron_target_spec: NeutronTargetSpec):
+        self.neutron_target_spec = neutron_target_spec
+
     @staticmethod
     def _is_conv_1d(node: Node) -> bool:
         return node.target == torch.ops.aten.conv1d.default
@@ -357,35 +437,43 @@ def call(self, graph_module: GraphModule) -> PassResult:
                 )
 
             old_1d_conv_users = list(old_1d_node.users.keys())
+            last_4d_node = new_2d_node
+            node_to_replace = old_1d_node
+            nodes_to_erase = []
+
             if len(old_1d_conv_users) == 1 and is_batch_norm(old_1d_conv_users[0]):
                 bn_1d_node = old_1d_conv_users[0]
-
-                # also convert batch_norm 1d to 2d
-                with self.graph_module.graph.inserting_after(new_2d_node):
+                with self.graph_module.graph.inserting_after(last_4d_node):
                     bn_2d_args = (new_2d_node,) + bn_1d_node.args[1:]
                     bn_2d_node = self._create_batch_norm_2d_node(*bn_2d_args)
-
-                with self.graph_module.graph.inserting_after(bn_2d_node):
-                    squeeze_target = torch.ops.aten.squeeze.dim
-
-                    out_sq_args = (bn_2d_node, -2)
-                    out_sq_node = self._create_sq_or_unsq_node(
-                        squeeze_target, *out_sq_args
-                    )
-
-                bn_1d_node.replace_all_uses_with(out_sq_node)
-                self.graph_module.graph.erase_node(bn_1d_node)
-
-            else:
-                with self.graph_module.graph.inserting_after(new_2d_node):
-                    squeeze_target = torch.ops.aten.squeeze.dim
-
-                    out_sq_args = (new_2d_node, -2)
-                    out_sq_node = self._create_sq_or_unsq_node(
-                        squeeze_target, *out_sq_args
+                last_4d_node = bn_2d_node
+                node_to_replace = bn_1d_node
+                nodes_to_erase.append(bn_1d_node)
+                old_1d_conv_users = list(bn_1d_node.users.keys())
+
+            if len(
+                old_1d_conv_users
+            ) == 1 and self.neutron_target_spec.neutron_target_info.is_supported_fused_activation__aten(
+                old_1d_conv_users[0]
+            ):
+                act_1d_node = old_1d_conv_users[0]
+                with self.graph_module.graph.inserting_after(last_4d_node):
+                    act_2d_args = (last_4d_node,) + act_1d_node.args[1:]
+                    act_2d_node = self._create_sq_or_unsq_node(
+                        act_1d_node.target, *act_2d_args
                     )
-
-                old_1d_node.replace_all_uses_with(out_sq_node)
+                last_4d_node = act_2d_node
+                node_to_replace = act_1d_node
+                nodes_to_erase.append(act_1d_node)
+
+            with self.graph_module.graph.inserting_after(last_4d_node):
+                squeeze_target = torch.ops.aten.squeeze.dim
+                out_sq_args = (last_4d_node, -2)
+                out_sq_node = self._create_sq_or_unsq_node(squeeze_target, *out_sq_args)
+
+            node_to_replace.replace_all_uses_with(out_sq_node)
+            for n in reversed(nodes_to_erase):
+                self.graph_module.graph.erase_node(n)
 
             graph_module.graph.erase_node(old_1d_node)
             made_changes = True
diff --git a/backends/nxp/aten_passes/neutron_aten_pass_manager.py b/backends/nxp/aten_passes/neutron_aten_pass_manager.py
@@ -52,7 +52,7 @@ def _get_default_passes(neutron_target_spec, qat_mode: bool = False) -> list[Pas
         FuseLinearAndAddPass(),
         MoveActivationBeforeConcat(neutron_target_spec),
         ConvertDivToMulPass(),
-        ConvertConv1dToConv2dPass(),
+        ConvertConv1dToConv2dPass(neutron_target_spec),
     ]
 
     if not qat_mode:
diff --git a/backends/nxp/tests/BUCK b/backends/nxp/tests/BUCK
@@ -92,6 +92,26 @@ fbcode_target(_kind = python_pytest,
     ],
 )
 
+fbcode_target(_kind = python_pytest,
+    name = "test_convert_1d_conv_to_2d",
+    srcs = [
+        "test_convert_1d_conv_to_2d.py",
+    ],
+    env = {
+        "PYTEST_ADDOPTS": "--ignore-glob=*full_pipeline*  -k 'not full_pipeline'",
+    },
+    deps = [
+        "//caffe2:torch",
+        "//executorch/backends/nxp:aten_passes",
+        "//executorch/backends/nxp:neutron_backend",
+        ":executorch_pipeline",
+        ":models",
+        "fbsource//third-party/pypi/numpy:numpy",
+        "fbsource//third-party/pypi/pytest:pytest",
+        "fbsource//third-party/pypi/pytest-mock:pytest-mock",  # @manual
+    ],
+)
+
 fbcode_target(_kind = python_pytest,
     name = "test_integration",
     srcs = [
diff --git a/backends/nxp/tests/generic_tests/test_split_group_convolution.py b/backends/nxp/tests/generic_tests/test_split_group_convolution.py
@@ -161,7 +161,8 @@ def test_split_group_convolution__1d(
         # `ConvertConv1dToConv2dPass` is needed to convert `conv1d` to `conv2d`.
         # The 1d variant is not supported.
         modified_module = NeutronAtenPassManager(
-            neutron_target_spec, [SplitGroupConvolution(), ConvertConv1dToConv2dPass()]
+            neutron_target_spec,
+            [SplitGroupConvolution(), ConvertConv1dToConv2dPass(neutron_target_spec)],
         )(graph_module).graph_module
 
         # Verify that the behavior has not changed.
diff --git a/backends/nxp/tests/test_convert_1d_conv_to_2d.py b/backends/nxp/tests/test_convert_1d_conv_to_2d.py

Original file line number	Diff line number	Diff line change
`@@ -52,7 +52,7 @@ def _get_default_passes(neutron_target_spec, qat_mode: bool = False) -> list[Pas`
`52`	`52`	`FuseLinearAndAddPass(),`
`53`	`53`	`MoveActivationBeforeConcat(neutron_target_spec),`
`54`	`54`	`ConvertDivToMulPass(),`
`55`		`- ConvertConv1dToConv2dPass(),`
	`55`	`+ ConvertConv1dToConv2dPass(neutron_target_spec),`
`56`	`56`	`]`
`57`	`57`
`58`	`58`	`if not qat_mode:`