From 5516caf8a5d5aa96fdc6b4d49d6043ca79b8dfc5 Mon Sep 17 00:00:00 2001
From: Justin Chu <justinchuby@users.noreply.github.com>
Date: Thu, 18 Sep 2025 10:43:47 -0700
Subject: [PATCH 1/2] [rewriter] Remove generic pattern matcher

It is obsolete and the capability is covered by the simple pattern matcher

Signed-off-by: Justin Chu <justinchuby@users.noreply.github.com>
---
 onnxscript/rewriter/_rewrite_rule.py        |   7 +-
 onnxscript/rewriter/generic_pattern.py      | 702 --------------------
 onnxscript/rewriter/generic_pattern_test.py | 607 -----------------
 3 files changed, 1 insertion(+), 1315 deletions(-)
 delete mode 100644 onnxscript/rewriter/generic_pattern.py
 delete mode 100644 onnxscript/rewriter/generic_pattern_test.py

diff --git a/onnxscript/rewriter/_rewrite_rule.py b/onnxscript/rewriter/_rewrite_rule.py
index af0165dea0..8964230fe0 100644
--- a/onnxscript/rewriter/_rewrite_rule.py
+++ b/onnxscript/rewriter/_rewrite_rule.py
@@ -82,12 +82,7 @@ def __init__(
         if isinstance(matcher, _matcher.PatternMatcher):
             self._matcher = matcher
         elif matcher is None:
-            if target_pattern.has_single_output_node:
-                self._matcher = _matcher.SimplePatternMatcher(self._target_pattern)
-            else:
-                import onnxscript.rewriter.generic_pattern as generic_pattern
-
-                self._matcher = generic_pattern.GenericPatternMatcher(self._target_pattern)
+            self._matcher = _matcher.SimplePatternMatcher(self._target_pattern)
         else:
             self._matcher = matcher(self._target_pattern)
         self._verbose = verbose
diff --git a/onnxscript/rewriter/generic_pattern.py b/onnxscript/rewriter/generic_pattern.py
deleted file mode 100644
index 12827b3116..0000000000
--- a/onnxscript/rewriter/generic_pattern.py
+++ /dev/null
@@ -1,702 +0,0 @@
-# Copyright (c) Microsoft Corporation.
-# Licensed under the MIT License.
-from __future__ import annotations
-
-import collections
-import inspect
-import os
-import textwrap
-import warnings
-from typing import Any, Callable, Iterator, Sequence
-
-import onnxscript.rewriter.pattern as orp
-from onnxscript import ir
-
-
-class PatternMatchResult:
-    """Stores information about a match if a match was successful.
-
-    * pattern: the GraphPattern which found this result
-    * model_nodes: the graph nodes that matched the pattern
-    * matched_pattern_to_model_value: a mapping from ValuePattern to ir.Value
-    * kwargs: additional attributes the user may add through the method
-        :meth:`PatternMatchResult.add_kwargs`
-    """
-
-    def __init__(
-        self,
-        pattern: orp.GraphPattern,
-        model_nodes: Sequence[ir.Node],
-    ):
-        pattern_nodes: list[orp.NodePattern] = list(pattern)
-        assert len(model_nodes) == len(pattern_nodes)
-        self.pattern = pattern
-        self.model_nodes = model_nodes
-        self.kwargs: dict[str, Any] = {}
-        self.matched_pattern_to_model_value: dict[orp.ValuePattern, ir.Value] = {}
-
-        for graph_node, pattern_node in zip(model_nodes, pattern_nodes):
-            assert graph_node.op_identifier() == pattern_node.op_identifier(), (
-                f"Unexpected type mismatch {graph_node.op_identifier()!r} != {pattern_node.op_identifier()!r}"
-            )
-            assert len(graph_node.inputs) == len(pattern_node.inputs), (
-                f"Unexpected number of inputs for type {graph_node.op_identifier()}"
-            )
-            for a, b in zip(graph_node.inputs, pattern_node.inputs):
-                if b is None:
-                    # optional input or not an interesting input
-                    continue
-                self._bind(b, a)
-
-            assert len(graph_node.outputs) == len(pattern_node.outputs), (
-                f"Unexpected number of outputs for type {graph_node.op_identifier()}"
-            )
-            for a, b in zip(graph_node.outputs, pattern_node.outputs):
-                self._bind(b, a)
-
-    def _bind(self, value_pattern: orp.ValuePattern, value: ir.Value) -> None:
-        map = self.matched_pattern_to_model_value
-        if value_pattern in map:
-            assert map[value_pattern] == value, (
-                f"Ambiguities, pattern output {value_pattern!r} means "
-                f"{value!r} or {map[value_pattern]}"
-            )
-        else:
-            map[value_pattern] = value
-
-    def add_kwargs(self, name: str, value: Any):
-        """Adds an attribute, it can be done when the match is being validated,
-        this attribute can be used when building the replacement nodes.
-        """
-        self.kwargs[name] = value
-
-    def __repr__(self) -> str:
-        return (
-            f"PatternMatchResult: {len(self.model_nodes)} nodes ..., {self.pattern.inputs}, "
-            f"{self.pattern.outputs})"
-        )
-
-
-def _to_match_result(pmr: PatternMatchResult) -> orp.MatchResult:
-    """Converts a PatternMatchResult into a MatchResult.
-
-    TODO: This is a temporary hack until MatchResult and PatternMatchResult are unified.
-    """
-    result = orp.MatchResult()
-    for node in pmr.model_nodes:
-        result.add_node(node)
-
-    for var, val in pmr.matched_pattern_to_model_value.items():
-        if var.name is not None:
-            result.bind(var.name, val)
-    result.outputs.extend([pmr.matched_pattern_to_model_value[v] for v in pmr.pattern.outputs])
-    return result
-
-
-def _value_to_str(value: ir.Value | orp.ValuePattern) -> str:
-    return value.name if value.name is not None else "anonymous:" + str(id(value))
-
-
-def _opt_value_to_str(value: ir.Value | orp.ValuePattern | None) -> str:
-    return _value_to_str(value) if value is not None else "None"
-
-
-def _node_to_str(node: ir.Node | orp.NodePattern) -> str:
-    inputs = ", ".join(_opt_value_to_str(input) for input in node.inputs)
-    outputs = ", ".join(_opt_value_to_str(output) for output in node.outputs)
-    op_type = node.op_type
-    domain = str(node.domain)
-    qualified_op = f"{domain}.{op_type}" if domain else op_type
-    return f"{outputs} = {qualified_op}({inputs})"
-
-
-# def _pattern_node_to_str(node: orp.NodePattern) -> str:
-#     inputs = ", ".join(_opt_value_to_str(input) for input in node.inputs)
-#     outputs = ", ".join(_opt_value_to_str(output) for output in node.outputs)
-#     return f"{outputs} = {node.op_type}({inputs})"
-
-
-class GenericPatternMatcher(orp.PatternMatcher):
-    """
-    Implements a pattern optimization for quick experimentation.
-
-    Current limitation:
-
-    * The current implementation does match on domain name (easy fix).
-    * It does not compares attributes either (easy fix as well).
-    """
-
-    def __init__(self, pattern: orp.GraphPattern) -> None:
-        super().__init__(pattern)
-
-    def enumerate_matches(
-        self,
-        model: ir.Model,
-        graph_or_function: ir.Graph | ir.Function,
-        node: ir.Node | None = None,
-        verbose: int = 0,
-    ) -> Iterator:
-        """Enumerates all the matches."""
-        if node is None:
-            matched = []
-            for node in graph_or_function:
-                res = self.match(model, graph_or_function, node, verbose=verbose)
-                if res:
-                    matched.append(res)
-                    yield res
-        else:
-            res = self.match(model, graph_or_function, node, verbose=verbose)
-            if res:
-                yield res
-
-    def none(
-        self,
-        node: ir.Node | None = None,
-        lineno: int | None = None,
-        msg: str = "",
-    ) -> None:
-        """Must be called every time a match fails to trace it.
-
-        It may be useful which reason made a pattern matching fail.
-        Instead of returning None, method *match* can return the following
-        expression:
-
-        ::
-
-            return self.none(node, inspect.currentframe().f_lineno)
-
-        By setting the verbosity (see next Section), the user may then know
-        which lines in the code returned None and which condition failed.
-        If logs are fully enabled, it shows information about matched none
-        and the line deciding the matched failed.
-        For example, this tells the matching failed at line 601 in ``generic_pattern.py``.
-        It happens when propagating the match in the backward directions.
-        The unmatched types are Mul, MatMul and below,
-        it shows the matched nodes. The first one was Cast.
-        And the failure happened at iteration 5.
-        ``139774002356544-139774000632672`` is the pair of ids used in container ``matched``.
-        ``id(node)`` is used as a unique identifiers of the nodes.
-
-        ::
-
-            [RotaryEmbeddingPattern.match] NONE - line: 601:__main__, op_type=Cast
-                --hint--: BACKWARD: different node types
-                --pattern
-                Mul(pos_ids, cast) -> (mul)
-                -- model
-                MatMul(/_original_modu...Expand_output_0, /_original_modu...b/Cast_output_0) -> (/_original_modu...MatMul_output_0)
-                iteration=5
-                --matched-- #6
-                Cast(/_original_modu...mb/Cos_output_0) ~ Cast(cos) [139774002356544-139774000632672]
-                Cos(/_original_modu...ncat_1_output_0) ~ Cos(concattraining-transpose-0) [139774002356448-139774000632048]
-                ConcatTraining(/_original_modu...nspose_output_0,/_original_modu...nspose_output_0) ~ ConcatTraining(transpose,transpose) [139774002356352-139774000631712]
-                Transpose(/_original_modu...MatMul_output_0) ~ Transpose(mul) [139774002356256-139774000631184]
-                Sin(/_original_modu...ncat_1_output_0) ~ Sin(concattraining-transpose-0) [139774002358512-139774000631568]
-                Cast(/_original_modu...mb/Sin_output_0) ~ Cast(sin) [139774002358608-139774000632384]
-                len(stack)=0:[]
-
-        'hints' are not added everywhere. More can easily be added with method ``_hint``.
-        """
-        if node and self.verbose:
-            if self.verbose >= 10:
-                if hasattr(self, "_debug"):
-                    msg2 = self._debug_print()
-                    if msg2:
-                        msg2 = f"\n{textwrap.indent(msg2, '    ')}"
-                else:
-                    msg2 = ""
-                print(
-                    f"[{self.__class__.__name__}.match] Match failed at line: {lineno}:"
-                    f"{os.path.split(self.__class__.__module__)[-1]}, "
-                    f"op_type={node.op_type}{msg}{msg2}"
-                )
-        return None
-
-    def print_match(self, graph_node: ir.Node, pattern_node: orp.NodePattern) -> str:
-        s1 = _node_to_str(graph_node)
-        s2 = _node_to_str(pattern_node)
-        return f"match {s1} with pattern: {s2}"
-
-    def _debug_print(self) -> str:
-        if not hasattr(self, "_debug"):
-            return ""
-
-        def _s(s: str) -> str:
-            if len(s) <= 30:
-                return s
-            return f"{s[:15]}...{s[-15:]}"
-
-        def _p(n: ir.Node, full: bool = False) -> str:
-            if full:
-                return str(n)
-            return _node_to_str(n)
-
-        rows = []
-        for k, v in sorted(self._debug.items()):
-            if k == "stack":
-                rows.append(f"len({k})={len(v)}:{v}")  # type: ignore[arg-type]
-                continue
-            if k == "iteration":
-                rows.append(f"{k}={v}")
-                continue
-            if k == "matched":
-                rows.append(f"--matched-- #{len(v)}")  # type: ignore[arg-type]
-                for pattern_node, graph_node in v.items():
-                    rows.append(
-                        f"  {_p(pattern_node)} ~ {_p(graph_node)} [{id(pattern_node)}-{id(graph_node)}]"
-                    )
-                continue
-            if k == "hint":
-                rows.append(f"--hint--: {v[0]}")  # type: ignore[arg-type]
-                for i in v[1:]:
-                    if isinstance(i, str):
-                        rows.append("  " + i)
-                    if isinstance(i, ir.Node):
-                        rows.append("  " + _p(i, full=True))
-                continue
-            if k in {"node", "pattern", "pattern_node", "pattern_nodes"}:
-                continue
-            rows.append(f"-- not shown {k}")
-
-        return "\n".join(rows)
-
-    def _hint(self, *args: Any) -> None:
-        """Add debugging information to help users."""
-        self._debug["hint"] = args
-
-    def _match_backward(
-        self,
-        starting_node: ir.Node,
-        matched: dict[orp.NodePattern, ir.Node],
-        stack: list[orp.NodePattern],
-        graph_node: ir.Node,
-        pattern_node: orp.NodePattern,
-    ) -> int | None:
-        """
-        Matches backward.
-
-        Args:
-            starting_node: root node (the node the matched begain with, used only for debugging)
-            matched: nodes of the pattern matched as already matched
-            stack: next node to look into
-            graph_node: node coming from the graph
-            pattern_node: node coming from the pattern
-
-        Returns:
-            number of matched nodes, None or False to indicate a failed match
-        """
-        match_count = 0
-
-        # predecessors
-        if len(graph_node.inputs) != len(pattern_node.inputs):
-            # not the same number of inputs
-            self._hint(
-                "BACKWARD: not the same number of inputs",
-                "-- pattern",
-                pattern_node,
-                "-- model",
-                graph_node,
-            )
-            return self.none(starting_node, inspect.currentframe().f_lineno)
-
-        for graph_input, pattern_input in zip(graph_node.inputs, pattern_node.inputs):
-            if len(graph_input.uses()) != len(pattern_input.uses()):
-                self._hint(
-                    "BACKWARD: one input is used outside the pattern",
-                    "-- pattern",
-                    pattern_node,
-                    "-- model",
-                    graph_node,
-                )
-                return self.none(starting_node, inspect.currentframe().f_lineno)
-
-        for graph_value, pattern_value in zip(graph_node.inputs, pattern_node.inputs):
-            # TODO(rama): Handle constant-pattern
-            pattern_pred = pattern_value.producer()
-            if pattern_pred is None:
-                # pattern_pred is None means the pattern backward search ends here.
-                result = self._match_values_forward(
-                    starting_node, matched, stack, graph_value, pattern_value
-                )
-                if result is None:
-                    return result
-                match_count += result
-                continue
-            graph_pred = graph_value.producer()
-            if graph_pred is None:
-                # No node in the graph.
-                return self.none(starting_node, inspect.currentframe().f_lineno)
-            if graph_pred.op_identifier() != pattern_pred.op_identifier():
-                self._hint(
-                    "BACKWARD: different node types",
-                    "--pattern",
-                    _node_to_str(pattern_pred),
-                    "-- model",
-                    _node_to_str(graph_pred),
-                )
-                return self.none(starting_node, inspect.currentframe().f_lineno)
-            # matching backward
-            if pattern_pred not in matched:
-                if self.verbose >= 10:
-                    print(
-                        f"[GenericPattern._match_backward] {self.print_match(graph_pred, pattern_pred)}"
-                    )
-                matched[pattern_pred] = graph_pred
-                stack.append(pattern_pred)
-                match_count += 1
-        if self.verbose > 5 and match_count > 0:
-            print(f"[GenericPatternMatcher._match_backward] add {match_count} nodes")
-        return match_count
-
-    def _match_values_forward(
-        self,
-        starting_node: ir.Node,
-        matched: dict[orp.NodePattern, ir.Node],
-        stack: list[orp.NodePattern],
-        graph_value: ir.Value,
-        pattern_value: orp.ValuePattern,
-    ) -> int | None:
-        """
-        Matches forward.
-
-        Args:
-            starting_node: root node (the node the match begins with, used only for debugging)
-            matched: nodes of the pattern matched as already matched
-            stack: next node to look into
-            graph_value: value coming from the graph
-            pattern_value: pattern value coming from the pattern
-
-        Returns:
-            number of matched nodes to continue, None or False to indicate a failed match
-        """
-        match_count = 0
-        graph_node_users = [user for user, _ in graph_value.uses()]
-        pattern_node_users = [user for user, _ in pattern_value.uses()]
-        if not pattern_node_users:
-            # The pattern has no node forward, the matching stops.
-            return match_count
-        if len(graph_node_users) < len(pattern_node_users):
-            # Not enough node in the graph to match the pattern. A match is not possible
-            return self.none(starting_node, inspect.currentframe().f_lineno)
-
-        # Here comes the fun part, there is the same number of successors or more
-        # nodes in the graph to match with the pattern.
-        # And we have to handle the nodes already matched as found.
-        # Hopefully, there is only one option.
-
-        if len(graph_node_users) == len(pattern_node_users) == 1:
-            # Let's deal with the simple case
-            if graph_node_users[0].op_identifier() != pattern_node_users[0].op_identifier():
-                return self.none(starting_node, inspect.currentframe().f_lineno)
-
-            node = pattern_node_users[0]
-            if node not in matched:
-                if self.verbose >= 10:
-                    print(
-                        f"[GenericPatternMatcher._match_values_forward]{self.print_match(graph_node_users[0], pattern_node_users[0])}"
-                    )
-                matched[node] = graph_node_users[0]
-                stack.append(node)
-                match_count += 1
-            return match_count
-
-        # Let's remove the nodes already matched.
-        pattern_node_users_not_matched = [
-            unmatched_node
-            for unmatched_node in pattern_node_users
-            if unmatched_node not in matched
-        ]
-        pattern_node_users_matched = [
-            matched[matched_node]
-            for matched_node in pattern_node_users
-            if matched_node in matched
-        ]
-        assert len(pattern_node_users_matched) + len(pattern_node_users_not_matched) == len(
-            pattern_node_users
-        ), (
-            f"pattern_node_users_not_matched={pattern_node_users_not_matched}, "
-            f"pattern_node_users_matched={pattern_node_users_matched}, "
-            f"pattern_node_users={pattern_node_users}, "
-            f"matched={matched}"
-        )
-        free = list(set(graph_node_users) - set(pattern_node_users_matched))
-        if not pattern_node_users_not_matched:
-            # Everything is already matched.
-            return match_count
-        if len(free) < len(pattern_node_users_not_matched):
-            # Not enough successors to match the remaining patterns.
-            return self.none(starting_node, inspect.currentframe().f_lineno)
-        if len(pattern_node_users_not_matched) == len(free) == 1:
-            # Only one option again.
-            graph_node = free[0]
-            if pattern_node_users_not_matched[0].op_identifier() != graph_node.op_identifier():
-                return self.none(starting_node, inspect.currentframe().f_lineno)
-
-            key = pattern_node_users_not_matched[0]
-            if self.verbose >= 10:
-                print(
-                    f"[GenericPatternMatcher._match_values_forward] {self.print_match(graph_node, pattern_node_users_not_matched[0])}"
-                )
-            matched[key] = graph_node
-            stack.append(key)
-            match_count += 1
-            return match_count
-
-        # And now another fun part, let's try to handle the case when
-        # there is only one option, matching on node type only returns one
-        # option.
-        expected_op_type = [_.op_identifier() for _ in pattern_node_users_not_matched]
-        got_op_type = [_.op_identifier() for _ in free]
-
-        ec = collections.Counter(expected_op_type)
-        gc = collections.Counter(got_op_type)
-        if len(ec) != len(gc) or set(ec) != set(gc):
-            # unique operator types is different.
-            self._hint(
-                "FORWARD: unique operator types are different",
-                "-- pattern",
-                ec,
-                pattern_value,
-                "-- model",
-                gc,
-                graph_value,
-                "-- model-matched",
-                pattern_node_users_matched,
-            )
-            return self.none(starting_node, inspect.currentframe().f_lineno)
-        for k, v in ec.items():
-            if gc[k] < v:
-                # Not enough types to match.
-                return self.none(starting_node, inspect.currentframe().f_lineno)
-
-        # At this stage, we know matching the types is possible.
-        # We first mark whatever is possible.
-        ptype_to_node = {_.op_identifier(): _ for _ in pattern_node_users_not_matched}
-        gtype_to_node = {_.op_identifier(): _ for _ in free}
-        missing = []
-        for k, v in ec.items():
-            if gc[k] == v == 1:
-                key = id(ptype_to_node[k])
-                if key not in matched:
-                    if self.verbose >= 10:
-                        print(
-                            f"[GenericPatternMatcher._match_values_forward] match "
-                            f"{self.print_match(gtype_to_node[k], ptype_to_node[k])}"
-                        )
-                    matched[key] = gtype_to_node[k]
-                    stack.append(key)
-                    match_count += 1
-            else:
-                missing.append(k)
-
-        if not missing:
-            return match_count
-
-        # At this stage, there are mutiple options for matching. We can:
-        # 1. make assumptions and continue
-        # 2. mark the node as incomplete matching, we could end up stuck anyway.
-        raise NotImplementedError(
-            f"There are more than one option, this will be implemented later, ec={ec}, gc={gc}"
-        )
-
-    def _match_forward(
-        self,
-        starting_node: ir.Node,
-        matched: dict[orp.NodePattern, ir.Node],
-        stack: list[orp.NodePattern],
-        graph_node: ir.Node,
-        pattern_node: orp.NodePattern,
-    ) -> int | None:
-        """
-        Matches forward.
-
-        Args:
-            starting_node: root node (the node the match begins with, used only for debugging)
-            matched: nodes of the pattern matched as already matched
-            stack: next node to look into
-            graph_node: node coming from the graph
-            pattern_node: node coming from the pattern
-
-        Returns:
-            number of matched nodes to continue, None or False to indicate a failed match
-        """
-        match_count = 0
-
-        # successors
-        if len(graph_node.outputs) != len(pattern_node.outputs):
-            # not the same number of outputs
-            self._hint(
-                "FORWARD: not the same number of output_names",
-                "-- pattern",
-                pattern_node,
-                "-- model",
-                graph_node,
-            )
-            return self.none(starting_node, inspect.currentframe().f_lineno)
-
-        for graph_output, pattern_output in zip(graph_node.outputs, pattern_node.outputs):
-            result = self._match_values_forward(
-                starting_node, matched, stack, graph_output, pattern_output
-            )
-            if result is None:
-                return result
-            match_count += result
-
-        if self.verbose > 5 and match_count > 0:
-            print(f"[GenericPatternMatcher._match_forward] add {match_count} nodes")
-        return match_count
-
-    def match(
-        self,
-        model: ir.Model,
-        graph_or_function: ir.Graph | ir.Function,
-        node: ir.Node,
-        *,
-        verbose: int = 0,
-        remove_nodes: bool = True,
-        tracer: orp.MatchingTracer | None = None,
-    ) -> orp.MatchResult | None:
-        if not remove_nodes:
-            raise NotImplementedError(
-                "remove_nodes=False is not implemented in GenericPatternMatcher"
-            )
-        del model
-        del graph_or_function
-        self.verbose = verbose
-        self._debug = {}
-
-        # Let's match the last node.
-        # Then we need to match successors and predecessors.
-        last_pattern_node = self.pattern.node(-1)
-        if node.op_identifier() != last_pattern_node.op_identifier():
-            # The last node does not have the same op_identifier().
-            return self.none()
-
-        if self.verbose > 5:
-            print(
-                f"[GenericPatternMatcher.match] Matching started at node: {_node_to_str(node)}"
-            )
-            if self.verbose >= 10:
-                print(f"[GenericPatternMatcher.match] match pattern {self}")
-
-        all_pattern_nodes = set(self.pattern)
-        matched: dict[orp.NodePattern, ir.Node] = {last_pattern_node: node}
-        stack: list[orp.NodePattern] = [last_pattern_node]
-        iteration = 0
-
-        if self.verbose > 5:
-            self._debug = dict(
-                pattern=self.pattern,
-                matched=matched,
-                stack=stack,
-                iteration=iteration,
-                node=node,
-                pattern_node=last_pattern_node,
-                pattern_nodes=self.pattern,
-            )
-
-        max_iter = self.pattern.num_nodes() * 2
-        while stack and iteration < max_iter:
-            nodes_not_in_pattern = set(matched.keys()) - all_pattern_nodes
-            assert not nodes_not_in_pattern, (
-                f"Some nodes are not part of the pattern: {nodes_not_in_pattern}"
-                f"\nall_pattern_nodes={all_pattern_nodes}"
-            )
-
-            # TODO(justinchuby): Change to a for loop
-            iteration += 1
-            if self.verbose > 5:
-                print(
-                    f"[GenericPatternMatcher.match] iteration={iteration} "
-                    f"n_matched={len(matched)}, n_stack={len(stack)}, "
-                    f"matched_types={collections.Counter(_.op_identifier() for _ in matched)}"
-                )
-            next_pattern_node = stack.pop()
-            next_graph_node = matched[next_pattern_node]
-
-            result = self._match_backward(
-                node, matched, stack, next_graph_node, next_pattern_node
-            )
-            if result is None:
-                if self.verbose > 5:
-                    print("[GenericPatternMatcher.match] done. backward failed.")
-                return result
-
-            nodes_not_in_pattern = set(matched.keys()) - all_pattern_nodes
-            assert not nodes_not_in_pattern, (
-                f"Some nodes are not part of the pattern: {nodes_not_in_pattern}"
-            )
-
-            result = self._match_forward(
-                node, matched, stack, next_graph_node, next_pattern_node
-            )
-            if result is None:
-                if self.verbose > 5:
-                    print("[GenericPatternMatcher.match] done. forward failed.")
-                return result
-
-            nodes_not_in_pattern = set(matched.keys()) - all_pattern_nodes
-            assert not nodes_not_in_pattern, (
-                f"Some nodes are not part of the pattern: {nodes_not_in_pattern}"
-            )
-
-            if self.verbose > 5:
-                self._debug["iteration"] = iteration
-
-        if iteration >= max_iter and stack:
-            self._hint(f"reached {iteration}>={max_iter} iterations")
-            return self.none(node, inspect.currentframe().f_lineno)
-
-        if self.verbose > 5:
-            print(f"[GenericPatternMatcher.match] done. {len(matched)} matched nodes")
-
-        # At this point, the pattern is matched but let's make sure.
-        assert len(matched) == self.pattern.num_nodes(), (
-            f"Number of matched nodes is different, {len(matched)} matched nodes, "
-            f"and {len(self.pattern)} nodes in the pattern, matched is {matched}"
-        )
-        assert len(stack) == 0, f"There are still {len(stack)} nodes to explore."
-
-        # We order the matched nodes in the same order than the pattern
-        # to let next functions to be able to build the matching again.
-        matched_nodes = [matched[pattern_node] for pattern_node in self.pattern]
-        return _to_match_result(PatternMatchResult(self.pattern, matched_nodes))
-
-
-def make_pattern_rule(
-    match_pattern_function: Callable,
-    apply_pattern_function: Callable,
-    validate_mapping: Callable | None = None,
-    verbose: int = 0,
-) -> orp.RewriteRule:
-    """
-    Creates a rewriting rule from a callable or a function proto.
-
-    Args:
-        match_pattern_function: an onnxscript-like function that defines
-            the pattern subgraph (nodes) to be replaced
-        apply_pattern_function: an onnxscript-like function that constructs
-            the replacement subgraph (new nodes replacing the matched nodes)
-        validate_mapping: a function that validates the matching subgraph once
-            it is found. If it returns False the pattern is not applied.
-            If not specified, it is equivalent to a function that always return True
-        verbose: verbosity level
-
-    Returns:
-        the rewriting rule
-    """
-
-    warnings.warn(
-        "make_pattern_rule(...) is deprecated, use pattern.RewriteRule(...) instead",
-        FutureWarning,
-        stacklevel=2,
-    )
-    pattern = orp._to_graph_pattern(match_pattern_function)
-    matcher = GenericPatternMatcher(pattern)
-    return orp.RewriteRule(
-        pattern,
-        apply_pattern_function,
-        validate_mapping,
-        matcher,
-        verbose=verbose,
-    )
diff --git a/onnxscript/rewriter/generic_pattern_test.py b/onnxscript/rewriter/generic_pattern_test.py
deleted file mode 100644
index dadaf5e8bb..0000000000
--- a/onnxscript/rewriter/generic_pattern_test.py
+++ /dev/null
@@ -1,607 +0,0 @@
-# Copyright (c) Microsoft Corporation.
-# Licensed under the MIT License.
-from __future__ import annotations
-
-import contextlib
-import io
-import os
-import unittest
-
-import numpy as np
-import onnx
-import onnx.parser
-import onnx.reference
-import onnxruntime as ort
-import parameterized
-
-from onnxscript import ir
-from onnxscript.rewriter import generic_pattern, pattern
-
-FLOAT = onnx.TensorProto.FLOAT
-
-
-@parameterized.parameterized_class(
-    ("matcher_algo",),
-    [
-        (generic_pattern.GenericPatternMatcher,),
-        (pattern.SimplePatternMatcher,),
-    ],
-)
-class GenericPatternTest(unittest.TestCase):
-    def _range(self, *shape, bias: float | None = None):
-        n = np.prod(shape)
-        x = np.arange(n).astype(np.float32) / n
-        if bias:
-            x = x + bias
-        return x.reshape(tuple(shape)).astype(np.float32)
-
-    def test_graph_pattern_builder(self):
-        """Test replacing Add + Add by AddAdd."""
-
-        def match_pattern(op, x, y, z):
-            """Builds the pattern to match."""
-            tmp = op.Add(x, y)
-            return op.Add(tmp, z)
-
-        def apply_pattern(op, x, y, z, **_):
-            """Builds the replacement graph."""
-            return op.AddAdd(x, y, z, _domain="ZZZ")
-
-        def validate_mapping(context, x, y, z, **_) -> bool:
-            """Validates the mapping."""
-            del context
-            return True
-
-        rule = pattern.RewriteRule(
-            match_pattern,
-            apply_pattern,
-            validate_mapping,
-            self.matcher_algo,
-        )
-
-        class AddAdd(onnx.reference.op_run.OpRun):
-            op_domain = "ZZZ"
-
-            def _run(self, x, y, z):
-                return (x + y + z,)
-
-        model = onnx.helper.make_model(
-            onnx.helper.make_graph(
-                [
-                    onnx.helper.make_node("Add", ["x", "y"], ["gggg"]),
-                    onnx.helper.make_node("Add", ["gggg", "z"], ["final"]),
-                ],
-                "dummy",
-                [
-                    onnx.helper.make_tensor_value_info("x", FLOAT, [None, None]),
-                    onnx.helper.make_tensor_value_info("y", FLOAT, [None, None]),
-                    onnx.helper.make_tensor_value_info("z", FLOAT, [None, None]),
-                ],
-                [onnx.helper.make_tensor_value_info("final", FLOAT, [None, None])],
-            ),
-            opset_imports=[onnx.helper.make_opsetid("", 18)],
-            ir_version=9,
-        )
-        onnx.checker.check_model(model)
-
-        model = onnx.shape_inference.infer_shapes(model)
-        ir_model = ir.serde.deserialize_model(model)
-
-        rule.apply_to_model(ir_model)
-        self.assertEqual(
-            ["AddAdd"],
-            [n.op_type for n in ir_model.graph],
-        )
-        # TODO: do that in pattern.py.
-        ir_model.opset_imports["ZZZ"] = 1
-        rewriten_model = ir.serde.serialize_model(ir_model)
-        self.assertEqual(
-            ["AddAdd"],
-            [n.op_type for n in rewriten_model.graph.node],
-        )
-
-        feeds = {
-            "x": self._range(5, 6),
-            "y": self._range(5, 6),
-            "z": self._range(5, 6),
-        }
-        ref1 = onnx.reference.ReferenceEvaluator(model)
-        expected = ref1.run(None, feeds)
-
-        self.assertEqual(0, len(rewriten_model.graph.initializer))
-        opsets = {v.domain: v.version for v in rewriten_model.opset_import}
-        self.assertIn("ZZZ", opsets)
-        self.assertEqual(opsets["ZZZ"], 1)
-
-        ref2 = onnx.reference.ReferenceEvaluator(rewriten_model, new_ops=[AddAdd])
-        got = ref2.run(None, feeds)
-        np.testing.assert_almost_equal(expected[0], got[0])
-
-    def test_graph_pattern_builder_multi_outputs(self):
-        def match_pattern(op, x, y, w, z):
-            """Builds the pattern to match."""
-            tmp = op.Add(x, y)
-            tmp2 = op.Add(tmp, w)
-            r1 = op.Add(tmp, z)
-            return tmp2, r1
-
-        def apply_pattern(op, x, y, w, z, **_):
-            """Builds the pattern to match."""
-            return op.AddAddAddAdd(x, y, w, z, _domain="ZZZ", _outputs=2)
-
-        def validate_mapping(context, **_) -> bool:
-            return True
-
-        rule = pattern.RewriteRule(
-            match_pattern,
-            apply_pattern,
-            validate_mapping,
-            self.matcher_algo,
-            verbose=10,
-        )
-
-        class AddAddAddAdd(onnx.reference.op_run.OpRun):
-            op_domain = "ZZZ"
-
-            def _run(self, x, y, w, z):
-                return (x + y + w, x + y + z)
-
-        model = onnx.helper.make_model(
-            onnx.helper.make_graph(
-                [
-                    onnx.helper.make_node("Add", ["x", "y"], ["gggg"]),
-                    onnx.helper.make_node("Add", ["gggg", "w"], ["f1"]),
-                    onnx.helper.make_node("Add", ["gggg", "z"], ["f2"]),
-                ],
-                "dummy",
-                [
-                    onnx.helper.make_tensor_value_info("x", FLOAT, [None, None]),
-                    onnx.helper.make_tensor_value_info("y", FLOAT, [None, None]),
-                    onnx.helper.make_tensor_value_info("z", FLOAT, [None, None]),
-                    onnx.helper.make_tensor_value_info("w", FLOAT, [None, None]),
-                ],
-                [
-                    onnx.helper.make_tensor_value_info("f1", FLOAT, [None, None]),
-                    onnx.helper.make_tensor_value_info("f2", FLOAT, [None, None]),
-                ],
-            ),
-            opset_imports=[onnx.helper.make_opsetid("", 18)],
-            ir_version=9,
-        )
-        onnx.checker.check_model(model)
-
-        model = onnx.shape_inference.infer_shapes(model)
-        ir_model = ir.serde.deserialize_model(model)
-
-        rule.apply_to_model(ir_model)
-        self.assertEqual(
-            ["AddAddAddAdd"],
-            [n.op_type for n in ir_model.graph],
-        )
-        # TODO: do that in pattern.py.
-        ir_model.opset_imports["ZZZ"] = 1
-
-        rewriten_model = ir.serde.serialize_model(ir_model)
-
-        self.assertEqual(
-            ["AddAddAddAdd"],
-            [n.op_type for n in rewriten_model.graph.node],
-        )
-
-        feeds = {
-            "x": self._range(5, 6),
-            "y": self._range(5, 6),
-            "w": self._range(5, 6),
-            "z": self._range(5, 6),
-        }
-        ref1 = onnx.reference.ReferenceEvaluator(model)
-        expected = ref1.run(None, feeds)
-
-        self.assertEqual(0, len(rewriten_model.graph.initializer))
-        opsets = {v.domain: v.version for v in rewriten_model.opset_import}
-        self.assertIn("ZZZ", opsets)
-        self.assertEqual(opsets["ZZZ"], 1)
-
-        ref2 = onnx.reference.ReferenceEvaluator(rewriten_model, new_ops=[AddAddAddAdd])
-        got = ref2.run(None, feeds)
-        np.testing.assert_almost_equal(expected[0], got[0])
-
-    def check_with_ort(self, model: onnx.ModelProto, providers=None):
-        if providers is None:
-            providers = ["CPUExecutionProvider"]
-
-        if isinstance(model, onnx.ModelProto):
-            model = model.SerializeToString()
-        session = ort.InferenceSession(model, providers=providers)
-        return session
-
-    def get_rotary_model(self):
-        inputs = [
-            onnx.helper.make_tensor_value_info("x", onnx.TensorProto.INT64, shape=[]),
-            onnx.helper.make_tensor_value_info("pos_ids", FLOAT, shape=[]),
-            onnx.helper.make_tensor_value_info("axis", onnx.TensorProto.INT64, shape=[]),
-        ]
-        nodes = [
-            onnx.helper.make_node("Unsqueeze", ["x", "axis"], ["_onx_unsqueeze0"]),
-            onnx.helper.make_node("Cast", ["_onx_unsqueeze0"], ["_onx_cast0"], to=1),
-            onnx.helper.make_node("MatMul", ["pos_ids", "_onx_cast0"], ["_onx_matmul0"]),
-            onnx.helper.make_node("Transpose", ["_onx_matmul0"], ["_onx_transpose0"]),
-            onnx.helper.make_node(
-                "ConcatTraining",
-                ["_onx_transpose0", "_onx_transpose0"],
-                ["_onx_concattraining0", "_onx_concattraining1"],
-                domain="com.microsoft",
-            ),
-            onnx.helper.make_node("Sin", ["_onx_concattraining0"], ["_onx_sin0"]),
-            onnx.helper.make_node("Cast", ["_onx_sin0"], ["_onx_cast02"], to=1),
-            onnx.helper.make_node("Cos", ["_onx_concattraining0"], ["_onx_cos0"]),
-            onnx.helper.make_node("Cast", ["_onx_cos0"], ["_onx_cast03"], to=1),
-        ]
-        outputs = [
-            onnx.helper.make_tensor_value_info("_onx_cast02", onnx.TensorProto.UNDEFINED, []),
-            onnx.helper.make_tensor_value_info("_onx_cast03", onnx.TensorProto.UNDEFINED, []),
-        ]
-        model = onnx.helper.make_model(
-            onnx.helper.make_graph(
-                nodes,
-                "experiment",
-                inputs,
-                outputs,
-            ),
-            opset_imports=[
-                onnx.helper.make_opsetid("", 18),
-                onnx.helper.make_opsetid("com.microsoft", 18),
-            ],
-        )
-        return model
-
-    def test_shared_root_value_test(self):
-        def match_pattern(op, x):
-            t1 = op.Sin(x)
-            t2 = op.Cos(x)
-            return t1, t2
-
-        def apply_pattern(op, x, **_):
-            return op.SinCos(x, _domain="com.microsoft", _outputs=2)
-
-        rule = pattern.RewriteRule(match_pattern, apply_pattern, matcher=self.matcher_algo)
-        model_proto = onnx.parser.parse_model(
-            """
-            <ir_version: 7, opset_import: [ "" : 17]>
-            agraph (float[N] y) => (float[N] z)
-            {
-                temp1 = Sin(y)
-                temp2 = Cos(y)
-                z = Add(temp1, temp2)
-            }
-        """
-        )
-        onnx.checker.check_model(model_proto)
-        model = onnx.shape_inference.infer_shapes(model_proto)
-        ir_model = ir.serde.deserialize_model(model)
-        rule.apply_to_model(ir_model)
-        rewritten_model = ir.serde.serialize_model(ir_model)
-        graph = rewritten_model.graph
-        self.assertEqual(len(graph.node), 2)
-        self.assertEqual(graph.node[0].op_type, "SinCos")
-
-    def test_shared_root_value_extra_use(self):
-        if self.matcher_algo is generic_pattern.GenericPatternMatcher:
-            raise unittest.SkipTest("GenericPatternMatcher does not support extra uses yet.")
-
-        def match_pattern(op, x):
-            t1 = op.Sin(x)
-            t2 = op.Cos(x)
-            return t1, t2
-
-        def apply_pattern(op, x, **_):
-            return op.SinCos(x, _domain="com.microsoft", _outputs=2)
-
-        rule = pattern.RewriteRule(
-            match_pattern,
-            apply_pattern,
-            matcher=self.matcher_algo,
-        )
-        model_proto = onnx.parser.parse_model(
-            """
-            <ir_version: 7, opset_import: [ "" : 17]>
-            agraph (float[N] y) => (float[N] z)
-            {
-                temp1 = Sin(y)
-                temp2 = Cos(y)
-                w = Add(temp1, temp2)
-                z = Mul(w, y)
-            }
-        """
-        )
-        onnx.checker.check_model(model_proto)
-        model = onnx.shape_inference.infer_shapes(model_proto)
-        ir_model = ir.serde.deserialize_model(model)
-        rule.apply_to_model(ir_model)
-        graph = ir_model.graph
-        self.assertEqual(len(graph), 3)
-        self.assertEqual(graph.node(0).op_type, "SinCos")
-
-    def test_rotary_embedding(self):
-        # The test work on a model if it has the expected name.
-        # A dummy model is used if not present (not implemented yet).
-
-        def match_pattern(op, x, pos_ids, axis):
-            # original code: the code does verifies the constant yet
-            # unsqueeze = op.Unsqueeze(x, [1])
-
-            unsqueeze = op.Unsqueeze(x, axis)
-            cast = op.Cast(unsqueeze, to=FLOAT)
-
-            matmul = op.MatMul(pos_ids, cast)
-            transpose = op.Transpose(matmul)
-            output, _length = op.ConcatTraining(
-                transpose,
-                transpose,
-                _domain="com.microsoft",
-                _outputs=2,
-            )
-
-            sin = op.Sin(output)
-            cast1 = op.Cast(sin, to=FLOAT)
-            cos = op.Cos(output)
-            cast2 = op.Cast(cos, to=FLOAT)
-            return cast1, cast2
-
-        def validate_mapping(match_result, **_) -> bool:
-            del match_result
-            return True
-
-        def apply_pattern(op, x, pos_ids, axis, **_):
-            del axis
-            cos_cache = op.Constant(
-                value=onnx.numpy_helper.from_array(np.random.rand(256, 256).astype(np.float16))
-            )
-            sin_cache = op.Constant(
-                value=onnx.numpy_helper.from_array(np.random.rand(256, 256).astype(np.float16))
-            )
-            return op.RotaryEmbedding(
-                x,
-                pos_ids,
-                cos_cache,
-                sin_cache,
-                _domain="com.microsoft",
-                _outputs=2,
-            )
-
-        rule = pattern.RewriteRule(
-            match_pattern,
-            apply_pattern,
-            validate_mapping,
-            self.matcher_algo,
-            verbose=10,
-        )
-
-        model = self.get_rotary_model()
-
-        buffer = io.StringIO()
-        with contextlib.redirect_stdout(buffer):
-            # back to ir
-            model = onnx.shape_inference.infer_shapes(model)
-            ir_model = ir.serde.deserialize_model(model)
-
-            # starts matching
-            rule.apply_to_model(ir_model)
-            ir_model.opset_imports["com.microsoft"] = 1
-
-            rewriten_model = ir.serde.serialize_model(ir_model)
-
-        expected = ["Constant", "Constant", "RotaryEmbedding"]
-        self.assertEqual(expected, [n.op_type for n in rewriten_model.graph.node])
-        out = buffer.getvalue()
-        # TODO(Rama): What is this assertion testing? Is it to check that `verbose` is working?
-        if self.matcher_algo is generic_pattern.GenericPatternMatcher:
-            self.assertIn("[GenericPatternMatcher.match", out)
-
-    def test_rotary_embedding_onnxscript(self):
-        # The test work on a model if it has the expected name.
-        # A dummy model is used if not present (not implemented yet).
-
-        def rotary_match_pattern(op, x, pos_ids, axis):
-            unsqueeze = op.Unsqueeze(x, axis)
-            cast = op.Cast(unsqueeze, to=FLOAT)
-
-            matmul = op.MatMul(pos_ids, cast)
-            transpose = op.Transpose(matmul)
-            output, _length = op.ConcatTraining(
-                transpose, transpose, _domain="com.microsoft", _outputs=2
-            )
-
-            sin = op.Sin(output)
-            cast1 = op.Cast(sin, to=FLOAT)
-            cos = op.Cos(output)
-            cast2 = op.Cast(cos, to=FLOAT)
-            return cast1, cast2
-
-        def validate_rotary_mapping(match_result, **_) -> bool:
-            # If some pattern needs to be rejected.
-            del match_result
-            return True
-
-        def rotary_apply_pattern(op, x, pos_ids, axis, **_):
-            cos_cache = op.Constant(
-                value=onnx.numpy_helper.from_array(np.random.rand(256, 256).astype(np.float16))
-            )
-            sin_cache = op.Constant(
-                value=onnx.numpy_helper.from_array(np.random.rand(256, 256).astype(np.float16))
-            )
-            part1, part2 = op.RotaryEmbedding(
-                x, pos_ids, cos_cache, sin_cache, _domain="com.microsoft", _outputs=2
-            )
-            return part1, part2
-
-        rule = pattern.RewriteRule(
-            rotary_match_pattern,
-            rotary_apply_pattern,
-            validate_rotary_mapping,
-            self.matcher_algo,
-            verbose=10,
-        )
-
-        model = self.get_rotary_model()
-
-        buffer = io.StringIO()
-        with contextlib.redirect_stdout(buffer):
-            # back to ir
-            model = onnx.shape_inference.infer_shapes(model)
-            ir_model = ir.serde.deserialize_model(model)
-
-            # starts matching
-            rule.apply_to_model(ir_model)
-            ir_model.opset_imports["com.microsoft"] = 1
-
-            rewriten_model = ir.serde.serialize_model(ir_model)
-
-        expected = ["Constant", "Constant", "RotaryEmbedding"]
-        self.assertEqual(expected, [n.op_type for n in rewriten_model.graph.node])
-        out = buffer.getvalue()
-        # TODO(justinchuby): Remove this assert - capturing stdout is not robust
-        if self.matcher_algo is generic_pattern.GenericPatternMatcher:
-            self.assertIn("[GenericPatternMatcher.match", out)
-
-    def test_rotary_emb_file_onnxscript(self):
-        # The test work on a model if it has the expected name.
-        # A dummy model is used if not present (not implemented yet).
-
-        def rotary_match_pattern(op, x, pos_ids, axis):
-            unsqueeze = op.Unsqueeze(x, axis)
-            cast = op.Cast(unsqueeze, to=FLOAT)
-
-            matmul = op.MatMul(pos_ids, cast)
-            transpose = op.Transpose(matmul)
-            output, _length = op.ConcatTraining(
-                transpose, transpose, _domain="com.microsoft", _outputs=2
-            )
-
-            sin = op.Sin(output)
-            cast1 = op.Cast(sin, to=FLOAT)
-            cos = op.Cos(output)
-            cast2 = op.Cast(cos, to=FLOAT)
-            return cast1, cast2
-
-        def validate_rotary_mapping(match_result, **_) -> bool:
-            # If some pattern needs to be rejected.
-            del match_result
-            return True
-
-        def rotary_apply_pattern(op, x, pos_ids, axis):
-            cos_cache = op.Constant(
-                value=onnx.numpy_helper.from_array(np.random.rand(256, 256).astype(np.float16))
-            )
-            sin_cache = op.Constant(
-                value=onnx.numpy_helper.from_array(np.random.rand(256, 256).astype(np.float16))
-            )
-            part1, part2 = op.RotaryEmbedding(
-                x, pos_ids, cos_cache, sin_cache, _domain="com.microsoft", _outputs=2
-            )
-            return part1, part2
-
-        model_path = "gemma_optimized_pre_grad_training_2.onnx"
-        if not os.path.exists(model_path):
-            raise unittest.SkipTest(f"{model_path!r} is missing")
-        model = onnx.load(model_path)
-        model = onnx.shape_inference.infer_shapes(model)
-        ir_model = ir.serde.deserialize_model(model)
-
-        rule = pattern.RewriteRule(
-            rotary_match_pattern,
-            rotary_apply_pattern,
-            validate_rotary_mapping,
-            self.matcher_algo,
-            verbose=10,
-        )
-
-        rule.apply_to_model(ir_model)
-        # TODO: do that in pattern.py.
-        ir_model.opset_imports["ZZZ"] = 1
-
-        rewriten_model = ir.serde.serialize_model(ir_model)
-
-        buffer = rewriten_model.SerializeToString()
-        with open(f"{model}.opt.onnx", "wb") as f:
-            f.write(buffer)
-        self.check_with_ort(rewriten_model)
-
-    def test_transpose_transpose_onnxscript(self):
-        # TODO(rama): Attribute-parameters not yet supported in multi-output matching.
-        # def transpose_transpose_pattern(op, X, perm0, perm1):
-        #     xt = op.Transpose(X, perm=perm0)
-        #     Y = op.Transpose(xt, perm=perm1)
-        #     return Y
-
-        def transpose_transpose_pattern(op, X):
-            XT = op.Transpose(X, _outputs=["XT"])
-            Y = op.Transpose(XT, _outputs=["Y"])
-            return Y
-
-        def transpose_transpose_mapping(perm0, perm1):
-            new_perm = [0 for p in perm0]
-            for i, p in enumerate(perm1):
-                new_perm[i] = perm0[p]
-            # replace by return [perm0[p] for p in perm1] ?
-            return new_perm
-
-        def transpose_transpose_check(op, **_) -> bool:
-            return True
-
-        def transpose_transpose_apply_pattern(op, X, XT: ir.Value, Y, **_):
-            perm0 = XT.producer().attributes.get("perm")
-            if perm0 is not None:
-                perm0 = perm0.value  # TODO(rama): handle RefAttr
-            perm1 = Y.producer().attributes.get("perm")
-            if perm1 is not None:
-                perm1 = perm1.value  # TODO(rama): handle RefAttr
-            if perm0 is None and perm1 is None:
-                return op.Identity(X)
-            if perm0 is None:
-                perm0 = range(len(perm1) - 1, -1, -1)
-            if perm1 is None:
-                perm1 = range(len(perm0) - 1, -1, -1)
-            composed_perm = transpose_transpose_mapping(perm0, perm1)
-            return op.Transpose(X, perm=composed_perm)
-
-        rule = pattern.RewriteRule(
-            transpose_transpose_pattern,
-            transpose_transpose_apply_pattern,
-            transpose_transpose_check,
-            self.matcher_algo,
-            verbose=0,
-        )
-
-        model = onnx.helper.make_model(
-            onnx.helper.make_graph(
-                [
-                    onnx.helper.make_node("Transpose", ["X"], ["xt"], perm=[1, 2, 0]),
-                    onnx.helper.make_node("Transpose", ["xt"], ["Y"], perm=[1, 2, 0]),
-                ],
-                "name",
-                [onnx.helper.make_tensor_value_info("X", FLOAT, [None, None, None])],
-                [onnx.helper.make_tensor_value_info("Y", FLOAT, [None, None, None])],
-            ),
-            opset_imports=[onnx.helper.make_opsetid("", 18)],
-        )
-
-        # back to ir
-        ir_model = ir.serde.deserialize_model(model)
-
-        # starts matching
-
-        rule.apply_to_model(ir_model)
-        rewriten_model = ir.serde.serialize_model(ir_model)
-
-        expected = ["Transpose"]
-        self.assertEqual(expected, [n.op_type for n in rewriten_model.graph.node])
-        node = rewriten_model.graph.node[0]
-        self.assertEqual(len(node.attribute), 1)
-        att = node.attribute[0]
-        self.assertEqual(att.name, "perm")
-        self.assertEqual(list(att.ints), [2, 0, 1])
-
-
-if __name__ == "__main__":
-    unittest.main(verbosity=2)

From c772dd38e9871ec1c90287d05c99183041ef7016 Mon Sep 17 00:00:00 2001
From: Justin Chu <justinchuby@users.noreply.github.com>
Date: Thu, 18 Sep 2025 10:45:08 -0700
Subject: [PATCH 2/2] Clean up

Signed-off-by: Justin Chu <justinchuby@users.noreply.github.com>
---
 .lintrunner.toml              |  1 -
 examples/pattern_rewriting.py | 25 -------------------------
 pyproject.toml                | 34 ----------------------------------
 3 files changed, 60 deletions(-)

diff --git a/.lintrunner.toml b/.lintrunner.toml
index 7b31bab564..907f3bfce6 100644
--- a/.lintrunner.toml
+++ b/.lintrunner.toml
@@ -57,7 +57,6 @@ exclude_patterns = [
     'onnxscript/rewriter/onnxruntime/transformers/multihead_attention.py',  # FIXME
     'onnxscript/tools/function_unittest_producer.py',  # FIXME
     'onnxscript/rewriter/onnxruntime/transformers/layernorm.py',  # FIXME
-    'onnxscript/rewriter/generic_pattern.py',  # FIXME
 ]
 command = [
     'python',
diff --git a/examples/pattern_rewriting.py b/examples/pattern_rewriting.py
index 7b5c56d5e3..fd84d7f3cb 100644
--- a/examples/pattern_rewriting.py
+++ b/examples/pattern_rewriting.py
@@ -141,28 +141,3 @@ def rotary_apply_pattern(op, x, pos_ids, axis):
 rule = pattern.RewriteRule(rotary_match_pattern, rotary_apply_pattern, verbose=10)
 
 rule.apply_to_model(ir_model)
-
-# TODO(rama): Update the following, the trace-printed looks different now.
-
-######################################
-# The logs shows every time the algorithm rejected a pattern.
-# We can see the following:
-#
-# ::
-#
-#     [OnnxGenericPattern.match] NONE - line: 673:onnxscript.rewriter.generic_pattern, op_type=Cast
-#         --hint--: BACKWARD: different node types
-#           --pattern
-#           ConcatTraining(transpose, transpose) -> (output, length)
-#           -- model
-#           ConcatTrainingBad(_onx_transpose0, _onx_transpose0) -> (_onx_concattraining0, _onx_concattraining1)
-#         iteration=1
-#         --marked-- #2
-#           Cast(_onx_cos0) ~ Cast(cos) [140186194226496-140186194222320]
-#           Cos(_onx_concattraining0) ~ Cos(output) [140186194230816-140186194223472]
-#         len(stacked)=0:[]
-#
-# Line 673 in file `generic_pattern.py`, the match was rejected.
-# It says while comparing two nodes in the backward direction,
-# node types do not match.
-# It also says that two nodes were actually matched.
diff --git a/pyproject.toml b/pyproject.toml
index 3df6b3995c..5f31581494 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -79,40 +79,6 @@ module = [
 ]
 ignore_errors = true
 
-# FIXME(#1378): Remove this overrides section
-[[tool.mypy.overrides]]
-module = [
-  "onnxrewriter.rewriter.generic_pattern_test.*",
-]
-check_untyped_defs = false
-disable_error_code = 'override,import-untyped,no-untyped-def,assignment'
-disallow_incomplete_defs = true
-disallow_untyped_defs = true
-disallow_untyped_decorators = true
-show_column_numbers = true
-strict_optional = true
-warn_incomplete_stub = true
-warn_no_return = true
-warn_unused_configs = true
-warn_unused_ignores = false
-
-# FIXME(#1378): Remove this overrides section
-[[tool.mypy.overrides]]
-module = [
-  "onnxrewriter.rewriter.generic_pattern.*",
-]
-check_untyped_defs = false
-disable_error_code = 'override,import-untyped,no-untyped-def,assignment,union-attr,func-returns-value,annotation-unchecked,arg-type,index,name-defined,attr-defined'
-disallow_incomplete_defs = true
-disallow_untyped_defs = true
-disallow_untyped_decorators = true
-show_column_numbers = true
-strict_optional = true
-warn_incomplete_stub = true
-warn_no_return = true
-warn_unused_configs = true
-warn_unused_ignores = false
-
 [tool.pylint.messages_control]
 # NOTE: This list is for vscode. Add new disables in pyproject_pylint.toml for lintrunner
 # Exclude patterns should be modified in .lintrunner.toml