From c2103e757f194133bea1100872aa57e7de959c26 Mon Sep 17 00:00:00 2001 From: "G. Ramalingam" Date: Thu, 9 Jan 2025 14:01:57 -0800 Subject: [PATCH] A couple of extensions to rewriter (#2001) Extends the rewriter with a couple of features: * A debugging mode to perform the pattern matching (without any graph modifications) and to report instances that get the best score for a match (even if incomplete). Helps quickly identify causes for mismatches when we expect a match. * Rewrite-rules can now specify a pre/post visitor method called before applying it to a graph/function. This is useful for rules that need to create "cached" values that are reused across multiple instances of the pattern. --------- Co-authored-by: Justin Chu --- onnxscript/rewriter/_ir_utils.py | 29 ++-- onnxscript/rewriter/pattern.py | 216 ++++++++++++++++++++++++---- onnxscript/rewriter/pattern_test.py | 67 +++++++++ 3 files changed, 276 insertions(+), 36 deletions(-) diff --git a/onnxscript/rewriter/_ir_utils.py b/onnxscript/rewriter/_ir_utils.py index 1d657a5ab..83763a8ac 100644 --- a/onnxscript/rewriter/_ir_utils.py +++ b/onnxscript/rewriter/_ir_utils.py @@ -3,7 +3,7 @@ from __future__ import annotations import math -from typing import Callable +from typing import Callable, Sequence import numpy as np @@ -11,6 +11,21 @@ from onnxscript.optimizer import basic_constant_propagation +def display_nodes(nodes: Sequence[ir.Node]) -> None: + """Display a list of nodes in the order they appear in the graph.""" + if nodes: + graph = nodes[0].graph + if graph: + # Display nodes in same order as in graph: + # Currently doesn't handle (control-flow) subgraphs + for node in graph: + if node in nodes: + node.display() + else: + for node in nodes: + node.display() + + def display_slice(x: ir.Value | ir.Node, backward: bool = True, depth_limit: int = 5) -> None: """Display the (backward or forward) subgraph from a given value or node upto a certain depth.""" slice = [] @@ -33,17 +48,7 @@ def visit(node: ir.Node, depth): visit(x, 0) elif isinstance(x, ir.Value) and x.producer() is not None: visit(x.producer(), 0) # type: ignore[arg-type] - if slice: - graph = slice[0].graph - if graph: - # Display nodes in same order as in graph: - # Currently doesn't handle (control-flow) subgraphs - for node in graph: - if node in slice: - node.display() - else: - for node in reversed(slice): - node.display() + display_nodes(slice) def get_const_value(value: ir.Value) -> ir.TensorProtocol | None: diff --git a/onnxscript/rewriter/pattern.py b/onnxscript/rewriter/pattern.py index a961ae872..333cb489d 100644 --- a/onnxscript/rewriter/pattern.py +++ b/onnxscript/rewriter/pattern.py @@ -5,9 +5,11 @@ import abc import contextlib import dataclasses +import enum import inspect import itertools import math +from collections import defaultdict from typing import ( Any, Callable, @@ -328,13 +330,17 @@ def __init__(self) -> None: self.outputs: list[ir.Value] = [] # For a failed match, _reason is a string that describes the reason for the failure. self._reason: str = "" + # Track the node that caused the failure. + # TODO: May be useful to extend this to be a collection of Nodes and Values. + self._failure_node: ir.Node | None = None def __bool__(self): return self._success - def fail(self, reason: str = "") -> MatchResult: + def fail(self, reason: str = "", node: ir.Node | None = None) -> MatchResult: self._success = False self._reason = reason + self._failure_node = node return self @property @@ -536,18 +542,23 @@ def matches(self, node: ir.Node, match: MatchResult) -> MatchResult: We check the domain, op_type, and attributes of the node, but not the inputs. """ # TODO(rama): Ensure we handle "" and "onnx.ai" correctly. - if not self.domain.matches(node.domain): - return match.fail(f"Domain mismatch: expected {self.domain}, got {node.domain}.") if not self.op.matches(node.op_type): - return match.fail(f"OpType mismatch: expected {self.op}, got {node.op_type}.") + return match.fail( + f"OpType mismatch: expected {self.op}, got {node.op_type}.", node + ) + if not self.domain.matches(node.domain): + return match.fail( + f"Domain mismatch: expected {self.domain}, got {node.domain}.", node + ) for name, attr_pattern in self.attributes.items(): attr_value = node.attributes.get(name) if attr_value is None: - return match.fail(f"Attribute {name} not found in node.") + return match.fail(f"Attribute {name} not found in node.", node) if not attr_pattern.matches(attr_value): return match.fail( - f"Attribute {name} mismatch: expected {attr_pattern}, got {attr_value}." + f"Attribute {name} mismatch: expected {attr_pattern}, got {attr_value}.", + node, ) if attr_pattern.name is not None: if not match.bind(attr_pattern.name, attr_value): @@ -557,7 +568,7 @@ def matches(self, node: ir.Node, match: MatchResult) -> MatchResult: for name in node.attributes: # TODO: Support matching default nodes for attributes. if name not in self.attributes: - return match.fail(f"Attribute {name} not expected in node.") + return match.fail(f"Attribute {name} not expected in node.", node) return match @@ -945,8 +956,10 @@ def match( model: ir.Model, graph_or_function: ir.Graph | ir.Function, node: ir.Node, + *, verbose: int = 0, remove_nodes: bool = True, + tracer: MatchingTracer | None = None, ) -> MatchResult: """Match the pattern against the subgraph ending at the given node.""" @@ -957,13 +970,14 @@ def __str__(self) -> str: class SimplePatternMatcher(PatternMatcher): def __init__(self, pattern: GraphPattern) -> None: super().__init__(pattern) + self._current_node: ir.Node | None = None - def fail(self, reason: str) -> bool: + def fail(self, reason: str, node: ir.Node | None = None) -> bool: if self._verbose: if self._matched: # Print only if at least one node successfully matched. count = len(self._matched) print(f"Match failed after {count} nodes: {reason}") - self._match.fail(reason) + self._match.fail(reason, node or self._current_node) return False def _match_constant(self, pattern_constant: Constant, value: ir.Value) -> bool: @@ -1025,7 +1039,7 @@ def _match_constant(self, pattern_constant: Constant, value: ir.Value) -> bool: def _match_node(self, pattern_node: NodePattern, node: ir.Node) -> bool: """Matches a pattern subgraph against subgraph rooted at node.""" - + self._current_node = node # Graph-matching: we do not allow the same pattern node to be matched against # different graph nodes. if pattern_node in self._matched: @@ -1039,6 +1053,7 @@ def _match_node(self, pattern_node: NodePattern, node: ir.Node) -> bool: if self._verbose: print(f"Matched: {node.op_type}") + match.nodes.append(node) self._matched[pattern_node] = node # TODO: Revisit this to handle optional trailing inputs better. @@ -1067,7 +1082,6 @@ def _match_node(self, pattern_node: NodePattern, node: ir.Node) -> bool: if not self._bind_value(output_value_pattern, node.outputs[i]): return False - match.nodes.append(node) return True def _bind_value(self, pattern_value: ValuePattern, value: ir.Value | None) -> bool: @@ -1115,6 +1129,7 @@ def _init_match(self, verbose: int) -> None: self._verbose = verbose self._matched: dict[NodePattern, ir.Node] = {} self._match: MatchResult = MatchResult() + self._current_node = None def _get_output_values(self) -> list[ir.Value] | None: """Get values bound to the output variables of the pattern.""" @@ -1163,8 +1178,10 @@ def _match_single_output_node( output_values = self._get_output_values() if output_values is None: + # TODO(rama): Is this a valid (useful) case? return match if check_removable and not _valid_to_replace(match.nodes, output_values): + # TODO(rama): Match status should be updated to reflect failure reason. return match.fail("Matched nodes have other uses preventing replacement.") match.outputs.extend(output_values) @@ -1200,8 +1217,10 @@ def match( model: ir.Model, graph_or_function: ir.Graph | ir.Function, node: ir.Node, + *, verbose: int = 0, remove_nodes: bool = True, + tracer: MatchingTracer | None = None, ) -> MatchResult: """Match the pattern against the subgraph ending at the given node. @@ -1218,7 +1237,7 @@ def match( matching in the presence of subgraphs (control-flow) can introduce some complications which require careful consideration. """ - + self._tracer = tracer if self.pattern.has_single_output_node: self._init_match(verbose) return self._match_single_output_node( @@ -1268,6 +1287,8 @@ def __init__( verbose: int = 0, name: str | None = None, remove_nodes: bool = True, + graph_pre_visitor: Callable[[], None] | None = None, + graph_post_visitor: Callable[[], None] | None = None, ) -> None: """Create a rewrite rule. @@ -1284,6 +1305,10 @@ def __init__( verbose: The verbosity level of the rule. name: An optional name for the pattern that will show up in verbose logging. remove_nodes: If True, the matched nodes will be removed from the graph. + graph_pre_visitor: A function that will be called before applying the + rewriting to the top-level graph or a function. + graph_post_visitor: A function that will be called after the rewriting + is complete for a graph or function. """ if not isinstance(target_pattern, GraphPattern): @@ -1308,20 +1333,20 @@ def __init__( self._verbose = verbose self.name = name self.remove_nodes = remove_nodes + self.graph_pre_visitor = graph_pre_visitor + self.graph_post_visitor = graph_post_visitor def __str__(self) -> str: - if self.name: - return f"{self.__class__.__name__}(..., name={self.name!r})" - return ( - f"{self.__class__.__name__}({self._target_pattern}, {self._replacement_pattern})" - ) + return self.name if self.name else "Anonymous Rule" def try_rewrite( self, model: ir.Model, graph_or_function: ir.Graph | ir.Function, node: ir.Node, + *, verbose: int | None = None, + tracer: MatchingTracer | None = None, ) -> ReplacementSubgraph | None: """If the node matches the pattern, then replace the node with the replacement pattern.""" if verbose and verbose > 2: @@ -1337,9 +1362,17 @@ def try_rewrite( if var.name not in match.bindings: match.bindings[var.name] = None if not self._condition_function(context, **match.bindings): + if tracer: + tracer.log( + self, graph_or_function, node, match, MatchStatus.CONDITION_FAILED + ) return None replacement_subgraph = self._replacement_pattern.get_replacement(match) if replacement_subgraph is None: + if tracer: + tracer.log( + self, graph_or_function, node, match, MatchStatus.REPLACEMENT_FAILED + ) return None if len(replacement_subgraph.new_outputs) != self._target_pattern.num_outputs: raise ValueError( @@ -1349,15 +1382,26 @@ def try_rewrite( # TODO(rama): Remove the opset imports from deleted nodes? _update_opset_imports(graph_or_function, replacement_subgraph) _update_opset_imports(model.graph, replacement_subgraph) + if tracer: + tracer.log(self, graph_or_function, node, match, MatchStatus.SUCCESS) return replacement_subgraph + if tracer: + tracer.log(self, graph_or_function, node, match, MatchStatus.NO_MATCH) return None def apply_to_model( - self, model: ir.Model, *, commute: bool = False, verbose: int | None = None + self, + model: ir.Model, + *, + commute: bool = False, + verbose: int | None = None, + debug: bool = False, ): # A convenience method to apply the rule to a model. We use a RewriteRuleSet to # handle commutative rules. - return RewriteRuleSet([self], commute=commute).apply_to_model(model, verbose=verbose) + return RewriteRuleSet([self], commute=commute).apply_to_model( + model, verbose=verbose, debug=debug + ) def commute(self) -> Sequence[RewriteRule]: def replace_pattern(new_pattern): @@ -1370,6 +1414,10 @@ def replace_pattern(new_pattern): self._condition_function, matcher_class(new_pattern), self._verbose, + self.name, + self.remove_nodes, + self.graph_pre_visitor, + self.graph_post_visitor, ) return [replace_pattern(p) for p in self._target_pattern.commute()] @@ -1451,12 +1499,16 @@ class RewriteRuleClassBase: @classmethod def rule(cls, *args, **kwargs): instance = cls(*args, **kwargs) + setup = instance.setup if hasattr(instance, "setup") else None + cleanup = instance.cleanup if hasattr(instance, "cleanup") else None return RewriteRule( instance.pattern, instance.rewrite, instance.check, name=instance.name, remove_nodes=instance.remove_nodes, + graph_pre_visitor=setup, + graph_post_visitor=cleanup, ) def __init__(self, name: str | None = None, remove_nodes: bool = True) -> None: @@ -1484,16 +1536,34 @@ def _apply_to_graph_or_function( self, model: ir.Model, graph_or_function: ir.Graph | ir.Function, + *, verbose: int | None, + tracer: MatchingTracer | None = None, ) -> int: + """ + Apply the rewrite rules to the given graph or function. + + Args: + model: The model to which the rewrite rules are applied. + graph_or_function: The graph or function to which the rewrite rules are applied. + verbose: The verbosity level. Defaults to None. + tracer: The tracer for debugging. Defaults to None. + + Returns: + The number of rewrite rules applied. + """ count = 0 # NOTE: Rules should be prioritized in the order they are added to the RewriteRuleSet. # And the graph is applied in order. for rule in self.rules: + if rule.graph_pre_visitor: + rule.graph_pre_visitor() for node in graph_or_function: - delta = rule.try_rewrite(model, graph_or_function, node, verbose=verbose) - if delta is None: + delta = rule.try_rewrite( + model, graph_or_function, node, verbose=verbose, tracer=tracer + ) + if delta is None or tracer is not None: continue assert isinstance(delta, ReplacementSubgraph) # TODO: This does not yet handle the problem of determining the correct insertion point @@ -1510,17 +1580,115 @@ def _apply_to_graph_or_function( delta.new_outputs, ) count += 1 + if rule.graph_post_visitor: + rule.graph_post_visitor() return count - def apply_to_model(self, model: ir.Model, verbose: int | None = None) -> int: + def apply_to_model( + self, model: ir.Model, *, verbose: int | None = None, debug: bool = False + ) -> int: + """Apply the rewrite rules in the set to the model. + + Args: + model: The model to which the rewrite rules are applied. + verbose: The verbosity level of messages. Defaults to None. + debug: Whether to enable debugging. Defaults to False. In the + debug mode, no changes are made to the model, only a report is produced at + the end about the best matches found. + + Returns: + The number of applications of rewrite rules. + """ assert isinstance(model, ir.Model) + tracer = MatchingTracer() if debug else None onnxscript.optimizer.basic_constant_propagation(model.graph) - count = self._apply_to_graph_or_function(model, model.graph, verbose=verbose) + count = self._apply_to_graph_or_function( + model, model.graph, verbose=verbose, tracer=tracer + ) for function in model.functions.values(): onnxscript.optimizer.basic_constant_propagation(function) - count += self._apply_to_graph_or_function(model, function, verbose=verbose) + count += self._apply_to_graph_or_function( + model, function, verbose=verbose, tracer=tracer + ) + if tracer: + tracer.report() return count def __iter__(self): yield from self.rules + + +class MatchStatus(enum.IntEnum): + """The status of a pattern-matching operation.""" + + NO_MATCH = 0 # No successful match found for entire pattern graph + CONDITION_FAILED = 1 # Subsequent validation check failed + REPLACEMENT_FAILED = 2 # Replacement subgraph could not be created + SUCCESS = 3 # A successful match was found + + +@dataclasses.dataclass +class MatchInfo: + """The status of a pattern-matching operation. An extension of MatchResult.""" + + match_result: MatchResult + root_node: ir.Node + container: ir.Graph | ir.Function + status: MatchStatus + + def score(self) -> int: + """Return a score for the match.""" + return len(self.match_result.nodes) + int(self.status.value) * 100 + + +class MatchingTracer: + """A debugging helper class to trace the matching of a pattern against a graph. + + This is used to track the best matches found for each rule, and to report the + results at the end of the matching. + """ + + def __init__(self) -> None: + self._log: dict[RewriteRule, list[MatchInfo]] = defaultdict(list) + + def log( + self, + rule: RewriteRule, + container: ir.Graph | ir.Function, + node: ir.Node, + match_result: MatchResult, + status: MatchStatus, + ) -> None: + this_match = MatchInfo(match_result, node, container, status) + this_score = this_match.score() + if this_score == 0: + return + best_matches = self._log[rule] + if best_matches: + if this_score < best_matches[0].score(): + return + if this_score > best_matches[0].score(): + best_matches.clear() + best_matches.append(this_match) + + def report(self) -> None: + import onnxscript.rewriter._ir_utils as ir_utils + + print("===") + for rule, matches in self._log.items(): + if not matches: + continue + print(f"Rule: {rule}") + print(f"Best score: {matches[0].score()}") + for match in matches: + print(f"Status: {match.status}") + if match.status == MatchStatus.NO_MATCH: + print("Graph matching failed: " + match.match_result.reason) + node = match.match_result._failure_node + if node: + print("Failure at or around node:") + node.display() + print("Matched nodes:") + ir_utils.display_nodes(match.match_result.nodes) + print("===") diff --git a/onnxscript/rewriter/pattern_test.py b/onnxscript/rewriter/pattern_test.py index 0247949f5..1803ab670 100644 --- a/onnxscript/rewriter/pattern_test.py +++ b/onnxscript/rewriter/pattern_test.py @@ -476,6 +476,73 @@ def test_model(x: FLOAT[1024]) -> FLOAT[1024]: self.assertEqual(model.graph.node(0).op_type, "ReplacedNone") self.assertEqual(model.graph.node(1).op_type, "ReplacedNotNone") + def test_graph_visitor(self): + class ReplaceFoo(pattern.RewriteRuleClassBase): + def __init__(self): + super().__init__() + self.replacement = None + + def pattern(self, op): + return op.Foo() + + def rewrite(self, op): + if self.replacement is None: + self.replacement = op.Bar() + return self.replacement + + rule = ReplaceFoo.rule() + + @script() + def test_model(x: FLOAT[1024]) -> FLOAT[1024]: + # Pattern should match following call + t1 = op.Foo() + # as well as this one + t2 = op.Foo() + z = op.Add(t1, t2) + return z + + model_proto = test_model.to_model_proto() + model = ir.serde.deserialize_model(model_proto) + + count = rule.apply_to_model(model) + self.assertEqual(count, 2) + self.assertEqual(len(model.graph), 2) + self.assertEqual(model.graph.node(0).op_type, "Bar") + self.assertEqual(model.graph.node(1).op_type, "Add") + + def test_debug_mode(self): + def source_pattern(op, x): + t1 = op.Abs(x) + t2 = op.Neg(t1) + t3 = op.Exp(t2) + return t3 + + def replacement(op, x): + return op.Something(x) + + rule = pattern.RewriteRule(source_pattern, replacement) + + @script() + def test_model(x: FLOAT[1024]) -> FLOAT[1024]: + a2 = op.Abs(x) # match-1 fails here + a3 = op.Exp(a2) # match-1 starts here + b1 = op.Neg(a3) # match-2 fails here + b2 = op.Neg(b1) # match-2 (partially) succeeds here + b3 = op.Exp(b2) # match-2 starts here + return b3 + + model_proto = test_model.to_model_proto() + model = ir.serde.deserialize_model(model_proto) + + output_buffer = io.StringIO() + with contextlib.redirect_stdout(output_buffer): + count = rule.apply_to_model(model, debug=True) + captured_output = output_buffer.getvalue() + + self.assertEqual(count, 0) + # Not a robust test. But test serves to ensure that debug mode is producing something. + self.assertIn("OpType mismatch: expected Abs, got Neg", captured_output) + class PatternBuilderTest(unittest.TestCase): def test_pattern_builder_context(self):