Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[ONNX] Restore readable names for parameters and buffers #104493

Closed
wants to merge 7 commits into from
10 changes: 9 additions & 1 deletion torch/onnx/_internal/exporter.py
Original file line number Diff line number Diff line change
Expand Up @@ -452,7 +452,9 @@ def export(self) -> ExportOutput:
)

# TODO: Design the passes API
graph_module = pre_export_passes(self.options, graph_module, updated_model_args)
graph_module = pre_export_passes(
self.options, self.model, graph_module, updated_model_args
)

# TODO: Defer `import onnxscript` out of `import torch` path
# https://github.com/pytorch/pytorch/issues/103764
Expand Down Expand Up @@ -610,6 +612,7 @@ def dynamo_export(
@_beartype.beartype
def pre_export_passes(
options: ResolvedExportOptions,
original_model: Union[torch.nn.Module, Callable],
fx_module: torch.fx.GraphModule,
fx_module_args: Sequence[Any],
):
Expand Down Expand Up @@ -647,6 +650,11 @@ def pre_export_passes(
diagnostic_context, module, options.onnxfunction_dispatcher
).analyze(infra.levels.ERROR)

if isinstance(original_model, torch.nn.Module):
module = passes.RestoreParameterAndBufferNames(
diagnostic_context, module, original_model
).run()

# ONNX does not support None inputs. During graph building, all None inputs
# are removed. Here we register this step to input adapter.
options.fx_tracer.input_adapter.append_step(io_adapter.RemoveNoneInputStep())
Expand Down
2 changes: 2 additions & 0 deletions torch/onnx/_internal/fx/passes/__init__.py
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
from .decomp import Decompose
from .functionalization import Functionalize, RemoveInputMutation
from .readability import RestoreParameterAndBufferNames
from .shape_inference import ShapeInferenceWithFakeTensor
from .virtualization import MovePlaceholderToFront, ReplaceGetAttrWithPlaceholder

Expand All @@ -8,6 +9,7 @@
"Functionalize",
"MovePlaceholderToFront",
"RemoveInputMutation",
"RestoreParameterAndBufferNames",
"ReplaceGetAttrWithPlaceholder",
"ShapeInferenceWithFakeTensor",
]
111 changes: 111 additions & 0 deletions torch/onnx/_internal/fx/passes/readability.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,111 @@
from __future__ import annotations

from typing import Dict, List, Sequence, Tuple, Union

import torch
from torch.onnx._internal import _beartype
from torch.onnx._internal.fx import _pass, diagnostics


class RestoreParameterAndBufferNames(_pass.Transform):
    """Restore parameter and buffer names from original module.

    This pass is useful for readability of the exported ONNX graph. It restores the
    parameter and buffer names from the original module. For example, if the original
    module has a parameter named `root.linear.0.weight`, and the parameter is renamed to
    `_param_constant9` by FX, this pass will rename it back.
    """

    def __init__(
        self,
        diagnostic_context: diagnostics.DiagnosticContext,
        module: torch.fx.GraphModule,
        original_module: torch.nn.Module,
    ):
        """Initialize the pass.

        Args:
            diagnostic_context: Context used to emit diagnostics about renames.
            module: The FX graph module whose `get_attr` targets will be renamed.
            original_module: The user's original `nn.Module`; its parameter/buffer
                tensors are expected to be the same objects held by `module`, so
                they can be used as lookup keys for the readable names.
        """
        super().__init__(diagnostic_context, module)
        self.original_module = original_module

    @_beartype.beartype
    def _rename_param_and_buffer(
        self,
        diagnostic: diagnostics.Diagnostic,
        nodes: Sequence[torch.fx.Node],
        new_name: str,
    ) -> None:
        """Rename the parameter/buffer and replace corresponding nodes with new nodes of updated target.

        Args:
            diagnostic: Diagnostic to record the rename on.
            nodes: All `get_attr` nodes that reference the same old target. Must be
                non-empty and share a single target.
            new_name: Readable dotted name from the original module, e.g.
                `linear.0.weight`.
        """
        assert len(nodes) > 0, "`nodes` cannot be empty"
        assert (
            len({node.target for node in nodes}) == 1
        ), "`nodes` must all have same `target`"
        old_name = nodes[0].target
        assert isinstance(old_name, str), f"Expected str, got type({old_name})"
        # Parameter/buffer name cannot contain ".", so the dotted original name is
        # flattened with "_" before being set as a module attribute.
        normalized_name = new_name.replace(".", "_")
        attr_value = getattr(self.module, old_name)
        # Re-register the same tensor object under the readable name, then drop the
        # FX-generated name. `self.module` is the graph module held by the base
        # `_pass.Transform` class.
        setattr(self.module, normalized_name, attr_value)
        delattr(self.module, old_name)
        # Swap every `get_attr` node over to the new target. A fresh node is created
        # because `node.target` of an existing node should not be mutated in place.
        for node in nodes:
            with self.module.graph.inserting_before(node):
                new_node = self.module.graph.get_attr(normalized_name)
                new_node.meta = node.meta
                node.replace_all_uses_with(new_node)
                self.module.graph.erase_node(node)
        diagnostic.with_additional_message(
            f"Renamed 'self.{old_name}' to 'self.{normalized_name}', "
            f"normalized from original parameter name '{new_name}'."
        )

    def _run(self, *args, **kwargs) -> torch.fx.GraphModule:
        """Restore parameter and buffer names from original module.

        For each `get_attr` node, if the target is a str representing a parameter or buffer
        under `self.module`, we rename the parameter or buffer to its original name.
        The parameters and buffers between `self.module` and `self.original_module` refer
        to the same objects, allowing us to use it as key to retrieve the original name.
        """
        assert len(args) == 0, "RestoreParameterAndBufferNames does not take any args"
        assert (
            len(kwargs) == 0
        ), "RestoreParameterAndBufferNames does not take any kwargs"
        # Map each parameter/buffer tensor (by object identity via hashing) back to
        # its dotted name in the original module.
        state_to_readable_name: Dict[Union[torch.nn.Parameter, torch.Tensor], str] = {}
        state_to_readable_name.update(
            {v: k for k, v in self.original_module.named_parameters()}
        )
        state_to_readable_name.update(
            {v: k for k, v in self.original_module.named_buffers()}
        )
        diagnostic = self.diagnostic_context.inflight_diagnostic()

        # Old FX-generated target -> (all nodes sharing it, readable new name).
        old_name_to_nodes: Dict[str, Tuple[List[torch.fx.Node], str]] = {}

        for node in self.module.graph.nodes:
            if node.op == "get_attr":
                assert isinstance(
                    node.target, str
                ), f"Expected str, got type({node.target})"
                if node.target in old_name_to_nodes:
                    # We have already processed this parameter/buffer.
                    old_name_to_nodes[node.target][0].append(node)
                    continue
                attr_value = getattr(self.module, node.target)
                if (
                    isinstance(attr_value, (torch.nn.Parameter, torch.Tensor))
                    and attr_value in state_to_readable_name
                ):
                    readable_name = state_to_readable_name[attr_value]
                    old_name_to_nodes[node.target] = ([node], readable_name)
                    continue

                diagnostic.with_additional_message(
                    f"Cannot find readable name for self.{node.target}: {type(attr_value)}. The name is unchanged."
                )
                if isinstance(attr_value, torch.nn.Parameter):
                    # If it is a parameter we treat it more seriously.
                    diagnostic.level = diagnostics.levels.WARNING
                else:
                    diagnostic.level = diagnostics.levels.NONE

        # Perform renames after the scan so the graph is not mutated while iterating.
        for nodes, new_name in old_name_to_nodes.values():
            self._rename_param_and_buffer(diagnostic, nodes, new_name)

        return self.module