From 320d621e76352e19132b55ca2b2ca615ec95ebcf Mon Sep 17 00:00:00 2001 From: Mengwei Liu Date: Tue, 30 Sep 2025 13:30:08 -0700 Subject: [PATCH] [aoti-cuda] Directly pass user input placeholders to torch._inductor.aot_compile Summary: As titled, this avoids issues like SymInt inputs being replaced by fake tensors Test Plan: Reviewers: Subscribers: Tasks: Tags: --- backends/cuda/cuda_backend.py | 14 +------------- 1 file changed, 1 insertion(+), 13 deletions(-) diff --git a/backends/cuda/cuda_backend.py b/backends/cuda/cuda_backend.py index 1942d5e24a3..49314bed5e6 100644 --- a/backends/cuda/cuda_backend.py +++ b/backends/cuda/cuda_backend.py @@ -117,18 +117,6 @@ def preprocess( if node.op == "placeholder" and node.name in user_input_names: user_input_placeholders.append(node.meta["val"]) - # Create pseudo user inputs using torch.randn and metadata from input placeholders - faked_user_inputs = [] - for placeholder in user_input_placeholders: - if isinstance(placeholder, torch.Tensor): - # Generate fake input with same shape and dtype, on CUDA - fake_input = torch.randn( - placeholder.shape, dtype=placeholder.dtype, device="cuda" - ) - faked_user_inputs.append(fake_input) - - faked_user_inputs = tuple(faked_user_inputs) - options: dict[str, typing.Any] = { # Embed CUDA kernel binaries directly into the compiled shared object "aot_inductor.embed_kernel_binary": True, @@ -145,7 +133,7 @@ def preprocess( } with collect_unsupported_fallback_kernels(): - so_path = torch._inductor.aot_compile(edge_program_module, faked_user_inputs, options=options) # type: ignore[arg-type] + so_path = torch._inductor.aot_compile(edge_program_module, tuple(user_input_placeholders), options=options) # type: ignore[arg-type] if len(missing_fallback_kernels) > 0: formatted_kernels = "\n - ".join(sorted(missing_fallback_kernels)) raise RuntimeError(