
Commit 326120a

[Inductor] refine the logic in (mm + bias) -> addmm

ghstack-source-id: ea3fb8e
Pull-Request: #166300

1 parent c69f15e
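
For context, the pattern this pass targets is a matmul followed by a broadcastable bias add, which aten can execute as a single fused `addmm`. A minimal standalone sketch of the algebraic equivalence behind the rewrite (illustration only, not code from this commit; the shapes are arbitrary):

```python
import torch

mat1 = torch.randn(4, 8)
mat2 = torch.randn(8, 16)
inp = torch.randn(16)  # bias, broadcastable to the (4, 16) mm output

# Unfused form matched by the pattern: mm followed by a bias add.
unfused = torch.mm(mat1, mat2) + inp

# Fused form produced by the replacement: a single addmm call,
# which computes beta * inp + alpha * (mat1 @ mat2) with beta = alpha = 1.
fused = torch.addmm(inp, mat1, mat2)

torch.testing.assert_close(unfused, fused)
```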

File changed: torch/_inductor/fx_passes/post_grad.py (+3, -16 lines)
```diff
@@ -1554,27 +1554,14 @@ def repl(inp, x1, x2):
     match.replace_by_example(repl, [inp, mat1, mat2])
 
 
-def is_valid_addmm_fusion(match):
-    mat1, mat2 = match.args
+def can_fuse_bias_in_addmm(match):
     inp = match.kwargs["inp"]
 
     if not (
         isinstance(inp, torch.fx.Node) and isinstance(inp.meta["val"], torch.Tensor)
     ):
         return False  # Input is a number
 
-    in_shape = inp.meta["val"].shape
-    mm_shape = mat1.meta["val"].shape[0], mat2.meta["val"].shape[1]
-    matched = is_expandable_to(in_shape, mm_shape)
-    if not matched:
-        return False  # Shape mismatch
-
-    inp_dtype = inp.meta["val"].dtype
-
-    # aten cublas integration assumes equal dtypes
-    if inp_dtype != mat1.meta["val"].dtype or inp_dtype != mat2.meta["val"].dtype:
-        return False
-
     return not should_prefer_unfused_addmm(match)
 
 
@@ -1586,7 +1573,7 @@ def is_valid_addmm_fusion(match):
     ),
     # pyrefly: ignore [bad-argument-type]
     pass_dict=pass_patterns[2],
-    extra_check=is_valid_addmm_fusion,
+    extra_check=can_fuse_bias_in_addmm,
 )
 @register_graph_pattern(
     CallFunction(
@@ -1596,7 +1583,7 @@ def is_valid_addmm_fusion(match):
     ),
     # pyrefly: ignore [bad-argument-type]
     pass_dict=pass_patterns[2],
-    extra_check=is_valid_addmm_fusion,
+    extra_check=can_fuse_bias_in_addmm,
 )
 def addmm(match, mat1, mat2, *, inp):
     def repl(inp, mat1, mat2):
```
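
After this change, `can_fuse_bias_in_addmm` is the `extra_check` gating both registered patterns, and the shape-expandability and dtype checks are no longer part of the match-time validation. A hedged sketch of a function this pattern can match under `torch.compile` (illustrative only; whether the rewrite actually fires also depends on `should_prefer_unfused_addmm` and the rest of the pass):

```python
import torch

def linear_like(inp, mat1, mat2):
    # mm followed by a bias add: the graph shape the addmm pattern matches.
    return torch.mm(mat1, mat2) + inp

# Under torch.compile, Inductor's post-grad pattern pass may rewrite this
# into a single addmm when the extra_check accepts the match.
compiled = torch.compile(linear_like)
out = compiled(torch.randn(16), torch.randn(4, 8), torch.randn(8, 16))
```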
