[Inductor] No longer throw error in bmm out_dtype lowering due to template heuristics (#166457)

Fixes https://github.com/pytorch/pytorch/issues/165892
Pull Request resolved: https://github.com/pytorch/pytorch/pull/166457
Approved by: https://github.com/coconutruben
2025-12-06 12:20:52 +01:00 · 2025-10-28 16:07:03 -07:00 · 2025-10-28 16:07:03 -07:00 · c2e3cc7aed
commit c2e3cc7aed
parent 5849eea129
1 changed file with 3 additions and 2 deletions
--- a/torch/_inductor/kernel/bmm.py
+++ b/torch/_inductor/kernel/bmm.py
@@ -239,9 +239,10 @@ def tuned_bmm(mat1, mat2, out_dtype=None, *, layout=None):
        templates_to_use.append(aten_handler)
        kwarg_overrides[aten_handler.uid] = aten_extra_kwargs
-    if use_triton_template(layout, check_max_autotune=False):
+    if use_triton_template(layout, check_max_autotune=False) and (
+        out_dtype is None or out_dtype == mat1.get_dtype()
+    ):
        # TODO: add out_dtype support for Triton Template
-        assert out_dtype is None, "out_dtype is not supported for Triton"
        templates_to_use.append(bmm_template)
    # Single unified call for all templates