[hop][BE] add util diff_meta with prettier error message. (#142162)

The error message changes from:
```python
-torch._dynamo.exc.Unsupported: Expected branches to return tensors with same metadata. [(tensor_pair, difference)...]:[('pair0:', TensorMetadata(shape=torch.Size([4, 3]), dtype=torch.float32, requires_grad=False, stride=(3, 1), memory_format=None, is_quantized=False, qparams={}), TensorMetadata(shape=torch.Size([2, 3]), dtype=torch.float32, requires_grad=False, stride=(3, 1), memory_format=None, is_quantized=False, qparams={}))]
```
to
```python
+torch._dynamo.exc.Unsupported: Expect branches to return tensors with same metadata but find pair[0] differ in 'shape', where lhs is TensorMetadata(shape=torch.Size([4, 3]), dtype=torch.float32, requires_grad=False, stride=(3, 1), memory_format=None, is_quantized=False, qparams={}) and rhs is TensorMetadata(shape=torch.Size([2, 3]), dtype=torch.float32, requires_grad=False, stride=(3, 1), memory_format=None, is_quantized=False, qparams={})
```
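
For context, the improved message can be reproduced with the test case added in this PR; the sketch below mirrors that test (the branch shapes `[4, 3]` vs. `[2, 3]` come from concatenating the input with itself vs. leaving it unchanged):

```python
# Minimal repro mirroring the test added in this PR: the two branches of
# torch.cond return tensors of different shapes, which Dynamo rejects with
# the improved "pair[0] differ in 'shape'" message.
import torch

def output_mismatch_test(x):
    def true_fn():
        return torch.concat([x, x])  # shape [4, 3]

    def false_fn():
        return x.sin()  # shape [2, 3]

    return torch.cond(x.sum() > 0, true_fn, false_fn)

x = torch.randn(2, 3)
torch.compile(output_mismatch_test)(x)  # raises torch._dynamo.exc.UncapturedHigherOrderOpError
```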

Pull Request resolved: https://github.com/pytorch/pytorch/pull/142162
Approved by: https://github.com/zou3519
Yidi Wu 2024-12-06 10:38:50 -08:00 committed by PyTorch MergeBot
parent 9ced54a51a
commit 7111cd6ee0
3 changed files with 74 additions and 18 deletions


@@ -6957,6 +6957,23 @@ class ActivationCheckpointingTests(torch._dynamo.test_case.TestCase):
         with self.assertRaises(AssertionError):
             opt_test(True, False, inp)
 
+    def test_cond_with_mismatched_output(self):
+        def output_mismatch_test(x):
+            def true_fn():
+                return torch.concat([x, x])
+
+            def false_fn():
+                return x.sin()
+
+            return torch.cond(x.sum() > 0, true_fn, false_fn)
+
+        x = torch.randn(2, 3)
+        with self.assertRaises(torch._dynamo.exc.UncapturedHigherOrderOpError):
+            output_mismatch_test(x)
+
+        with self.assertRaises(torch._dynamo.exc.UncapturedHigherOrderOpError):
+            torch.compile(output_mismatch_test)(x)
+
     def test_non_aliasing_util(self):
         from torch._dynamo.variables.higher_order_ops import _assert_tensors_nonaliasing


@@ -82,6 +82,34 @@ def discard_graph_changes(tx):
         ctx.__exit__(None, None, None)
 
 
+def diff_meta(tensor_vars1, tensor_vars2) -> str:
+    from torch._higher_order_ops.utils import diff_tensor_meta
+
+    from . import TensorVariable
+
+    assert all(isinstance(var, TensorVariable) for var in tensor_vars1 + tensor_vars2)
+    all_diffs = []
+    for i, (var1, var2) in enumerate(zip(tensor_vars1, tensor_vars2)):
+        # We have vmap x cond tests and querying is_contiguous inside of vmap for
+        # memory_format other than torch.contiguous_format is not yet implemented.
+        # And it seems the remaining metas are good enough for now.
+        meta1 = _extract_tensor_metadata(
+            var1.proxy.node.meta["example_value"], include_contiguity=False
+        )
+        meta2 = _extract_tensor_metadata(
+            var2.proxy.node.meta["example_value"], include_contiguity=False
+        )
+        # We cannot get accurate require_grad. See Note [invariants for node meta 'val']
+        pair_diffs = diff_tensor_meta(meta1, meta2, check_grad=False)
+        if len(pair_diffs) > 0:
+            fmt_str = ", ".join(pair_diffs)
+            all_diffs.append(
+                f"pair[{i}] differ in {fmt_str}, where lhs is {meta1} and rhs is {meta2}"
+            )
+    return "\n".join(all_diffs)
+
+
 @contextlib.contextmanager
 def dynamo_enable_grad(tx: "InstructionTranslator", enable=True):
     from . import GradModeVariable
@@ -888,28 +916,11 @@ class CondHigherOrderVariable(TorchHigherOrderOperatorVariable):
         if not same_treespec.as_python_constant():
             unimplemented("Expected branches to return the same pytree structure.")
 
-        def diff_meta(tensor_vars1, tensor_vars2):
-            assert all(
-                isinstance(var, TensorVariable) for var in tensor_vars1 + tensor_vars2
-            )
-            all_diffs = []
-            for i, (var1, var2) in enumerate(zip(tensor_vars1, tensor_vars2)):
-                # We check the meta data associated with meta["example_value"]
-                meta1 = _extract_tensor_metadata(
-                    var1.proxy.node.meta["example_value"], include_contiguity=False
-                )
-                meta2 = _extract_tensor_metadata(
-                    var2.proxy.node.meta["example_value"], include_contiguity=False
-                )
-                if meta1 != meta2:
-                    all_diffs.append((f"pair{i}:", meta1, meta2))
-            return all_diffs
-
         if diffs := diff_meta(
             true_r.unpack_var_sequence(tx), false_r.unpack_var_sequence(tx)
         ):
             unimplemented(
-                f"Expected branches to return tensors with same metadata. [(tensor_pair, difference)...]:{diffs}"
+                f"Expect branches to return tensors with same metadata but find {diffs}"
             )
 
         (
@@ -1119,6 +1130,12 @@ class WhileLoopHigherOrderVariable(TorchHigherOrderOperatorVariable):
             set_subgraph_inputs="flatten_manual",
             should_flatten_outputs=True,
         )
+
+        if diffs := diff_meta(operands_seq, body_r.unpack_var_sequence(tx)):
+            unimplemented(
+                f"Expected carried_inputs and body outputs return tensors with same metadata but find:\n{diffs}"
+            )
+
         (
             cond_graph,
             body_graph,


@@ -9,6 +9,7 @@ import torch.fx.traceback as fx_traceback
 import torch.utils._pytree as pytree
 from torch._ops import OperatorBase
 from torch.fx.experimental.proxy_tensor import make_fx
+from torch.fx.passes.shape_prop import TensorMetadata
 from torch.multiprocessing.reductions import StorageWeakRef
@@ -481,6 +482,27 @@ def first_slice_copy(t: torch.Tensor, dim: int = 0) -> torch.Tensor:
     return torch.select_copy(t, dim, 0)
 
 
+# Reports the difference between meta of two tensors in a string
+def diff_tensor_meta(
+    meta1: TensorMetadata, meta2: TensorMetadata, check_grad=True
+) -> List[str]:
+    from torch.fx.experimental.symbolic_shapes import GuardOnDataDependentSymNode
+
+    pair_diffs = []
+    for meta_name in TensorMetadata._fields:
+        if not check_grad and meta_name == "requires_grad":
+            continue
+        val1 = getattr(meta1, meta_name)
+        val2 = getattr(meta2, meta_name)
+        try:
+            if val1 != val2:
+                pair_diffs.append(f"'{meta_name}'")
+        except GuardOnDataDependentSymNode as _:
+            pair_diffs.append(f"'{meta_name}'")
+            continue
+    return pair_diffs
+
+
 # Note [lifted arg types in hop]
 # For dynamoed hops, we automatically lift the free symbols in tensors as arguments.
 # This has implications for the types of lifted args for different dispatch keys:
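
Outside the hop code paths, the new `diff_tensor_meta` helper can also be exercised on its own. A minimal sketch, constructing the `TensorMetadata` values by hand purely for illustration (the real callers extract them from node `meta["example_value"]` instead):

```python
# Illustrative sketch only: diff two hand-built TensorMetadata values with the
# new helper; the field values are copied from the error message above.
import torch
from torch.fx.passes.shape_prop import TensorMetadata
from torch._higher_order_ops.utils import diff_tensor_meta

lhs = TensorMetadata(
    shape=torch.Size([4, 3]), dtype=torch.float32, requires_grad=False,
    stride=(3, 1), memory_format=None, is_quantized=False, qparams={},
)
rhs = TensorMetadata(
    shape=torch.Size([2, 3]), dtype=torch.float32, requires_grad=False,
    stride=(3, 1), memory_format=None, is_quantized=False, qparams={},
)
print(diff_tensor_meta(lhs, rhs, check_grad=False))  # ["'shape'"]
```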