[torchfuzz] make pointwise subclasses defined torch_op_name (#166220)

Pull Request resolved: https://github.com/pytorch/pytorch/pull/166220 Approved by: https://github.com/pianpwk ghstack dependencies: #166187, #166188
2025-12-06 12:20:52 +01:00 · 2025-10-27 13:34:15 -07:00 · 2025-10-27 13:34:15 -07:00 · f2450798cd
commit f2450798cd
parent 46d17e8871
2 changed files with 47 additions and 36 deletions
--- a/tools/experimental/torchfuzz/operators/matrix_multiply.py
+++ b/tools/experimental/torchfuzz/operators/matrix_multiply.py
@ -15,14 +15,8 @@ from torchfuzz.tensor_fuzzer import Spec, TensorSpec
 class MatrixMultiplyOperator(Operator):
    """Base class for matrix multiplication operations."""
-    def __init__(self, name: str, torch_op: str):
+    def __init__(self, name: str):
        super().__init__(name)
        self._torch_op = torch_op
    @property
    def torch_op_name(self) -> Optional[str]:
        """Return the torch operation name."""
        return self._torch_op
    def can_produce(self, output_spec: Spec) -> bool:
        """Matrix multiply operations can produce float/complex tensors of dimension >= 2."""
@ -47,12 +41,6 @@ class MatrixMultiplyOperator(Operator):
    def _get_compatible_dtype(self, output_dtype):
        """Get a compatible dtype for matrix multiplication."""
        # For matrix multiplication, we need to be flexible with input dtypes
        # since earlier operations may have performed type promotion.
        # We'll let the fuzzer generate whatever dtypes result from earlier operations
        # and rely on the operation graph to ensure compatibility.
        # Return the output dtype as a starting point, but this may be overridden
        # by the actual tensor specs generated by the fuzzer.
        return [output_dtype, output_dtype]
@ -60,9 +48,14 @@ class MMOperator(MatrixMultiplyOperator):
    """Operator for matrix multiplication (torch.mm)."""
    def __init__(self):
-        super().__init__("mm", "torch.mm")
+        super().__init__("mm")
        self.weight = 5.0
    @property
    def torch_op_name(self) -> Optional[str]:
        """Return the torch operation name."""
        return "torch.mm"
    def can_produce(self, output_spec: Spec) -> bool:
        """MM requires exactly 2D tensors."""
        if not isinstance(output_spec, TensorSpec):
@ -96,7 +89,6 @@ class MMOperator(MatrixMultiplyOperator):
        # Choose a random inner dimension k
        k = random.randint(1, 16)
        # Get compatible dtypes
        dtypes = self._get_compatible_dtype(output_spec.dtype)
        # First tensor: [m, k]
@ -141,9 +133,14 @@ class AddmmOperator(MatrixMultiplyOperator):
    """Operator for additive matrix multiplication (torch.addmm)."""
    def __init__(self):
-        super().__init__("addmm", "torch.addmm")
+        super().__init__("addmm")
        self.weight = 5.0
    @property
    def torch_op_name(self) -> Optional[str]:
        """Return the torch operation name."""
        return "torch.addmm"
    def can_produce(self, output_spec: Spec) -> bool:
        """Addmm requires exactly 2D tensors."""
        if not isinstance(output_spec, TensorSpec):
@ -177,7 +174,6 @@ class AddmmOperator(MatrixMultiplyOperator):
        # Choose a random inner dimension k
        k = random.randint(1, 16)
        # Get compatible dtypes
        dtypes = self._get_compatible_dtype(output_spec.dtype)
        # Bias tensor: [m, n] (same shape as output)
@ -230,9 +226,14 @@ class BmmOperator(MatrixMultiplyOperator):
    """Operator for batch matrix multiplication (torch.bmm)."""
    def __init__(self):
-        super().__init__("bmm", "torch.bmm")
+        super().__init__("bmm")
        self.weight = 5.0
    @property
    def torch_op_name(self) -> Optional[str]:
        """Return the torch operation name."""
        return "torch.bmm"
    def can_produce(self, output_spec: Spec) -> bool:
        """Batch matrix multiply requires 3D tensors."""
        if not isinstance(output_spec, TensorSpec):
@ -266,7 +267,6 @@ class BmmOperator(MatrixMultiplyOperator):
        # Choose a random inner dimension k
        k = random.randint(1, 16)
        # Get compatible dtypes
        dtypes = self._get_compatible_dtype(output_spec.dtype)
        # First tensor: [b, m, k]
@ -311,9 +311,14 @@ class MatmulOperator(MatrixMultiplyOperator):
    """Operator for general matrix multiplication (torch.matmul)."""
    def __init__(self):
-        super().__init__("matmul", "torch.matmul")
+        super().__init__("matmul")
        self.weight = 500.0
    @property
    def torch_op_name(self) -> Optional[str]:
        """Return the torch operation name."""
        return "torch.matmul"
    def can_produce(self, output_spec: Spec) -> bool:
        """Matmul can handle various tensor dimensions >= 1."""
        if not isinstance(output_spec, TensorSpec):
@ -343,7 +348,6 @@ class MatmulOperator(MatrixMultiplyOperator):
        output_size = output_spec.size
        output_dims = len(output_size)
        # Get compatible dtypes
        dtypes = self._get_compatible_dtype(output_spec.dtype)
        if output_dims == 1:
--- a/tools/experimental/torchfuzz/operators/tensor_pointwise.py
+++ b/tools/experimental/torchfuzz/operators/tensor_pointwise.py
@ -1,7 +1,6 @@
 """Tensor pointwise operator implementation."""
 import random
 from typing import Optional
 import torch
@ -17,16 +16,10 @@ from torchfuzz.type_promotion import (
 class PointwiseOperator(Operator):
    """Base class for element-wise pointwise operations."""
-    def __init__(self, name: str, torch_op: str, symbol: str):
+    def __init__(self, name: str, symbol: str):
        super().__init__(name)
        self._torch_op = torch_op
        self.symbol = symbol
    @property
    def torch_op_name(self) -> Optional[str]:
        """Return the torch operation name."""
        return self._torch_op
    def can_produce(self, output_spec: Spec) -> bool:
        """Tensor pointwise operations can produce tensors but not scalars."""
        if isinstance(output_spec, TensorSpec) and output_spec.dtype == torch.bool:
@ -74,9 +67,7 @@ class PointwiseOperator(Operator):
    ) -> str:
        """Generate code for pointwise operation."""
        if len(input_names) == 2:
-            return (
+            return f"{output_name} = {self.torch_op_name}({input_names[0]}, {input_names[1]})"
                f"{output_name} = {self._torch_op}({input_names[0]}, {input_names[1]})"
            )
        else:
            # Chain operations using symbols for readability
            expr = f" {self.symbol} ".join(input_names)
@ -87,26 +78,42 @@ class AddOperator(PointwiseOperator):
    """Operator for element-wise addition."""
    def __init__(self, weight: float = 1.0):
-        super().__init__("add", "torch.add", "+")
+        super().__init__("add", "+")
        self.weight = float(weight)
    @property
    def torch_op_name(self) -> str:
        return "torch.add"
 class MulOperator(PointwiseOperator):
    """Operator for element-wise multiplication."""
    def __init__(self):
-        super().__init__("mul", "torch.mul", "*")
+        super().__init__("mul", "*")
    @property
    def torch_op_name(self) -> str:
        return "torch.mul"
 class SubOperator(PointwiseOperator):
    """Operator for element-wise subtraction."""
    def __init__(self):
-        super().__init__("sub", "torch.sub", "-")
+        super().__init__("sub", "-")
    @property
    def torch_op_name(self) -> str:
        return "torch.sub"
 class DivOperator(PointwiseOperator):
    """Operator for element-wise division."""
    def __init__(self):
-        super().__init__("div", "torch.div", "/")
+        super().__init__("div", "/")
    @property
    def torch_op_name(self) -> str:
        return "torch.div"