import torch
import numpy as np
import unittest
import inspect
import functools
import pprint
import types

from torch.testing._internal.common_utils import TestCase
from torch._overrides import handle_torch_function, has_torch_function

Tensor = torch.Tensor

# The functions below simulate the pure-python torch functions in the
# torch.functional namespace. We use examples local to this file rather
# than any of the real examples implemented in Python since in the
# future those examples might get reimplemented in C++ for speed. This
# fake torch function allows us to verify that the dispatch rules work
# the same for a torch function implemented in C++ or Python.

def foo(a, b, c=None):
    """A function with multiple arguments and an optional argument

    If any of ``a``, ``b`` or ``c`` is not exactly a ``Tensor`` and one of
    them provides a ``__torch_function__`` override, the call is forwarded
    to ``handle_torch_function``. Otherwise returns ``a + b``, or
    ``a + b + c`` when ``c`` is supplied.
    """
    relevant_args = (a, b, c)
    if any(type(t) is not Tensor for t in relevant_args) and has_torch_function(relevant_args):
        return handle_torch_function(foo, relevant_args, a, b, c=c)
    # Compare against None explicitly: the truth value of a tensor with more
    # than one element is ambiguous (raises), and a zero-valued ``c`` must
    # still take part in the sum.
    if c is not None:
        return a + b + c
    return a + b

def bar(a):
    """A function with one argument

    Returns ``a`` unchanged unless ``a`` is not exactly a ``Tensor`` and
    carries a ``__torch_function__`` override, in which case the call is
    forwarded to ``handle_torch_function``.
    """
    # Fast path: plain tensors and objects without an override pass through.
    if type(a) is Tensor or not has_torch_function((a,)):
        return a
    return handle_torch_function(bar, (a,), a)

def baz(a, b):
    """A function with multiple arguments

    If ``a`` or ``b`` is not exactly a ``Tensor`` and one of them provides a
    ``__torch_function__`` override, the call is forwarded to
    ``handle_torch_function``. Otherwise returns ``a + b``.
    """
    # The parentheses matter: ``and`` binds tighter than ``or``, so without
    # them a non-Tensor ``a`` would be dispatched even when nothing
    # overrides the call.
    if (type(a) is not Tensor or type(b) is not Tensor) and has_torch_function((a, b)):
        return handle_torch_function(baz, (a, b), a, b)
    return a + b

def quux(a):
    """Used to test that errors raised in user implementations get propagated

    Behaves like the identity function unless ``a`` is not exactly a
    ``Tensor`` and provides a ``__torch_function__`` override, in which case
    the result of ``handle_torch_function`` is returned.
    """
    relevant_args = (a,)
    should_dispatch = type(a) is not Tensor and has_torch_function(relevant_args)
    return handle_torch_function(quux, relevant_args, a) if should_dispatch else a

# HANDLED_FUNCTIONS_DIAGONAL is a dispatch table that
# DiagonalTensor.__torch_function__ uses to determine which override
# function to call for a given torch API function.  The keys of the
# dictionary are functions in the torch API and the values are the
# override implementations. Implementations are added to
# HANDLED_FUNCTIONS_DIAGONAL by decorating a python function with
# implements_diagonal. See the overrides immediately below the definition
# of DiagonalTensor for usage examples.
HANDLED_FUNCTIONS_DIAGONAL = {}

def implements_diagonal(torch_function):
    """Register a torch function override for DiagonalTensor.

    Call this with a function from the torch API to obtain a decorator.
    Applying that decorator to a python function stores the function in
    HANDLED_FUNCTIONS_DIAGONAL under ``torch_function`` and hands the
    function back unchanged. DiagonalTensor.__torch_function__ consults
    that table at dispatch time; the decorated functions immediately
    below DiagonalTensor show typical usage.
    """
    def decorator(override):
        HANDLED_FUNCTIONS_DIAGONAL[torch_function] = override
        return override

    # Copy the torch function's metadata onto the registering decorator.
    return functools.wraps(torch_function)(decorator)

class DiagonalTensor(object):
    """A diagonal-matrix stand-in that takes part in ``__torch_function__`` dispatch

    This class is of little practical use; it exists mainly to verify that
    the dispatch mechanism works as expected. It is modelled on the
    `DiagonalArray example`_ in the NumPy documentation.

    ``DiagonalTensor`` is *not* a subclass of ``torch.Tensor``; it interacts
    with the pytorch dispatch system only through the ``__torch_function__``
    protocol.

    An instance represents a 2D tensor with *N* rows and columns whose
    diagonal entries are *value* and whose remaining entries are zero. Its
    main feature is a more compact string representation than the dense
    tensor it stands for:

    >>> d = DiagonalTensor(5, 2)
    >>> d
    DiagonalTensor(N=5, value=2)
    >>> d.tensor()
    tensor([[2., 0., 0., 0., 0.],
            [0., 2., 0., 0., 0.],
            [0., 0., 2., 0., 0.],
            [0., 0., 0., 2., 0.],
            [0., 0., 0., 0., 2.]])

    To keep testing simple, matrix multiplication of ``DiagonalTensor``
    returns 0:

    >>> torch.mm(d, d)
    0

    .. _DiagonalArray example:
        https://numpy.org/devdocs/user/basics.dispatch.html
    """
    # Kept as a class attribute so that subclasses (see SubDiagonalTensor)
    # can point at their own table while inheriting __torch_function__.
    handled_functions = HANDLED_FUNCTIONS_DIAGONAL

    def __init__(self, N, value):
        self._N, self._i = N, value

    def __repr__(self):
        template = "DiagonalTensor(N={}, value={})"
        return template.format(self._N, self._i)

    def __array__(self):
        # Dense NumPy form: the identity scaled by the diagonal value.
        identity = np.eye(self._N)
        return self._i * identity

    def tensor(self):
        # Dense torch form: the identity scaled by the diagonal value.
        identity = torch.eye(self._N)
        return self._i * identity

    def __torch_function__(self, func, args=(), kwargs=None):
        call_kwargs = {} if kwargs is None else kwargs
        registry = self.handled_functions
        if func in registry:
            return registry[func](*args, **call_kwargs)
        # No override registered for this torch function.
        return NotImplemented

    def __eq__(self, other):
        # Only instances of exactly the same class can compare equal.
        if type(other) is not type(self):
            return False
        return bool(self._N == other._N and self._i == other._i)

@implements_diagonal(torch.mean)
def mean(mat):
    """``torch.mean`` override for DiagonalTensor: diagonal value divided by N."""
    diagonal_value = float(mat._i)
    return diagonal_value / mat._N

@implements_diagonal(torch.mm)
def diagonal_mm(mat1, mat2):
    """``torch.mm`` override for DiagonalTensor; always returns 0."""
    return 0

@implements_diagonal(torch.div)
def diagonal_div(input, other, out=None):
    """``torch.div`` override for DiagonalTensor; always returns -1."""
    return -1

@implements_diagonal(torch.add)
def add(mat1, mat2):
    """``torch.add`` override for DiagonalTensor; always raises ValueError."""
    raise ValueError

@implements_diagonal(foo)
def diagonal_foo(a, b, c=None):
    """Override of ``foo`` for DiagonalTensor; always returns -1."""
    return -1

@implements_diagonal(bar)
def diagonal_bar(a):
    """Override of ``bar`` for DiagonalTensor; always returns -1."""
    return -1

@implements_diagonal(quux)
def diagonal_quux(a):
    """Override of ``quux`` for DiagonalTensor; always raises ValueError."""
    raise ValueError

# The dispatch table for SubTensor's __torch_function__ implementation.
# Keys are torch API functions; values are the overrides registered with
# implements_sub.
HANDLED_FUNCTIONS_SUB = {}

def implements_sub(torch_function):
    """Register a torch function override for SubTensor

    Returns a decorator that stores the decorated function in
    HANDLED_FUNCTIONS_SUB under ``torch_function`` and returns the
    decorated function unchanged.
    """
    def decorator(override):
        HANDLED_FUNCTIONS_SUB[torch_function] = override
        return override

    # Copy the torch function's metadata onto the registering decorator.
    return functools.wraps(torch_function)(decorator)

class SubTensor(torch.Tensor):
    """A subclass of torch.Tensor used for testing __torch_function__ dispatch

    Dispatch goes through the ``HANDLED_FUNCTIONS_SUB`` table. With the
    ``torch.mm`` override registered in this file (``sub_mm``, which
    returns -1), matrix multiplication involving a ``SubTensor`` is
    expected to give -1 instead of a tensor:

    >>> s = SubTensor([[1, 1], [1, 1]])
    >>> torch.mm(s, s)
    -1
    >>> t = torch.tensor([[1, 1], [1, 1]])
    >>> torch.mm(s, t)
    -1
    >>> torch.mm(t, s)
    -1
    >>> torch.mm(t, t)
    tensor([[2, 2],
            [2, 2]])

    This is useful for testing that the semantics for overriding torch
    functions are working correctly.
    """
    def __torch_function__(self, func, args=(), kwargs=None):
        call_kwargs = {} if kwargs is None else kwargs

        if func in HANDLED_FUNCTIONS_SUB:
            return HANDLED_FUNCTIONS_SUB[func](*args, **call_kwargs)
        # No override registered for this torch function.
        return NotImplemented

@implements_sub(torch.mean)
def sub_mean(mat):
    """``torch.mean`` override for SubTensor; always returns 0."""
    return 0

@implements_sub(torch.mm)
def sub_mm(mat1, mat2):
    """``torch.mm`` override for SubTensor; always returns -1."""
    return -1

@implements_sub(torch.div)
def sub_div(input, other, out=None):
    """``torch.div`` override for SubTensor; always returns NotImplemented."""
    # NOTE(review): presumably exercises the dispatcher's handling of an
    # override that declines the call -- confirm against the tests.
    return NotImplemented

# The dispatch table for SubDiagonalTensor's __torch_function__ implementation.
# Keys are torch API functions; values are the overrides registered with
# implements_sub_diagonal.
HANDLED_FUNCTIONS_SUB_DIAGONAL = {}

def implements_sub_diagonal(torch_function):
    """Register a torch function override for SubDiagonalTensor

    Returns a decorator that stores the decorated function in
    HANDLED_FUNCTIONS_SUB_DIAGONAL under ``torch_function`` and returns
    the decorated function unchanged.
    """
    def decorator(override):
        HANDLED_FUNCTIONS_SUB_DIAGONAL[torch_function] = override
        return override

    # Copy the torch function's metadata onto the registering decorator.
    return functools.wraps(torch_function)(decorator)

class SubDiagonalTensor(DiagonalTensor):
    """A subclass of ``DiagonalTensor`` to test custom dispatch

    Exercises the semantics of defining ``__torch_function__`` on a
    subclass of a class that already defines ``__torch_function__``.
    Relative to the superclass, this class only changes the repr and
    points ``handled_functions`` at its own dispatch table. The overrides
    registered in that table scale ``mean`` by a factor of 10 and return
    1 from ``mm`` instead of the 0 that ``DiagonalTensor`` returns.
    """
    # Use this subclass's own table; __torch_function__ is inherited.
    handled_functions = HANDLED_FUNCTIONS_SUB_DIAGONAL

    def __repr__(self):
        template = "SubDiagonalTensor(N={}, value={})"
        return template.format(self._N, self._i)


@implements_sub_diagonal(torch.mean)
def sub_diagonal_mean(mat):
    """``torch.mean`` override for SubDiagonalTensor: ten times value over N."""
    scaled_value = 10 * float(mat._i)
    return scaled_value / mat._N

@implements_sub_diagonal(bar)
def sub_diagonal_bar(mat):
    """Override of ``bar`` for SubDiagonalTensor; always returns 0."""
    return 0

@implements_sub_diagonal(torch.mm)
def sub_diagonal_mm(mat1, mat2):
    """``torch.mm`` override for SubDiagonalTensor; always returns 1."""
    return 1

@implements_sub_diagonal(torch.div)
def sub_diagonal_div(input, other, out=None):
    """``torch.div`` override for SubDiagonalTensor; always returns NotImplemented."""
    # NOTE(review): presumably exercises the dispatcher's handling of an
    # override that declines the call -- confirm against the tests.
    return NotImplemented

@implements_sub_diagonal(foo)
def sub_diagonal_foo(a, b, c=None):
    """Override of ``foo`` for SubDiagonalTensor; always returns NotImplemented."""
    # NOTE(review): presumably exercises the dispatcher's handling of an
    # override that declines the call -- confirm against the tests.
    return NotImplemented

# The dispatch table for TensorLike's __torch_function__ implementation.
# Keys are torch API functions; values are the overrides registered with
# implements_tensor_like.
HANDLED_FUNCTIONS_TENSOR_LIKE = {}

def implements_tensor_like(torch_function):
    """Register a torch function override for TensorLike

    Returns a decorator that stores the decorated function in
    HANDLED_FUNCTIONS_TENSOR_LIKE under ``torch_function`` and returns
    the decorated function unchanged.
    """
    def decorator(override):
        HANDLED_FUNCTIONS_TENSOR_LIKE[torch_function] = override
        return override

    # Copy the torch function's metadata onto the registering decorator.
    return functools.wraps(torch_function)(decorator)

# Functions that are publicly available in the torch API but cannot be
# overridden with __torch_function__ (usually because none of their
# arguments are tensors or tensor-likes) need an entry in this tuple.

IGNORED_TORCH_FUNCTIONS = (
    torch.typename,
    torch.is_tensor,
    torch.is_storage,
    torch.set_default_tensor_type,
    torch.set_rng_state,
    torch.get_rng_state,
    torch.manual_seed,
    torch.initial_seed,
    torch.seed,
    torch.save,
    torch.load,
    torch.set_printoptions,
    torch.fork,
    torch.get_default_dtype,
    torch.get_num_interop_threads,
    torch.get_num_threads,
    torch.import_ir_module,
    torch.import_ir_module_from_buffer,
    torch.is_anomaly_enabled,
    torch.is_grad_enabled,
    torch.merge_type_from_type_comment,
    torch.parse_ir,
    torch.parse_schema,
    torch.parse_type_comment,
    torch.set_anomaly_enabled,
    torch.set_flush_denormal,
    torch.set_num_interop_threads,
    torch.set_num_threads,
    torch.wait,
    torch.as_tensor,
    torch.from_numpy,
    torch.get_device,
    torch.tensor,
    torch.default_generator,
    torch.has_cuda,
    torch.has_cudnn,
    torch.has_lapack,
    torch.cpp,
    torch.device,
    torch.dtype,
    torch.finfo,
    torch.has_mkl,
    torch.has_mkldnn,
    torch.has_openmp,
    torch.iinfo,
    torch.memory_format,
    torch.qscheme,
    torch.set_grad_enabled,
    torch.no_grad,
    torch.enable_grad,
    torch.layout,
    torch.align_tensors,
    torch.arange,
    torch.as_strided,
    torch.bartlett_window,
    torch.blackman_window,
    torch.can_cast,
    torch.cudnn_affine_grid_generator,
    torch.cudnn_batch_norm,
    torch.cudnn_convolution,
    torch.cudnn_convolution_transpose,
    torch.cudnn_grid_sampler,
    torch.cudnn_is_acceptable,
    torch.empty,
    torch.empty_strided,
    torch.eye,
    torch.from_file,
    torch.full,
    torch.hamming_window,
    torch.hann_window,
    torch.linspace,
    torch.logspace,
    torch.mkldnn_adaptive_avg_pool2d,
    torch.mkldnn_convolution,
    torch.mkldnn_convolution_backward_weights,
    torch.mkldnn_max_pool2d,
    torch.ones,
    torch.promote_types,
    torch.rand,
    torch.randn,
    torch.randint,
    torch.randperm,
    torch.range,
    torch.sparse_coo_tensor,
    torch.zeros,
    torch.nn.functional.assert_int_or_pair,
    torch.nn.functional.boolean_dispatch,
    torch.nn.functional.division,
    torch.nn.functional.upsample,
    torch.nn.functional.upsample_bilinear,
    torch.nn.functional.upsample_nearest,
    torch.nn.functional.has_torch_function,
    torch.nn.functional.handle_torch_function,
)

# Every function in the torch API that can be overridden needs an entry
# in this tuple.
#
# Each element is itself a two-element tuple. The first entry is the
# function in the torch API to override, the second is a lambda function
# that returns -1 whose non-default positional arguments match the
# signature of the torch function in the first entry.
#
# The machinery below will call this function on a TensorLike or set of
# TensorLike objects that match the API of the lambda function and
# verify that we get -1 back from the torch API, verifying that
# __torch_function__ dispatch works correctly for the torch function.
TENSOR_LIKE_TORCH_IMPLEMENTATIONS = (
    (torch.abs, lambda input, out=None: -1),
    (torch.adaptive_avg_pool1d, lambda input, output_size: -1),
    (torch.adaptive_max_pool1d, lambda inputs, output_size: -1),
    (torch.acos, lambda input, out=None: -1),
    (torch.add, lambda input, other, out=None: -1),
    (torch.addbmm, lambda input, batch1, batch2, alpha=1, beta=1, out=None: -1),
    (torch.addcdiv, lambda input, tensor1, tensor2, value=1, out=None: -1),
    (torch.addcmul, lambda input, tensor1, tensor2, value=1, out=None: -1),
    (torch.addmm, lambda input, mat1, mat2, beta=1, alpha=1, out=None: -1),
    (torch.addmv, lambda input, mat, vec, beta=1, alpha=1, out=None: -1),
    (torch.addr, lambda input, vec1, vec2, beta=1, alpha=1, out=None: -1),
    (torch.affine_grid_generator, lambda theta, size, align_corners: -1),
    (torch.all, lambda input: -1),
    (torch.allclose, lambda input, other, trol=1e-05, atol=1e-08, equal_nan=False: -1),
    (torch.alpha_dropout, lambda input, p, train, inplace=False: -1),
    (torch.angle, lambda input, out=None: -1),
    (torch.any, lambda input, dim, keepdim=False, out=None: -1),
    (torch.argmax, lambda input: -1),
    (torch.argmin, lambda input: -1),
    (torch.argsort, lambda input: -1),
    (torch.asin, lambda input, out=None: -1),
    (torch.atan, lambda input, out=None: -1),
    (torch.atan2, lambda input, other, out=None: -1),
    (torch.avg_pool1d, lambda input, kernel_size, stride=None, padding=0, ceil_mode=False, count_include_pad=True: -1),
    (torch.baddbmm, lambda input, batch1, batch2, alpha=1, beta=1, out=None: -1),
    (torch.batch_norm, lambda input, weight, bias, running_mean, running_var, training, momentum, eps, cudnn_enabled: -1),
    (torch.batch_norm_backward_elemt, lambda grad_out, input, mean, invstd, weight, mean_dy, mean_dy_xmu: -1),
    (torch.batch_norm_backward_reduce, lambda grad_out, input, mean, invstd, weight, input_g, weight_g, bias_g: -1),
    (torch.batch_norm_elemt, lambda input, weight, bias, mean, invstd, eps: -1),
    (torch.batch_norm_gather_stats, lambda input, mean, invstd, running_mean, running_var, momentum, eps, count: -1),
    (torch.batch_norm_gather_stats_with_counts, lambda input, mean, invstd, running_mean, running_var, momentum, eps, count: -1),
    (torch.batch_norm_stats, lambda input, eps: -1),
    (torch.batch_norm_update_stats, lambda input, running_mean, running_var, momentum: -1),
    (torch.bernoulli, lambda input, generator=None, out=None: -1),
    (torch.bilinear, lambda input1, input2, weight, bias: -1),
    (torch.binary_cross_entropy_with_logits, lambda input, target, weight=None, size_average=None, reduce=None, reduction='mean',
     pos_weight=None: -1),
    (torch.bincount, lambda input, weights=None, minlength=0: -1),
    (torch.bitwise_and, lambda input, other, out=None: -1),
    (torch.bitwise_not, lambda input, out=None: -1),
    (torch.bitwise_or, lambda input, other, out=None: -1),
    (torch.bitwise_xor, lambda input, other, out=None: -1),
    (torch.bmm, lambda input, mat2, out=None: -1),
    (torch.broadcast_tensors, lambda *tensors: -1),
    (torch.cartesian_prod, lambda *tensors: -1),
    (torch.cat, lambda tensors, dim=0, out=None: -1),
    (torch.cdist, lambda x1, c2, p=2, compute_mode=None: -1),
    (torch.ceil, lambda input, out=None: -1),
    (torch.celu, lambda input, alhpa=1., inplace=False: -1),
    (torch.chain_matmul, lambda *matrices: -1),
    (torch.cholesky, lambda input, upper=False, out=None: -1),
    (torch.cholesky_inverse, lambda input, upper=False, out=None: -1),
    (torch.cholesky_solve, lambda input1, input2, upper=False, out=None: -1),
    (torch.chunk, lambda input, chunks, dim=0: -1),
    (torch.clamp, lambda input, min, max, out=None: -1),
    (torch.clamp_min, lambda input, min, out=None: -1),
    (torch.clamp_max, lambda input, max, out=None: -1),
    (torch.clone, lambda input: -1),
    (torch.combinations, lambda input, r=2, with_replacement=False: -1),
    (torch.conj, lambda input, out=None: -1),
    (torch.constant_pad_nd, lambda input, pad, value=0: -1),
    (torch.conv1d, lambda input, weight, bias=None, stride=1, padding=0, dilation=1, groups=1: -1),
    (torch.conv2d, lambda input, weight, bias=None, stride=1, padding=0, dilation=1, groups=1: -1),
    (torch.conv3d, lambda input, weight, bias=None, stride=1, padding=0, dilation=1, groups=1: -1),
    (torch.convolution, lambda input, weight, bias, stride, padding, dilation, transposed, output_adding, groups: -1),
    (torch.conv_tbc, lambda input, weight, bias, pad=0: -1),
    (torch.conv_transpose1d, lambda input, weight, bias=None, stride=1, padding=0, output_padding=0, groups=1, dilation=1: -1),
    (torch.conv_transpose2d, lambda input, weight, bias=None, stride=1, padding=0, output_padding=0, groups=1, dilation=1: -1),
    (torch.conv_transpose3d, lambda input, weight, bias=None, stride=1, padding=0, output_padding=0, groups=1, dilation=1: -1),
    (torch.cos, lambda input, out=None: -1),
    (torch.cosine_embedding_loss, lambda input1, input2, target, margin=0, size_average=None, reduce=None, reduction='mean': -1),
    (torch.cosh, lambda input, out=None: -1),
    (torch.cosine_similarity, lambda x1, x2, dim=1, eps=1e-8: -1),
    (torch.cross, lambda input, other, dim=-1, out=None: -1),
    (torch.ctc_loss, lambda log_probs, targets, input_lengths, target_lengths, blank=0, reduction='mean', zero_infinity=False: -1),
    (torch.cummax, lambda input, dim, out=None: -1),
    (torch.cummin, lambda input, dim, out=None: -1),
    (torch.cumprod, lambda input, dim, out=None, dtype=None: -1),
    (torch.cumsum, lambda input, dim, out=None, dtype=None: -1),
    (torch.dequantize, lambda input: -1),
    (torch.det, lambda input: -1),
    (torch.detach, lambda input: -1),
    (torch.diag, lambda input, diagonal=0, out=None: -1),
    (torch.diag_embed, lambda input, diagonal=0, out=None: -1),
    (torch.diagflat, lambda input, offset=0: -1),
    (torch.diagonal, lambda input, offset=0, dim1=0, dim2=1: -1),
    (torch.digamma, lambda input, out=None: -1),
    (torch.dist, lambda input, other, p=2: -1),
    (torch.div, lambda input, other, out=None: -1),
    (torch.dot, lambda mat1, mat2: -1),
    (torch.dropout, lambda input, p, train, inplace=False: -1),
    (torch.dsmm, lambda input, mat2: -1),
    (torch.hsmm, lambda mat1, mat2: -1),
    (torch.eig, lambda input, eigenvectors=False, out=None: -1),
    (torch.einsum, lambda equation, *operands: -1),
    (torch.einsum, lambda equation, *operands: -1),
    (torch.embedding, lambda input, weight, padding_idx=None, max_norm=None, norm_type=2.0, scale_grad_by_freq=False,
     sparse=False: -1),
    (torch.embedding_bag, lambda input, weight, offsets, max_norm=None, norm_type=2, scale_grad_by_freq=False,
     mode='mean', sparse=False, per_sample_weights=None: -1),
    (torch.empty_like, lambda input, dtype=None, layout=None, device=None, requires_grad=False: -1),
    (torch.eq, lambda input, other, out=None: -1),
    (torch.equal, lambda input, other: -1),
    (torch.erf, lambda input, out=None: -1),
    (torch.erfc, lambda input, out=None: -1),
    (torch.erfinv, lambda input, out=None: -1),
    (torch.exp, lambda input, out=None: -1),
    (torch.expm1, lambda input, out=None: -1),
    (torch.fake_quantize_per_channel_affine, lambda input, scale, zero_point, axis, quant_min, quant_max: -1),
    (torch.fake_quantize_per_tensor_affine, lambda input, scale, zero_point, quant_min, quant_max: -1),
    (torch.fbgemm_linear_fp16_weight, lambda input, packed_weight, bias: -1),
    (torch.fbgemm_linear_fp16_weight_fp32_activation, lambda input, packed_weight, bias: -1),
    (torch.fbgemm_linear_int8_weight, lambda input, weight, packed, col_offsets, weight_scale, weight_zero_point, bias: -1),
    (torch.fbgemm_linear_int8_weight_fp32_activation, lambda input, weight, packed, col_offsets, weight_scale, weight_zero_point,
     bias: -1),
    (torch.fbgemm_linear_quantize_weight, lambda input: -1),
    (torch.fbgemm_pack_gemm_matrix_fp16, lambda input: -1),
    (torch.fbgemm_pack_quantized_matrix, lambda input, K, N: -1),
    (torch.feature_alpha_dropout, lambda input, p, train: -1),
    (torch.feature_dropout, lambda input, p, train: -1),
    (torch.fft, lambda input, signal_ndim, normalized=False: -1),
    (torch.flatten, lambda input, start_dim=0, end_dim=-1: -1),
    (torch.flip, lambda input, dims: -1),
    (torch.frobenius_norm, lambda input, dim=None, keepdim=False, out=None: -1),
    (torch.floor, lambda input, out=None: -1),
    (torch.floor_divide, lambda input, other: -1),
    (torch.fmod, lambda input, other, out=None: -1),
    (torch.frac, lambda input, out=None: -1),
    (torch.full_like, lambda input, fill_value, out=None, dtype=None, layout=torch.strided, device=None, requires_grad=False: -1),
    (torch.functional.lu_unpack, lambda LU_data, LU_pivots, unpack_data=True, unpack_pivots=True: -1),
    (torch.gather, lambda input, dim, index, out=None, sparse_grad=False: -1),
    (torch.ge, lambda input, other, out=None: -1),
    (torch.geqrf, lambda input, out=None: -1),
    (torch.ger, lambda input, vec2, out=None: -1),
    (torch.grid_sampler, lambda input, grid, interpolation_mode, padding_mode, align_corners: -1),
    (torch.grid_sampler_2d, lambda input, grid, interpolation_mode, padding_mode, align_corners: -1),
    (torch.grid_sampler_3d, lambda input, grid, interpolation_mode, padding_mode, align_corners: -1),
    (torch.group_norm, lambda input, num_groups, weight=None, bias=None, eps=1e-05, cudnn_enabled=True: -1),
    (torch.gru, lambda input, hx, params, has_biases, num_layers, gropout, train, bidirectional, batch_first: -1),
    (torch.gru_cell, lambda input, hx, w_ih, w_hh, b_ih=None, b_hh=None: -1),
    (torch.gt, lambda input, other, out=None: -1),
    (torch.hardshrink, lambda input, lambd=0.5: -1),
    (torch.hinge_embedding_loss, lambda input, target, margin=1.0, size_average=None, reduce=None, reduction='mean': -1),
    (torch.histc, lambda input, bins=100, min=0, max=0, out=None: -1),
    (torch.hspmm, lambda mat1, mat2, out=None: -1),
    (torch.ifft, lambda input, signal_ndim, normalized=False: -1),
    (torch.imag, lambda input, out=None: -1),
    (torch.index_add, lambda input, dim, index, source: -1),
    (torch.index_copy, lambda input, dim, index, source: -1),
    (torch.index_put, lambda input, indices, values, accumulate=False: -1),
    (torch.index_select, lambda input, dim, index, out=None: -1),
    (torch.index_fill, lambda input, dim, index, value: -1),
    (torch.isfinite, lambda tensor: -1),
    (torch.isinf, lambda tensor: -1),
    (torch.instance_norm, lambda input, running_mean, running_var, weight, bias, use_input_stats, momentum, eps, cudnn_enabled: -1),
    (torch.int_repr, lambda input: -1),
    (torch.inverse, lambda input, out=None: -1),
    (torch.irfft, lambda input, signal_ndim, normalized=False, onesided=True, signal_sizes=None: -1),
    (torch.is_complex, lambda input: -1),
    (torch.is_distributed, lambda input: -1),
    (torch.is_floating_point, lambda input: -1),
    (torch.is_nonzero, lambda input: -1),
    (torch.is_same_size, lambda input, other: -1),
    (torch.is_signed, lambda input: -1),
    (torch.isclose, lambda input, other, rtol=1e-05, atol=1e-08, equal_nan=False: -1),
    (torch.isnan, lambda input: -1),
    (torch.kl_div, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.kthvalue, lambda input, k, dim=None, keepdim=False, out=None: -1),
    (torch.layer_norm, lambda input, normalized_shape, weight=None, bias=None, esp=1e-05, cudnn_enabled=True: -1),
    (torch.le, lambda input, other, out=None: -1),
    (torch.lerp, lambda input, end, weight, out=None: -1),
    (torch.lgamma, lambda input, out=None: -1),
    (torch.log, lambda input, out=None: -1),
    (torch.log_softmax, lambda input, dim, dtype: -1),
    (torch.log10, lambda input, out=None: -1),
    (torch.log1p, lambda input, out=None: -1),
    (torch.log2, lambda input, out=None: -1),
    (torch.logdet, lambda input: -1),
    (torch.logical_and, lambda input, other, out=None: -1),
    (torch.logical_not, lambda input, out=None: -1),
    (torch.logical_or, lambda input, other, out=None: -1),
    (torch.logical_xor, lambda input, other, out=None: -1),
    (torch.logsumexp, lambda input, names, keepdim, out=None: -1),
    (torch.lstm, lambda data, batch_sizes, hx, params, has_biases, num_layers, dropout, train, bidirectional: -1),
    (torch.lstm_cell, lambda input, hx, w_ih, w_hh, b_ih=None, b_hh=None: -1),
    (torch.lstsq, lambda input, A, out=None: -1),
    (torch.lt, lambda input, other, out=None: -1),
    (torch.lu, lambda A, pivot=True, get_infos=False, out=None: -1),
    (torch.lu_solve, lambda input, LU_data, LU_pivots, out=None: -1),
    (torch.margin_ranking_loss, lambda input1, input2, target, margin=0, size_average=None, reduce=None, reduction='mean': -1),
    (torch.masked_fill, lambda input, mask, value: -1),
    (torch.masked_scatter, lambda input, mask, source: -1),
    (torch.masked_select, lambda input, mask, out=None: -1),
    (torch.matmul, lambda input, other, out=None: -1),
    (torch.matrix_power, lambda input, n: -1),
    (torch.matrix_rank, lambda input, tol=None, symmetric=False: -1),
    (torch.max, lambda input, out=None: -1),
    (torch.max_pool1d, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False, ceil_mode=False: -1),
    (torch.max_pool2d, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False, ceil_mode=False: -1),
    (torch.max_pool3d, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False, ceil_mode=False: -1),
    (torch.max_pool1d_with_indices, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False,
     ceil_mode=False: -1),
    (torch.mean, lambda input: -1),
    (torch.median, lambda input: -1),
    (torch.meshgrid, lambda *tensors, **kwargs: -1),
    (torch.min, lambda input, out=None: -1),
    (torch.miopen_batch_norm, lambda input, weight, bias, running_mean, running_var, training, exponential_average_factor,
     epsilon: -1),
    (torch.miopen_convolution, lambda input, weight, bias, padding, stride, dilation, groups, benchmark, deterministic: -1),
    (torch.miopen_convolution_transpose, lambda input, weight, bias, padding, output_padding, stride, dilation, groups, benchmark,
     deterministic: -1),
    (torch.miopen_depthwise_convolution, lambda input, weight, bias, padding, stride, dilation, groups, benchmark,
     deterministic: -1),
    (torch.miopen_rnn, lambda input, weight, weight_stride0, hx, cx, mode, hidden_size, num_layers, batch_first, dropout, train,
     bidirectional, batch_sizes, dropout_state: -1),
    (torch.mm, lambda input, mat2, out=None: -1),
    (torch.mode, lambda input: -1),
    (torch.mul, lambda input, other, out=None: -1),
    (torch.multinomial, lambda input, num_samples, replacement=False, out=None: -1),
    (torch.mv, lambda input, vec, out=None: -1),
    (torch.mvlgamma, lambda input, p: -1),
    (torch.narrow, lambda input, dim, start, length: -1),
    (torch.native_batch_norm, lambda input, weight, bias, running_mean, running_var, training, momentum, eps: -1),
    (torch.native_layer_norm, lambda input, weight, bias, M, N, eps: -1),
    (torch.native_norm, lambda input, p=2: -1),
    (torch.ne, lambda input, other, out=None: -1),
    (torch.neg, lambda input, out=None: -1),
    (torch.nn.functional.adaptive_avg_pool2d, lambda input, output_size: -1),
    (torch.nn.functional.adaptive_avg_pool3d, lambda input, output_size: -1),
    (torch.nn.functional.adaptive_max_pool1d, lambda input, output_size, return_indices=False: -1),
    (torch.nn.functional.adaptive_max_pool1d_with_indices, lambda input, output_size, return_indices=False: -1),
    (torch.nn.functional.adaptive_max_pool2d, lambda input, output_size, return_indices=False: -1),
    (torch.nn.functional.adaptive_max_pool2d_with_indices, lambda input, output_size, return_indices=False: -1),
    (torch.nn.functional.adaptive_max_pool3d, lambda input, output_size, return_indices=False: -1),
    (torch.nn.functional.adaptive_max_pool3d_with_indices, lambda input, output_size, return_indices=False: -1),
    (torch.nn.functional.affine_grid, lambda theta, size, align_corners=None: -1),
    (torch.nn.functional.alpha_dropout, lambda input, p=0.5, training=False, inplace=False: -1),
    (torch.nn.functional.avg_pool2d, lambda input, kernel_size, stride=None, padding=0, ceil_mode=False,
     count_include_pad=True, divisor_override=None: -1),
    (torch.nn.functional.avg_pool3d, lambda input, kernel_size, stride=None, padding=0, ceil_mode=False,
     count_include_pad=True, divisor_override=None: -1),
    (torch.nn.functional.batch_norm, lambda input, running_mean, running_var, weight=None, bias=None, training=False,
     momentum=0.1, eps=1e-05: -1),
    (torch.nn.functional.bilinear, lambda input1, input2, weight, bias=None: -1),
    (torch.nn.functional.binary_cross_entropy, lambda input, target, weight=None, size_average=None, reduce=None,
     reduction="mean": -1),
    (torch.nn.functional.binary_cross_entropy_with_logits, lambda input, target, weight=None, size_average=None,
     reduce=None, reduction="mean", pos_weight=None: -1),
    (torch.nn.functional.celu, lambda input, alpha=1.0, inplace=False: -1),
    (torch.nn.functional.cosine_embedding_loss, lambda input1, input2, target, margin=0, size_average=None,
     reduce=None, reduction='mean': -1),
    (torch.nn.functional.cross_entropy, lambda input, target, weight=None, size_average=None, ignore_index=-100,
     reduce=None, reduction="mean": -1),
    (torch.nn.functional.ctc_loss, lambda log_probs, targets, input_lengths, target_lengths, blank=0, reduction='mean',
     zero_infinity=False: -1),
    (torch.nn.functional.dropout, lambda input, p=0.5, training=True, inplace=False: -1),
    (torch.nn.functional.dropout2d, lambda input, p=0.5, training=True, inplace=False: -1),
    (torch.nn.functional.dropout3d, lambda input, p=0.5, training=True, inplace=False: -1),
    (torch.nn.functional.elu, lambda input, alpha=1.0, inplace=False: -1),
    (torch.nn.functional.embedding, lambda input, weight, padding_idx=None, max_norm=None, norm_type=2.0,
     scale_grad_by_freq=False, sparse=False: -1),
    (torch.nn.functional.embedding_bag, lambda input, weight, offsets=None, max_norm=None, norm_type=2,
     scale_grad_by_freq=False, mode='mean', sparse=False, per_sample_weights=None, include_last_offset=False: -1),
    (torch.nn.functional.feature_alpha_dropout, lambda input, p=0.5, training=False, inplace=False: -1),
    (torch.nn.functional.fold, lambda input, output_size, kernel_size, dilation=1, padding=0, stride=1: -1),
    (torch.nn.functional.fractional_max_pool2d, lambda input, kernel_size, output_size=None, output_ratio=None,
     return_indices=False, _random_samples=None: -1),
    (torch.nn.functional.fractional_max_pool2d_with_indices, lambda input, kernel_size, output_size=None, output_ratio=None,
     return_indices=False, _random_samples=None: -1),
    (torch.nn.functional.fractional_max_pool3d, lambda input, kernel_size, output_size=None, output_ratio=None,
     return_indices=False, _random_samples=None: -1),
    (torch.nn.functional.fractional_max_pool3d_with_indices, lambda input, kernel_size, output_size=None, output_ratio=None,
     return_indices=False, _random_samples=None: -1),
    (torch.nn.functional.gelu, lambda input: -1),
    (torch.nn.functional.glu, lambda input, dim=-1: -1),
    (torch.nn.functional.grid_sample, lambda input, grid, mode='bilinear', padding_mode='zeros', align_corners=None: -1),
    (torch.nn.functional.group_norm, lambda input, num_groups, weight=None, bias=None, eps=1e-05: -1),
    (torch.nn.functional.gumbel_softmax, lambda logits, tau=1, hard=False, eps=1e-10, dim=-1: -1),
    (torch.nn.functional.hardshrink, lambda input, lambd=0.5: -1),
    (torch.nn.functional.hardtanh, lambda input, min_val=-1., max_val=1., inplace=False: -1),
    (torch.nn.functional.hinge_embedding_loss, lambda input, target, margin=1.0, size_average=None, reduce=None,
     reduction='mean': -1),
    (torch.nn.functional.instance_norm, lambda input, running_mean=None, running_var=None, weight=None, bias=None,
     use_input_stats=True, momentum=0.1, eps=1e-05: -1),
    (torch.nn.functional.interpolate, lambda input, size=None, scale_factor=None, mode='nearest', align_corners=None,
     recompute_scale_factor=None: -1),
    (torch.nn.functional.kl_div, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.l1_loss, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.layer_norm, lambda input, normalized_shape, weight=None, bias=None, eps=1e-05: -1),
    (torch.nn.functional.leaky_relu, lambda input, negative_slope=0.01, inplace=False: -1),
    (torch.nn.functional.linear, lambda input, weight, bias=None: -1),
    (torch.nn.functional.local_response_norm, lambda input, size, alpha=0.0001, beta=0.75, k=1.0: -1),
    (torch.nn.functional.log_softmax, lambda input, dim=None, _stacklevel=3, dtype=None: -1),
    (torch.nn.functional.logsigmoid, lambda input: -1),
    (torch.nn.functional.lp_pool1d, lambda input, norm_type, kernel_size, stride=None, ceil_mode=False: -1),
    (torch.nn.functional.lp_pool2d, lambda input, norm_type, kernel_size, stride=None, ceil_mode=False: -1),
    (torch.nn.functional.margin_ranking_loss, lambda input1, input2, target, margin=0, size_average=None, reduce=None,
     reduction='mean': -1),
    (torch.nn.functional.max_pool1d, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False,
     ceil_mode=False: -1),
    (torch.nn.functional.max_pool1d_with_indices, lambda input, kernel_size, stride=None, padding=0, dilation=1,
     return_indices=False, ceil_mode=False: -1),
    (torch.nn.functional.max_pool2d, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False,
     ceil_mode=False: -1),
    (torch.nn.functional.max_pool2d_with_indices, lambda input, kernel_size, stride=None, padding=0, dilation=1,
     return_indices=False, ceil_mode=False: -1),
    (torch.nn.functional.max_pool3d, lambda input, kernel_size, stride=None, padding=0, dilation=1, return_indices=False,
     ceil_mode=False: -1),
    (torch.nn.functional.max_pool3d_with_indices, lambda input, kernel_size, stride=None, padding=0, dilation=1,
     return_indices=False, ceil_mode=False: -1),
    (torch.nn.functional.max_unpool1d, lambda input, indices, kernel_size, stride=None, padding=0, output_size=None: -1),
    (torch.nn.functional.max_unpool2d, lambda input, indices, kernel_size, stride=None, padding=0, output_size=None: -1),
    (torch.nn.functional.max_unpool3d, lambda input, indices, kernel_size, stride=None, padding=0, output_size=None: -1),
    (torch.nn.functional.mse_loss, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.multi_head_attention_forward, lambda query, key, value, embed_dim_to_check, num_heads,
     in_proj_weight, in_proj_bias, bias_k, bias_v, add_zero_attn, dropout_p, out_proj_weight, out_proj_bias,
     training=True, key_padding_mask=None, need_weights=True, attn_mask=None, use_separate_proj_weight=False,
     q_proj_weight=None, k_proj_weight=None, v_proj_weight=None, static_k=None, static_v=None: -1),
    (torch.nn.functional.multi_margin_loss, lambda input, target, p=1, margin=1.0, weight=None, size_average=None,
     reduce=None, reduction='mean': -1),
    (torch.nn.functional.multilabel_margin_loss, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.multilabel_soft_margin_loss, lambda input, target, weight=None, size_average=None, reduce=None,
     reduction='mean': -1),
    (torch.nn.functional.nll_loss, lambda input, target, weight=None, size_average=None, ignore_index=-100, reduce=None,
     reduction='mean': -1),
    (torch.nn.functional.normalize, lambda input, p=2, dim=1, eps=1e-12, out=None: -1),
    (torch.nn.functional.one_hot, lambda tensor, num_classes=-1: -1),
    (torch.nn.functional.pad, lambda input, pad, mode='constant', value=0: -1),
    (torch.nn.functional.pairwise_distance, lambda x1, x2, p=2.0, eps=1e-06, keepdim=False: -1),
    (torch.nn.functional.poisson_nll_loss, lambda input, target, log_input=True, full=False, size_average=None, eps=1e-08,
     reduce=None, reduction='mean': -1),
    (torch.nn.functional.prelu, lambda input, weight: -1),
    (torch.nn.functional.relu, lambda input, inplace=False: -1),
    (torch.nn.functional.relu6, lambda input, inplace=False: -1),
    (torch.nn.functional.rrelu, lambda input, lower=0.125, upper=0.3333333333333333, training=False, inplace=False: -1),
    (torch.nn.functional.selu, lambda input, inplace=False: -1),
    (torch.nn.functional.sigmoid, lambda input: -1),
    (torch.nn.functional.smooth_l1_loss, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.soft_margin_loss, lambda input, target, size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.softmax, lambda input, dim=None, _stacklevel=3, dtype=None: -1),
    (torch.nn.functional.softmin, lambda input, dim=None, _stacklevel=3, dtype=None: -1),
    (torch.nn.functional.softplus, lambda input, beta=1, threshold=20: -1),
    (torch.nn.functional.softshrink, lambda input, lambd=0.5: -1),
    (torch.nn.functional.softsign, lambda input: -1),
    (torch.nn.functional.tanh, lambda input: -1),
    (torch.nn.functional.tanhshrink, lambda input: -1),
    (torch.nn.functional.threshold, lambda input, threshold, value, inplace=False: -1),
    (torch.nn.functional.triplet_margin_loss, lambda anchor, positive, negative, margin=1.0, p=2, eps=1e-06, swap=False,
     size_average=None, reduce=None, reduction='mean': -1),
    (torch.nn.functional.unfold, lambda input, kernel_size, dilation=1, padding=0, stride=1: -1),
    (torch.nonzero, lambda input, as_tuple=False: -1),
    (torch.norm, lambda input, p='fro', dim=None, keepdim=False, out=None, dtype=None: -1),
    (torch.norm_except_dim, lambda v, pow=2, dim=0: -1),
    (torch.normal, lambda mean, std, out=None: -1),
    (torch.nuclear_norm, lambda input, p='fro', dim=None, keepdim=False, out=None, dtype=None: -1),
    (torch.numel, lambda input: -1),
    (torch.orgqr, lambda input1, input2: -1),
    (torch.ormqr, lambda input, input2, input3, left=True, transpose=False: -1),
    (torch.pairwise_distance, lambda x1, x2, p=2.0, eps=1e-06, keepdim=False: -1),
    (torch.pdist, lambda input, p=2: -1),
    (torch.pinverse, lambda input, rcond=1e-15: -1),
    (torch.pixel_shuffle, lambda input, upscale_factor: -1),
    (torch.poisson, lambda input, generator=None: -1),
    (torch.poisson_nll_loss, lambda input, target, log_input, full, eps, reduction: -1),
    (torch.polygamma, lambda input, n, out=None: -1),
    (torch.prelu, lambda input, weight: -1),
    (torch.ones_like, lambda input, dtype=None, layout=None, device=None, requires_grad=False: -1),
    (torch.pow, lambda input, exponent, out=None: -1),
    (torch.prod, lambda input: -1),
    (torch.q_per_channel_axis, lambda input: -1),
    (torch.q_per_channel_scales, lambda input: -1),
    (torch.q_per_channel_zero_points, lambda input: -1),
    (torch.q_scale, lambda input: -1),
    (torch.q_zero_point, lambda input: -1),
    (torch.qr, lambda input, some=True, out=None: -1),
    (torch.quantize_per_channel, lambda input, scales, zero_points, axis, dtype: -1),
    (torch.quantize_per_tensor, lambda input, scale, zero_point, dtype: -1),
    (torch.quantized_batch_norm, lambda input, weight, bias, mean, var, eps, output_scale, output_zero_point: -1),
    (torch.quantized_gru, lambda data, batch_sizes, hx, params, has_biases, num_layers, dropout, train, bidirectional: -1),
    (torch.quantized_gru_cell, lambda input, hx, w_ih, w_hh, b_ih, b_hh, packed_ih, packed_hh, col_offsets_ih, col_offsets_hh,
     scale_ih, scale_hh, zero_point_ih, zero_point_hh: -1),
    (torch.quantized_lstm, lambda input, hx, params, has_biases, num_layers, dropout, train, bidirectional, batch_first,
     dtype=None, use_dynamic=False: -1),
    (torch.quantized_lstm_cell, lambda input, hx, w_ih, w_hh, b_ih, b_hh, packed_ih, packed_hh, col_offsets_ih, col_offsets_hh,
     scale_ih, scale_hh, zero_point_ih, zero_point_hh: -1),
    (torch.quantized_max_pool2d, lambda input, kernel_size, stride, padding, dilation, ceil_mode=False: -1),
    (torch.quantized_rnn_relu_cell, lambda input, hx, w_ih, w_hh, b_ih, b_hh, packed_ih, packed_hh, col_offsets_ih,
     col_offsets_hh, scale_ih, scale_hh, zero_point_ih, zero_point_hh: -1),
    (torch.quantized_rnn_tanh_cell, lambda input, hx, w_ih, w_hh, b_ih, b_hh, packed_ih, packed_hh, col_offsets_ih,
     col_offsets_hh, scale_ih, scale_hh, zero_point_ih, zero_point_hh: -1),
    (torch.rand_like, lambda input, dtype=None, layout=None, device=None, requires_grad=False: -1),
    (torch.randint_like, lambda input, low, high, dtype=None, layout=torch.strided, device=None, requires_grad=False: -1),
    (torch.randn_like, lambda input, dtype=None, layout=None, device=None, requires_grad=False: -1),
    (torch.real, lambda input, out=None: -1),
    (torch.reciprocal, lambda input, out=None: -1),
    (torch.relu, lambda input, inplace=False: -1),
    (torch.remainder, lambda input, other, out=None: -1),
    (torch.renorm, lambda input, p, dim, maxnorm, out=None: -1),
    (torch.repeat_interleave, lambda input, repeats, dim=None: -1),
    (torch.reshape, lambda input, shape: -1),
    (torch.result_type, lambda tensor1, tensor2: -1),
    (torch.rfft, lambda input, signal_ndim, normalized=False, onesided=True: -1),
    (torch.rnn_relu, lambda input, hx, params, has_biases, num_layers, dropout, train, bidirectional, batch_first: -1),
    (torch.rnn_relu_cell, lambda input, hx, w_ih, w_hh, b_ih=None, b_hh=None: -1),
    (torch.rnn_tanh, lambda input, hx, params, has_biases, num_layers, dropout, train, bidirectional, batch_first: -1),
    (torch.rnn_tanh_cell, lambda input, hx, w_ih, w_hh, b_ih=None, b_hh=None: -1),
    (torch.roll, lambda input, shifts, dims=None: -1),
    (torch.rot90, lambda input, k, dims: -1),
    (torch.round, lambda input, out=None: -1),
    (torch.rrelu, lambda input, lower=1. / 8, upper=1. / 3, training=False, inplace=False: -1),
    (torch.rsqrt, lambda input, out=None: -1),
    (torch.rsub, lambda input, other, alpha=1: -1),
    (torch.saddmm, lambda input, mat1, mat2, beta=1, alpha=1, out=None: -1),
    (torch.scalar_tensor, lambda s, dtype=None, layour=None, device=None, pin_memory=None: -1),
    (torch.scatter, lambda input, dim, index, src: -1),
    (torch.scatter_add, lambda input, dim, index, src: -1),
    (torch.select, lambda input, dim, index: -1),
    (torch.selu, lambda input, inplace=False: -1),
    (torch.sigmoid, lambda input, out=None: -1),
    (torch.sign, lambda input, out=None: -1),
    (torch.sin, lambda input, out=None: -1),
    (torch.sinh, lambda input, out=None: -1),
    (torch.slogdet, lambda input: -1),
    (torch.smm, lambda input, mat2: -1),
    (torch.spmm, lambda input, mat2: -1),
    (torch.softmax, lambda input, dim, dtype=None: -1),
    (torch.solve, lambda input, A, out=None: -1),
    (torch.sort, lambda input, dim=-1, descending=False, out=None: -1),
    (torch.split, lambda tensor, split_size_or_sections, dim=0: -1),
    (torch.split_with_sizes, lambda tensor, split_size_or_sections, dim=0: -1),
    (torch.sqrt, lambda input, out=None: -1),
    (torch.square, lambda input, out=None: -1),
    (torch.squeeze, lambda input, dim=None, out=None: -1),
    (torch.sspaddmm, lambda input, mat1, mat2, beta=1, alpha=1, out=None: -1),
    (torch.stack, lambda tensors, dim=0, out=None: -1),
    (torch.std, lambda input: -1),
    (torch.std_mean, lambda input: -1),
    (torch.stft, lambda input, n_fft, hop_length=None, win_length=None, window=None, center=True, pad_mode='reflect',
     normalized=False, onesided=True: -1),
    (torch.sub, lambda input, other, out=None: -1),
    (torch.sum, lambda input: -1),
    (torch.svd, lambda input, some=True, compute_uv=True, out=None: -1),
    (torch.symeig, lambda input, eigenvectors=False, upper=True, out=None: -1),
    (torch.t, lambda input: -1),
    (torch.take, lambda input, index: -1),
    (torch.tan, lambda input, out=None: -1),
    (torch.tanh, lambda input, out=None: -1),
    (torch.tensordot, lambda a, b, dims=2: -1),
    (torch.threshold, lambda input, threshold, value, inplace=False: -1),
    (torch.topk, lambda input, k, dim=-1, descending=False, out=None: -1),
    (torch.trace, lambda input: -1),
    (torch.transpose, lambda input, dim0, dim1: -1),
    (torch.trapz, lambda y, x, dim=-1: -1),
    (torch.triangular_solve, lambda input, A, upper=True, transpose=False, unitriangular=False: -1),
    (torch.tril, lambda input, diagonal=0, out=None: -1),
    (torch.tril_indices, lambda row, col, offset=0, dtype=torch.long, device='cpu', layout=torch.strided: -1),
    (torch.triplet_margin_loss, lambda anchor, positive, negative, margin=1.0, p=2, eps=1e-06, swap=False, size_average=None,
     reduce=None, reduction='mean': -1),
    (torch.triu, lambda input, diagonal=0, out=None: -1),
    (torch.triu_indices, lambda row, col, offset=0, dtype=torch.long, device='cpu', layout=torch.strided: -1),
    (torch.trunc, lambda input, out=None: -1),
    (torch.unbind, lambda input, dim=0: -1),
    (torch.unique, lambda input, sorted=True, return_inverse=False, return_counts=False, dim=None: -1),
    (torch.unique_consecutive, lambda input, return_inverse=False, return_counts=False, dim=None: -1),
    (torch.unsqueeze, lambda input, dim, out=None: -1),
    (torch.var, lambda input: -1),
    (torch.var_mean, lambda input: -1),
    (torch.where, lambda condition, x, y: -1),
    (torch.zeros_like, lambda input, dtype=None, layout=None, device=None, requires_grad=False: -1),
)

# The torch API functions alone (the first element of every
# (function, override) pair in TENSOR_LIKE_TORCH_IMPLEMENTATIONS).
TENSOR_LIKE_OVERRIDES = tuple(func for func, _ in TENSOR_LIKE_TORCH_IMPLEMENTATIONS)

def generate_tensor_like_torch_implementations():
    """Check override coverage of the torch API, then register the overrides.

    The names listed for ``torch``, ``torch.functional`` and
    ``torch.nn.functional`` are scanned. Private names, ``unique_dim``,
    in-place operators (trailing underscore), names that are not lowercase
    and re-exported modules are skipped. Every remaining object must either
    be listed in IGNORED_TORCH_FUNCTIONS or have an entry in
    TENSOR_LIKE_TORCH_IMPLEMENTATIONS.

    After the scan succeeds, each ``(func, override)`` pair of
    TENSOR_LIKE_TORCH_IMPLEMENTATIONS is passed through
    ``implements_tensor_like(func)(override)``.

    Raises:
        AssertionError: if a function is listed in IGNORED_TORCH_FUNCTIONS
            but also has an explicit override, or if at least one scanned
            function is neither ignored nor overridden. The checks are
            raised explicitly (rather than via ``assert``) so they are not
            stripped when Python runs with ``-O``.
    """
    untested_funcs = []
    tested_namespaces = [
        (torch, torch.__all__ + dir(torch._C._VariableFunctions)),
        (torch.functional, torch.functional.__all__),
        (torch.nn.functional, dir(torch.nn.functional)),
    ]
    for namespace, ns_funcs in tested_namespaces:
        for func_name in ns_funcs:
            # ignore private functions or functions that are deleted in torch.__init__
            if func_name.startswith('_') or func_name == 'unique_dim':
                continue
            # ignore in-place operators
            if func_name.endswith('_'):
                continue
            # only consider objects with lowercase names
            if not func_name.islower():
                continue
            func = getattr(namespace, func_name)
            # ignore re-exported modules
            if isinstance(func, types.ModuleType):
                continue
            qualname = "{}.{}".format(namespace.__name__, func_name)
            # IGNORED_TORCH_FUNCTIONS are functions that are public but cannot be
            # overridden by __torch_function__
            if func in IGNORED_TORCH_FUNCTIONS:
                # An ignored function must not also carry an override entry.
                if func in TENSOR_LIKE_OVERRIDES:
                    msg = "{} is in IGNORED_TORCH_FUNCTIONS but still has an explicit override"
                    raise AssertionError(msg.format(qualname))
                continue
            if func not in TENSOR_LIKE_OVERRIDES:
                untested_funcs.append(qualname)
    if untested_funcs:
        msg = (
            "The following functions are not tested for __torch_function__ "
            "support, please either add an entry in "
            "TENSOR_LIKE_TORCH_IMPLEMENTATIONS for this function or if a "
            "__torch_function__ override does not make sense, add an entry to "
            "IGNORED_TORCH_FUNCTIONS.\n\n{}"
        )
        raise AssertionError(msg.format(pprint.pformat(untested_funcs)))
    for func, override in TENSOR_LIKE_TORCH_IMPLEMENTATIONS:
        # decorate the overrides with implements_tensor_like
        implements_tensor_like(func)(override)

# Executed at import time: checks that every scanned torch function is either
# ignored or has an override, then applies implements_tensor_like to each
# entry of TENSOR_LIKE_TORCH_IMPLEMENTATIONS.
generate_tensor_like_torch_implementations()

class TensorLike(object):
    """A stand-in type that overrides the full torch API.

    Used to explicitly test that the whole torch API can be overridden by a
    class that defines ``__torch_function__``.
    """
    def __torch_function__(self, func, args=(), kwargs=None):
        """Dispatch ``func`` through HANDLED_FUNCTIONS_TENSOR_LIKE.

        Returns NotImplemented when no override is registered for ``func``;
        otherwise returns whatever the registered override returns when
        called with ``*args`` and ``**kwargs``.
        """
        call_kwargs = {} if kwargs is None else kwargs

        # Only the table lookup is guarded, so a KeyError raised inside the
        # override itself still propagates to the caller.
        try:
            override = HANDLED_FUNCTIONS_TENSOR_LIKE[func]
        except KeyError:
            return NotImplemented
        # In this case __torch_function__ should override TensorLike objects
        return override(*args, **call_kwargs)

class TestTorchFunctionOverride(TestCase):
    def test_mean(self):
        """Test that a function with one argument can be overridden"""
        diag = DiagonalTensor(5, 2)
        sub = SubTensor([[1, 2], [1, 2]])
        sub_diag = SubDiagonalTensor(5, 2)
        # (operand, expected torch.mean result, expected bar result)
        expectations = (
            (diag, 12.5, -1),
            (sub, 0, sub),
            (sub_diag, 125, 0),
        )
        for operand, mean_result, bar_result in expectations:
            self.assertEqual(torch.mean(operand), mean_result)
            self.assertEqual(bar(operand), bar_result)

    def test_mm(self):
        """Test that a function with multiple arguments can be overridden"""
        diag = DiagonalTensor(5, 2)
        plain = torch.eye(5) * 2
        sub = SubTensor([[1, 2], [1, 2]])
        sub_diag = SubDiagonalTensor(5, 2)
        # (left operand, right operand, expected torch.mm result)
        cases = (
            # only DiagonalTensor so should always get DiagonalTensor result
            (diag, diag, 0),
            # tensor and DiagonalTensor, always return DiagonalTensor result
            (diag, plain, 0),
            (plain, diag, 0),
            # only SubTensor so should always get SubTensor result
            (sub, sub, -1),
            # tensor and SubTensor so should always get SubTensor result
            (sub, plain, -1),
            (plain, sub, -1),
            # DiagonalTensor and SubTensor are unrelated classes so the
            # result depends on which argument appears first
            (sub, diag, -1),
            (diag, sub, 0),
            # SubDiagonalTensor should take precedence over DiagonalTensor
            # but should behave otherwise the same as DiagonalTensor
            (sub_diag, sub_diag, 1),
            (sub_diag, diag, 1),
            (diag, sub_diag, 1),
            (sub_diag, plain, 1),
            (plain, sub_diag, 1),
            (sub, sub_diag, -1),
            (sub_diag, sub, 0),
        )
        for lhs, rhs, expected in cases:
            self.assertEqual(torch.mm(lhs, rhs), expected)

    def test_precedence_semantics(self):
        """Test semantics for __torch_function__ for functions that take
        multiple arguments

        When a function receives several arguments, the
        __torch_function__ implementation to call is chosen from the
        argument types. Precedence runs left-to-right through the
        argument list, except that subclasses are always consulted
        before their superclasses. The first implementation, in
        precedence order, that returns something other than
        NotImplemented supplies the result. If every implementation
        returns NotImplemented, a TypeError is raised.

        Each case is exercised both with a function implemented in C++
        and with foo or baz, the python functions defined above that are
        instrumented to follow the same dispatch rules as the functions
        in torch.functional.
        """
        # One C++-implemented function and one python function per group.
        div_like = (torch.div, foo)

        # DiagonalTensor has a valid override and SubDiagonalTensor has
        # an override that returns NotImplemented, so the DiagonalTensor
        # implementation is used and -1 comes back
        diag = DiagonalTensor(5, 2)
        sub_diag = SubDiagonalTensor(5, 2)
        for op in div_like:
            for lhs, rhs in ((diag, sub_diag), (sub_diag, diag)):
                self.assertEqual(op(lhs, rhs), -1)

        # SubTensor's implementation returns NotImplemented as well, so
        # it should behave exactly like SubDiagonalTensor did above
        sub = SubTensor([[1, 2], [1, 2]])
        for op in div_like:
            for lhs, rhs in ((diag, sub), (sub, diag)):
                self.assertEqual(op(lhs, rhs), -1)

        # div between SubTensor and SubDiagonalTensor should raise
        # TypeError since both have an implementation that explicitly
        # returns NotImplemented
        for op in div_like:
            for lhs, rhs in ((sub_diag, sub), (sub, sub_diag)):
                with self.assertRaises(TypeError):
                    op(lhs, rhs)

        # none of DiagonalTensor, SubDiagonalTensor, or SubTensor have a
        # mul or a baz implementation so every pairing should raise
        # TypeError
        operands = (diag, sub_diag, sub)
        for op in (torch.mul, baz):
            for lhs in operands:
                for rhs in operands:
                    with self.assertRaises(TypeError):
                        op(lhs, rhs)

    def test_user_implementation_raises(self):
        """Test that errors raised in user implementations propagate correctly"""
        first = DiagonalTensor(5, 2)
        second = DiagonalTensor(5, 2)
        self.assertRaises(ValueError, torch.add, first, second)
        self.assertRaises(ValueError, quux, first)

def generate_tensor_like_override_tests(cls):
    """Attach a dispatch test to ``cls`` for every TensorLike override.

    For each ``(func, override)`` pair in TENSOR_LIKE_TORCH_IMPLEMENTATIONS a
    test method is generated that calls ``func`` with TensorLike instances
    and asserts that the result equals -1.

    Test names start out as ``test_<func.__name__>``. Several entries share a
    ``__name__`` (for example ``torch.relu`` and
    ``torch.nn.functional.relu``), and ``setattr`` silently replaces an
    existing attribute, so a name that is already present on ``cls`` is
    never reused: the module-qualified form
    ``test_<module with dots as underscores>_<name>`` is tried next, and a
    numeric suffix is appended as a last resort. This keeps every generated
    test, and any test already defined on ``cls``, from being overwritten.

    Args:
        cls: the test case class that receives the generated methods.
    """
    def test_generator(func, override):
        # The override's signature decides how many arguments func is
        # called with.
        if torch._six.PY3:
            args = inspect.getfullargspec(override)
        else:
            args = inspect.getargspec(override)
        # Supply only the positional parameters that have no default.
        nargs = len(args.args)
        if args.defaults is not None:
            nargs -= len(args.defaults)
        func_args = [TensorLike() for _ in range(nargs)]
        # A *args override additionally gets two variadic arguments.
        if args.varargs is not None:
            func_args += [TensorLike(), TensorLike()]

        def test(self):
            self.assertEqual(func(*func_args), -1)

        return test

    def unique_test_name(func):
        # Return a test name for func that is not yet an attribute of cls.
        base = 'test_{}'.format(func.__name__)
        if not hasattr(cls, base):
            return base
        module = getattr(func, '__module__', None)
        if module:
            base = 'test_{}_{}'.format(module.replace('.', '_'), func.__name__)
            if not hasattr(cls, base):
                return base
        suffix = 2
        while hasattr(cls, '{}_{}'.format(base, suffix)):
            suffix += 1
        return '{}_{}'.format(base, suffix)

    for func, override in TENSOR_LIKE_TORCH_IMPLEMENTATIONS:
        test_method = test_generator(func, override)
        name = unique_test_name(func)
        test_method.__name__ = name
        setattr(cls, name, test_method)

# Attach the generated override tests to the test class at import time, so
# they are present on the class before unittest.main() below runs.
generate_tensor_like_override_tests(TestTorchFunctionOverride)

# Run the test suite when this file is executed as a script.
if __name__ == '__main__':
    unittest.main()