Implemented torch.cov (#58311)
Summary: Based on https://github.com/pytorch/pytorch/pull/50466. Adds the initial implementation of `torch.cov`, similar to `numpy.cov`. For simplicity, we removed support for several `numpy.cov` parameters that are either redundant, such as `bias`, or have simple workarounds, such as `y` and `rowvar`.

cc PandaBoi

closes https://github.com/pytorch/pytorch/issues/19037

Pull Request resolved: https://github.com/pytorch/pytorch/pull/58311

Reviewed By: jbschlosser

Differential Revision: D29431651

Pulled By: heitorschueroff

fbshipit-source-id: 167dea880f534934b145ba94291a9d634c25b01b
This commit is contained in:
parent 8f658d537d
commit ec9c03c234
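The "simple workarounds" for the dropped `numpy.cov` parameters mentioned in the summary are worth spelling out. A minimal sketch (mine, not from the PR), assuming tensors `x` and `y` with one variable per row:

    import torch

    x = torch.randn(2, 5)  # 2 variables, 5 observations
    y = torch.randn(3, 5)  # 3 more variables over the same observations

    # numpy.cov(x, y=y): stack the extra variables as additional rows
    torch.cov(torch.cat((x, y), dim=0))

    # numpy.cov(x2, rowvar=False): transpose so rows are variables again
    x2 = x.T  # observations in rows, variables in columns
    torch.cov(x2.T)

    # numpy.cov(x, bias=True): use correction=0 instead
    torch.cov(x, correction=0)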
aten/src/ATen/core/aten_interned_strings.h
@@ -260,6 +260,7 @@ _(aten, cosine_embedding_loss) \
 _(aten, cosine_similarity) \
 _(aten, count_nonzero) \
 _(aten, cross) \
+_(aten, cov) \
 _(aten, std_mean) \
 _(aten, var_mean) \
 _(aten, ctc_loss) \
aten/src/ATen/native/Correlation.cpp (new file, 109 lines)
@@ -0,0 +1,109 @@

#include <ATen/ATen.h>
#include <ATen/NativeFunctions.h>

namespace at {
namespace native {

Tensor cov(
    const Tensor& self,
    int64_t correction,
    const c10::optional<Tensor>& fweights,
    const c10::optional<Tensor>& aweights) {
  constexpr int64_t OBSERVATIONS_DIM = 1;

  TORCH_CHECK(
      self.ndimension() <= 2,
      "cov(): expected input to have two or fewer dimensions but got an input with ",
      self.ndimension(),
      " dimensions");

  TORCH_CHECK(
      self.scalar_type() != kBool, "cov(): bool dtype is not supported for input");

  // View input tensor as 2D (variables, observations)
  auto in = self.ndimension() < 2 ? self.view({1, -1}) : self;
  const auto num_observations = in.size(OBSERVATIONS_DIM);

  // The product of frequencies (fweights) and weights (aweights).
  Tensor w;

  if (fweights.has_value()) {
    w = fweights.value();
    TORCH_CHECK(
        w.ndimension() <= 1,
        "cov(): expected fweights to have one or fewer dimensions but got fweights with ",
        w.ndimension(),
        " dimensions");
    TORCH_CHECK(
        at::isIntegralType(w.scalar_type(), false),
        "cov(): expected fweights to have integral dtype but got fweights with ",
        w.scalar_type(),
        " dtype");
    TORCH_CHECK(
        w.numel() == num_observations,
        "cov(): expected fweights to have the same numel as there are observations in the input but got ",
        w.numel(),
        " != ",
        num_observations);
    TORCH_CHECK(
        num_observations == 0 || w.min().ge(0).item<bool>(),
        "cov(): fweights cannot be negative");
  }

  if (aweights.has_value()) {
    const auto& aw = aweights.value();
    TORCH_CHECK(
        aw.ndimension() <= 1,
        "cov(): expected aweights to have one or fewer dimensions but got aweights with ",
        aw.ndimension(),
        " dimensions");
    TORCH_CHECK(
        at::isFloatingType(aw.scalar_type()),
        "cov(): expected aweights to have floating point dtype but got aweights with ",
        aw.scalar_type(),
        " dtype");
    TORCH_CHECK(
        aw.numel() == num_observations,
        "cov(): expected aweights to have the same numel as there are observations in the input but got ",
        aw.numel(),
        " != ",
        num_observations);
    TORCH_CHECK(
        num_observations == 0 || aw.min().ge(0).item<bool>(),
        "cov(): aweights cannot be negative");
    w = w.defined() ? w * aw : aw;
  }

  // Compute a weighted average of the observations
  const auto w_sum = w.defined()
      ? w.sum()
      : at::scalar_tensor(num_observations, in.options().dtype(kLong));

  TORCH_CHECK(
      !w.defined() || w_sum.ne(0).item<bool>(),
      "cov(): weights sum to zero, can't be normalized");

  const auto avg = (w.defined() ? in * w : in).sum(OBSERVATIONS_DIM) / w_sum;

  // Compute the normalization factor
  Tensor norm_factor;

  if (w.defined() && aweights.has_value() && correction != 0) {
    norm_factor = w_sum - correction * (w * aweights.value()).sum() / w_sum;
  } else {
    norm_factor = w_sum - correction;
  }

  if (norm_factor.le(0).item<bool>()) {
    TORCH_WARN("cov(): degrees of freedom is <= 0");
    norm_factor.zero_();
  }

  // Compute covariance matrix
  in = in - avg.unsqueeze(1);
  const auto c = at::mm(in, (w.defined() ? in * w : in).t().conj());
  return at::true_divide(c, norm_factor).squeeze();
}

} // namespace native
} // namespace at
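To make the kernel's flow easier to follow, here is a Python sketch of the same algorithm (my paraphrase, not part of the commit), assuming a 2D float tensor `x` of shape (variables, observations), an optional integral 1D tensor `fw`, and an optional floating 1D tensor `aw`:

    import torch

    def cov_sketch(x, correction=1, fw=None, aw=None):
        # w is the product of frequencies and weights, when given
        w = fw
        if aw is not None:
            w = w * aw if w is not None else aw
        n = x.shape[1]
        w_sum = w.sum() if w is not None else torch.tensor(n)
        # weighted mean of the observations, per variable
        avg = (x * w if w is not None else x).sum(dim=1) / w_sum
        # normalization factor; the kernel zeroes it and warns when dof <= 0
        if w is not None and aw is not None and correction != 0:
            norm = w_sum - correction * (w * aw).sum() / w_sum
        else:
            norm = w_sum - correction
        norm = norm.clamp(min=0)
        # center the observations and form the (variables x variables) matrix
        xc = x - avg.unsqueeze(1)
        c = xc @ (xc * w if w is not None else xc).t().conj()
        return (c / norm).squeeze()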
aten/src/ATen/native/native_functions.yaml
@@ -1277,6 +1277,9 @@
   dispatch:
     CompositeExplicitAutograd: count_nonzero
 
+- func: cov(Tensor self, *, int correction=1, Tensor? fweights=None, Tensor? aweights=None) -> Tensor
+  variants: function, method
+
 - func: cudnn_affine_grid_generator(Tensor theta, int N, int C, int H, int W) -> Tensor grid
   dispatch:
     CUDA: cudnn_affine_grid_generator_forward
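The `*` in the schema makes all three parameters keyword-only, and `variants: function, method` generates both spellings. Calls the schema permits (illustration only):

    import torch

    x = torch.randn(3, 4)
    torch.cov(x, correction=0)  # function variant
    x.cov(correction=0)         # method variant
    # torch.cov(x, 0)           # TypeError: correction must be passed by keyword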
docs/source/tensors.rst
@@ -290,6 +290,7 @@ Tensor class reference
     Tensor.cosh
     Tensor.cosh_
     Tensor.count_nonzero
+    Tensor.cov
     Tensor.acosh
     Tensor.acosh_
     Tensor.arccosh
docs/source/torch.rst
@@ -481,6 +481,7 @@ Other Operations
     cdist
     clone
     combinations
+    cov
     cross
     cummax
     cummin
test/test_torch.py
@@ -4372,6 +4372,53 @@ else:
                 x = torch.empty(50000000, device=device, dtype=dtype).exponential_()
                 self.assertTrue(x.min() > 0)
 
+    @dtypes(torch.float, torch.cfloat)
+    def test_cov(self, device, dtype):
+        def check(t, correction=1, fweights=None, aweights=None):
+            actual = torch.cov(t, correction=correction, fweights=fweights, aweights=aweights)
+            t = t.cpu().numpy()
+            fweights = fweights.cpu().numpy() if fweights is not None else None
+            aweights = aweights.cpu().numpy() if aweights is not None else None
+            expected = np.cov(t, ddof=correction, fweights=fweights, aweights=aweights)
+            expected = torch.from_numpy(np.array(expected)).to(dtype=actual.dtype)
+            self.assertEqual(actual, expected, atol=1e-05, rtol=1e-05)
+
+        def generate_input_tensors():
+            yield make_tensor((0, 0), device, dtype)
+            yield make_tensor((1, 0), device, dtype)
+            yield make_tensor((0, 1), device, dtype)
+            yield make_tensor((2,), device, dtype)
+            yield make_tensor((2, 1), device, dtype)
+            yield make_tensor((2, 2), device, dtype)
+            yield make_tensor((2, 3), device, dtype)
+            yield make_tensor((5, 10), device, dtype)
+            yield make_tensor((5, 10), device, dtype, noncontiguous=True)
+            yield torch.tensor([0, -2, nan, 10.2, inf], dtype=dtype, device=device)
+
+        for t in generate_input_tensors():
+            check(t)
+            num_observations = t.numel() if t.ndim < 2 else t.size(1)
+            if num_observations > 0:
+                fweights = torch.randint(1, 10, (num_observations,), device=device)
+                aweights = make_tensor((num_observations,), device, torch.float, low=1)
+                for correction, fw, aw in product([0, 1, 2], [None, fweights], [None, aweights]):
+                    # pass the product's fw/aw so the None cases are actually exercised
+                    check(t, correction, fw, aw)
+
+    def test_cov_error(self, device):
+        def check(msg, *args, **kwargs):
+            with self.assertRaisesRegex(RuntimeError, r'cov\(\):.*' + msg + r'.*'):
+                torch.cov(*args, **kwargs)
+
+        a = torch.rand(2)
+        check(r'expected input to have two or fewer dimensions', torch.rand(2, 2, 2))
+        check(r'expected fweights to have one or fewer dimensions', a, fweights=torch.rand(2, 2))
+        check(r'expected aweights to have one or fewer dimensions', a, aweights=torch.rand(2, 2))
+        check(r'expected fweights to have integral dtype', a, fweights=torch.rand(2))
+        check(r'expected aweights to have floating point dtype', a, aweights=torch.tensor([1, 1]))
+        check(r'expected fweights to have the same numel', a, fweights=torch.tensor([1]))
+        check(r'expected aweights to have the same numel', a, aweights=torch.rand(1))
+        check(r'fweights cannot be negative', a, fweights=torch.tensor([-1, -2]))
+        check(r'aweights cannot be negative', a, aweights=torch.tensor([-1., -2.]))
+
     @skipIfNoSciPy
     @dtypes(*torch.testing.get_all_fp_dtypes())
tools/build_variables.bzl
@@ -974,6 +974,7 @@ aten_native_source_non_codegen_list = [
     "aten/src/ATen/native/ConvolutionMM3d.cpp",
     "aten/src/ATen/native/ConvolutionTBC.cpp",
     "aten/src/ATen/native/Copy.cpp",
+    "aten/src/ATen/native/Correlation.cpp",
     "aten/src/ATen/native/CPUFallback.cpp",
     "aten/src/ATen/native/Cross.cpp",
     "aten/src/ATen/native/DilatedMaxPool2d.cpp",
torch/_tensor_docs.py
@@ -1004,6 +1004,12 @@ count_nonzero(dim=None) -> Tensor
 See :func:`torch.count_nonzero`
 """)
 
+add_docstr_all('cov', r"""
+cov(*, correction=1, fweights=None, aweights=None) -> Tensor
+
+See :func:`torch.cov`
+""")
+
 add_docstr_all('cross',
                r"""
 cross(other, dim=-1) -> Tensor
torch/_torch_docs.py
@@ -1688,6 +1688,75 @@ Example::
     False
 """)
 
+add_docstr(torch.cov, r"""
+cov(input, *, correction=1, fweights=None, aweights=None) -> Tensor
+
+Estimates the covariance matrix of the variables given by the :attr:`input` matrix,
+where rows are the variables and columns are the observations.
+
+A covariance matrix is a square matrix giving the covariance of each pair of variables.
+The diagonal contains the variance of each variable (covariance of a variable with
+itself). By definition, if :attr:`input` represents a single variable (Scalar or 1D)
+then its variance is returned.
+
+The unbiased sample covariance of the variables :math:`x` and :math:`y` is given by:
+
+.. math::
+    \text{cov}(x,y) = \frac{\sum^{N}_{i = 1}(x_{i} - \bar{x})(y_{i} - \bar{y})}{N~-~1}
+
+where :math:`\bar{x}` and :math:`\bar{y}` are the simple means of :math:`x` and :math:`y` respectively.
+
+If :attr:`fweights` and/or :attr:`aweights` are provided, the unbiased weighted covariance
+is calculated, which is given by:
+
+.. math::
+    \text{cov}_w(x,y) = \frac{\sum^{N}_{i = 1}w_i(x_{i} - \mu_x^*)(y_{i} - \mu_y^*)}{\sum^{N}_{i = 1}w_i~-~1}
+
+where :math:`w` denotes :attr:`fweights` or :attr:`aweights` based on whichever is provided, or
+:math:`w = \text{fweights} \times \text{aweights}` if both are provided, and
+:math:`\mu_x^* = \frac{\sum^{N}_{i = 1}w_ix_{i}}{\sum^{N}_{i = 1}w_i}` is the weighted mean of the variable.
+
+Args:
+    input (Tensor): A 2D matrix containing multiple variables and observations, or a
+        Scalar or 1D vector representing a single variable.
+
+Keyword Args:
+    correction (int, optional): difference between the sample size and sample degrees of freedom.
+        Defaults to Bessel's correction, ``correction = 1``, which returns the unbiased estimate,
+        even if both :attr:`fweights` and :attr:`aweights` are specified. ``correction = 0``
+        will return the simple average.
+    fweights (Tensor, optional): A Scalar or 1D tensor of observation vector frequencies
+        representing the number of times each observation should be repeated. Its numel must
+        equal the number of columns of :attr:`input`. Must have integral dtype. Ignored if
+        ``None``. Defaults to ``None``.
+    aweights (Tensor, optional): A Scalar or 1D tensor of observation vector weights.
+        These relative weights are typically large for observations considered "important" and
+        smaller for observations considered less "important". Its numel must equal the number
+        of columns of :attr:`input`. Must have floating point dtype. Ignored if ``None``.
+        Defaults to ``None``.
+
+Returns:
+    (Tensor) The covariance matrix of the variables.
+
+Example::
+
+    >>> x = torch.tensor([[0, 2], [1, 1], [2, 0]]).T
+    >>> x
+    tensor([[0, 1, 2],
+            [2, 1, 0]])
+    >>> torch.cov(x)
+    tensor([[ 1., -1.],
+            [-1.,  1.]])
+    >>> torch.cov(x, correction=0)
+    tensor([[ 0.6667, -0.6667],
+            [-0.6667,  0.6667]])
+    >>> fw = torch.randint(1, 10, (3,))
+    >>> fw
+    tensor([1, 6, 9])
+    >>> aw = torch.rand(3)
+    >>> aw
+    tensor([0.4282, 0.0255, 0.4144])
+    >>> torch.cov(x, fweights=fw, aweights=aw)
+    tensor([[ 0.4169, -0.4169],
+            [-0.4169,  0.4169]])
+""")
+
 add_docstr(torch.cat,
            r"""
 cat(tensors, dim=0, *, out=None) -> Tensor
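Since `correction` maps onto NumPy's `ddof`, the docstring's formulas can be sanity-checked against `numpy.cov` directly, which is what the new test does. A standalone version of that check (illustrative, not from the commit):

    import numpy as np
    import torch

    x = torch.tensor([[0., 1., 2.], [2., 1., 0.]])
    fw = torch.tensor([1, 6, 9])
    aw = torch.tensor([0.4282, 0.0255, 0.4144])

    t = torch.cov(x, correction=1, fweights=fw, aweights=aw)
    n = np.cov(x.numpy(), ddof=1, fweights=fw.numpy(), aweights=aw.numpy())
    assert torch.allclose(t, torch.from_numpy(n).float(), atol=1e-5)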
torch/overrides.py
@@ -374,6 +374,7 @@ def get_testing_overrides() -> Dict[Callable, Callable]:
        torch.clamp_min: lambda input, min, out=None: -1,
        torch.clamp_max: lambda input, max, out=None: -1,
        torch.column_stack: lambda tensors, out=None: -1,
+       torch.cov: lambda input, correction=1, fweights=None, aweights=None: -1,
        torch.clone: lambda input: -1,
        torch.combinations: lambda input, r=2, with_replacement=False: -1,
        torch.complex: lambda real, imag: -1,
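The lambda above only records `torch.cov`'s signature so the override machinery can test it; with the entry in place, any `__torch_function__` implementer can intercept the new op. A hypothetical subclass (not from the commit) to illustrate:

    import torch

    class LoggingTensor(torch.Tensor):
        @classmethod
        def __torch_function__(cls, func, types, args=(), kwargs=None):
            if func is torch.cov:
                print("torch.cov intercepted")
            return super().__torch_function__(func, types, args, kwargs or {})

    x = torch.randn(2, 5).as_subclass(LoggingTensor)
    torch.cov(x)  # prints the message, then computes as usual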
torch/testing/_internal/common_methods_invocations.py
@@ -3037,6 +3037,22 @@ def sample_inputs_std_var(op_info, device, dtype, requires_grad, **kwargs):
     ]
 
 
+def sample_inputs_cov(op_info, device, dtype, requires_grad, **kwargs):
+    shapes = [(2,), (1, 2), (3, 2), (2, 3)]
+
+    inputs = []
+    for shape in shapes:
+        t = make_tensor(shape, device, dtype, requires_grad=requires_grad)
+        inputs.append(SampleInput(t))
+        num_observations = t.numel() if t.ndimension() < 2 else t.size(1)
+        fweights = make_tensor((num_observations,), device, torch.int, low=0, high=10, requires_grad=requires_grad)
+        aweights = make_tensor((num_observations,), device, torch.float, low=0, high=1, requires_grad=requires_grad)
+        for correction, fw, aw in product(range(num_observations), [None, fweights], [None, aweights]):
+            inputs.append(SampleInput(t, kwargs={'correction': correction, 'fweights': fw, 'aweights': aw}))
+
+    return inputs
+
+
 def _sample_inputs_svd(op_info, device, dtype, requires_grad=False, is_linalg_svd=False):
     """
     This function generates input for torch.svd with distinct singular values so that autograd is always stable.

@@ -5285,6 +5301,14 @@ op_db: List[OpInfo] = [
                  SkipInfo('TestUnaryUfuncs', 'test_reference_numerics_hard', device_type='cpu',
                           dtypes=[torch.cfloat, torch.cdouble], active_if=IS_MACOS),
              )),
+    OpInfo('cov',
+           dtypes=all_types_and_complex_and(torch.half, torch.bfloat16),
+           dtypesIfCUDA=all_types_and_complex_and(torch.half, *[torch.bfloat16] if CUDA11OrLater else []),
+           backward_dtypesIfCUDA=all_types_and_complex_and(torch.half, *[torch.bfloat16] if CUDA11OrLater else []),
+           sample_inputs_func=sample_inputs_cov,
+           supports_out=False,
+           # JIT test not working for tensor kwargs (https://github.com/pytorch/pytorch/issues/58507)
+           skips=(SkipInfo('TestJit', 'test_variant_consistency_jit'),)),
     OpInfo('cross',
            dtypes=all_types_and_complex(),
            dtypesIfCUDA=all_types_and_complex_and(torch.half),