This is a new version of #15648 based on the latest master branch. Unlike the previous PR, where I fixed a lot of the doctests in addition to integrating xdoctest, I'm going to reduce the scope here: I'm simply going to integrate xdoctest and mark all of the failing tests as "SKIP". This will let xdoctest run on the dashboards, provide some value, and still let the dashboards pass. I'll leave fixing the doctests themselves to another PR.

In my initial commit, I do the bare minimum to get something running with failing dashboards. The few tests that I marked as skip were causing segfaults. Running xdoctest results in 293 failed and 201 passed tests. The next commits will disable those failing tests. (Unfortunately, I don't have a tool that will insert the `# xdoctest: +SKIP` directive over every failing test, so I'm going to do this mostly manually.)

Fixes https://github.com/pytorch/pytorch/issues/71105

@ezyang

Pull Request resolved: https://github.com/pytorch/pytorch/pull/82797
Approved by: https://github.com/ezyang
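For reference, xdoctest reads its directives from comments embedded in the doctest itself. A minimal sketch of what marking a failing example looks like (`frobnicate` is a hypothetical name used for illustration, not code from this PR):

    def frobnicate(x):
        """
        Example::

            >>> # xdoctest: +SKIP
            >>> frobnicate(torch.ones(3))
            tensor([2., 2., 2.])
        """
        return x + 1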
138 lines
5.6 KiB
Python
import torch
from torch.distributions import constraints
from torch.distributions.distribution import Distribution
from torch.distributions.utils import broadcast_all, probs_to_logits, lazy_property, logits_to_probs

__all__ = ['Binomial']


def _clamp_by_zero(x):
    # works like clamp(x, min=0) but the gradient at 0 is 0.5
    return (x.clamp(min=0) + x - x.clamp(max=0)) / 2
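

# Sanity-check sketch for the gradient claim above (an editorial aside, not
# upstream code; it assumes PyTorch's convention that clamp passes gradient
# through at the boundary):
#
#     x = torch.zeros((), requires_grad=True)
#     _clamp_by_zero(x).backward()
#     assert x.grad.item() == 0.5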


class Binomial(Distribution):
    r"""
    Creates a Binomial distribution parameterized by :attr:`total_count` and
    either :attr:`probs` or :attr:`logits` (but not both). :attr:`total_count` must be
    broadcastable with :attr:`probs`/:attr:`logits`.

    Example::

        >>> # xdoctest: +IGNORE_WANT("non-deterministic")
        >>> m = Binomial(100, torch.tensor([0., .2, .8, 1.]))
        >>> m.sample()
        tensor([  0.,  22.,  71., 100.])

        >>> m = Binomial(torch.tensor([[5.], [10.]]), torch.tensor([0.5, 0.8]))
        >>> m.sample()
        tensor([[ 4.,  5.],
                [ 7.,  6.]])

    Args:
        total_count (int or Tensor): number of Bernoulli trials
        probs (Tensor): Event probabilities
        logits (Tensor): Event log-odds
    """
    arg_constraints = {'total_count': constraints.nonnegative_integer,
                       'probs': constraints.unit_interval,
                       'logits': constraints.real}
    has_enumerate_support = True

    def __init__(self, total_count=1, probs=None, logits=None, validate_args=None):
        if (probs is None) == (logits is None):
            raise ValueError("Either `probs` or `logits` must be specified, but not both.")
        if probs is not None:
            self.total_count, self.probs = broadcast_all(total_count, probs)
            self.total_count = self.total_count.type_as(self.probs)
        else:
            self.total_count, self.logits = broadcast_all(total_count, logits)
            self.total_count = self.total_count.type_as(self.logits)

        self._param = self.probs if probs is not None else self.logits
        batch_shape = self._param.size()
        super(Binomial, self).__init__(batch_shape, validate_args=validate_args)

    def expand(self, batch_shape, _instance=None):
        new = self._get_checked_instance(Binomial, _instance)
        batch_shape = torch.Size(batch_shape)
        new.total_count = self.total_count.expand(batch_shape)
        if 'probs' in self.__dict__:
            new.probs = self.probs.expand(batch_shape)
            new._param = new.probs
        if 'logits' in self.__dict__:
            new.logits = self.logits.expand(batch_shape)
            new._param = new.logits
        super(Binomial, new).__init__(batch_shape, validate_args=False)
        new._validate_args = self._validate_args
        return new

    def _new(self, *args, **kwargs):
        return self._param.new(*args, **kwargs)

    @constraints.dependent_property(is_discrete=True, event_dim=0)
    def support(self):
        return constraints.integer_interval(0, self.total_count)

    @property
    def mean(self):
        return self.total_count * self.probs

    @property
    def mode(self):
        return ((self.total_count + 1) * self.probs).floor().clamp(max=self.total_count)

    @property
    def variance(self):
        return self.total_count * self.probs * (1 - self.probs)

    @lazy_property
    def logits(self):
        return probs_to_logits(self.probs, is_binary=True)

    @lazy_property
    def probs(self):
        return logits_to_probs(self.logits, is_binary=True)

    @property
    def param_shape(self):
        return self._param.size()
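
    # Editorial sketch (not upstream code): the lazy properties above convert
    # between the two parameterizations on demand, so a logits-parameterized
    # instance materializes `probs` via the sigmoid, e.g.:
    #
    #     m = Binomial(10, logits=torch.tensor(0.))
    #     m.probs   # tensor(0.5000)
    #     m.mean    # tensor(5.)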

    def sample(self, sample_shape=torch.Size()):
        shape = self._extended_shape(sample_shape)
        with torch.no_grad():
            return torch.binomial(self.total_count.expand(shape), self.probs.expand(shape))

    def log_prob(self, value):
        if self._validate_args:
            self._validate_sample(value)
        log_factorial_n = torch.lgamma(self.total_count + 1)
        log_factorial_k = torch.lgamma(value + 1)
        log_factorial_nmk = torch.lgamma(self.total_count - value + 1)
        # k * log(p) + (n - k) * log(1 - p) = k * (log(p) - log(1 - p)) + n * log(1 - p)
        #     (case logit < 0)              = k * logit - n * log1p(e^logit)
        #     (case logit > 0)              = k * logit - n * (log(p) - log(1 - p)) + n * log(p)
        #                                   = k * logit - n * logit - n * log1p(e^-logit)
        #     (merge two cases)             = k * logit - n * max(logit, 0) - n * log1p(e^-|logit|)
        normalize_term = (self.total_count * _clamp_by_zero(self.logits)
                          + self.total_count * torch.log1p(torch.exp(-torch.abs(self.logits)))
                          - log_factorial_n)
        return value * self.logits - log_factorial_k - log_factorial_nmk - normalize_term
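
    # Editorial sketch (not upstream code): away from extreme logits, the
    # stable normalizer used above, n * max(logit, 0) + n * log1p(e^-|logit|),
    # equals the naive n * log1p(e^logit):
    #
    #     logits = torch.tensor([-3., 0., 3.])
    #     n = torch.tensor(10.)
    #     stable = n * _clamp_by_zero(logits) + n * torch.log1p(torch.exp(-logits.abs()))
    #     naive = n * torch.log1p(torch.exp(logits))
    #     assert torch.allclose(stable, naive)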

    def entropy(self):
        total_count = int(self.total_count.max())
        if not self.total_count.min() == total_count:
            raise NotImplementedError("Inhomogeneous total count not supported by `entropy`.")

        log_prob = self.log_prob(self.enumerate_support(False))
        return -(torch.exp(log_prob) * log_prob).sum(0)

    def enumerate_support(self, expand=True):
        total_count = int(self.total_count.max())
        if not self.total_count.min() == total_count:
            raise NotImplementedError("Inhomogeneous total count not supported by `enumerate_support`.")
        values = torch.arange(1 + total_count, dtype=self._param.dtype, device=self._param.device)
        values = values.view((-1,) + (1,) * len(self._batch_shape))
        if expand:
            values = values.expand((-1,) + self._batch_shape)
        return values
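
# A minimal end-to-end usage sketch (an editorial aside, not part of the
# upstream module): probabilities over the enumerated support sum to one,
# and entropy matches the brute-force computation:
#
#     m = Binomial(10, torch.tensor([0.3, 0.7]))
#     support = m.enumerate_support()           # shape (11, 2): counts 0..10
#     pmf = m.log_prob(support).exp()
#     assert torch.allclose(pmf.sum(0), torch.ones(2))
#     assert torch.allclose(m.entropy(), -(pmf * pmf.log()).sum(0))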