Probability Theory¶
Basic Concepts¶
Intuitive meaning of probability: the long-run frequency of an outcome over a large number of trials; mathematically,
$P(A) = \lim_{n \rightarrow \infty} \frac{n_A}{n}$
where $n_A$ is the number of times event $A$ occurs in $n$ trials.
Sample Space ($\Omega$): The set of all possible outcomes of a random process.
Event ($A$): A subset of the sample space: $A \subset \Omega$.
$2^\Omega$ is the powerset of $\Omega$. Let $\sigma(\Omega) \subset 2^\Omega$ be the set of all possible events. Then $\sigma(\Omega)$ is called the event space. Technically speaking, it is a $\sigma$-algebra. It is a collection of subsets of $\Omega$ that is closed under countable unions, countable intersections, and complements. That is, if $A_1, A_2, \dots \in \sigma(\Omega)$, then:
- $\bigcup_{i=1}^{\infty} A_i \in \sigma(\Omega)$
- $\bigcap_{i=1}^{\infty} A_i \in \sigma(\Omega)$
- $A_i^c \in \sigma(\Omega)$ for each $i$
For many discrete sample spaces such as the outcome of the roll of a pair of dice, it is possible to assume that $2^\Omega=\sigma(\Omega)$. However, for continuous sample spaces we need to define a $\sigma$-algebra that is smaller than $2^\Omega$.
A probability measure is a function $P: \sigma(\Omega) \rightarrow [0,1]$ such that:
- $P(\Omega) = 1$
- $P(A) \geq 0$ for all $A \in \sigma(\Omega)$
- If $A_1, A_2, \dots$ are disjoint events (i.e. $A_i \cap A_j = \emptyset$ for all $i \neq j$), then $P(\bigcup_{i=1}^{\infty} A_i) = \sum_{i=1}^{\infty} P(A_i)$
Probability Space: A tuple defined as $(\Omega, \sigma(\Omega), P)$.
Inclusion-Exclusion Principle: $P(A \cup B) = P(A) + P(B) - P(A \cap B)$. This takes into account the fact that $P(A \cap B)$ is counted twice in $P(A) + P(B)$. A direct consequence of this is that $P(A \cup B) \leq P(A) + P(B)$ which is called the union bound.
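As a concrete illustration, here is a minimal sketch of a finite probability space in code: a fair die, with the probability measure implemented as a sum over elementary outcomes. The helper name prob is ours, chosen for illustration.
from fractions import Fraction

omega = {1, 2, 3, 4, 5, 6}                    # sample space of a fair die
P_elem = {w: Fraction(1, 6) for w in omega}   # probability of each elementary outcome

def prob(event):
    # probability measure: sum of elementary probabilities over the event
    return sum(P_elem[w] for w in event)

A = {2, 4, 6}   # "even"
B = {1, 2, 3}   # "at most 3"
print(prob(A | B))                            # 5/6
print(prob(A) + prob(B) - prob(A & B))        # inclusion-exclusion also gives 5/6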
Conditional Probability: $P(A|B) = \frac{P(A \cap B)}{P(B)}$. The intuitive meaning of this is the probability of event $A$ given that event $B$ has occurred. That is, the frequency of event $A$ in the subset of trials where event $B$ has occurred. In mathematical terms
$P(A|B) = \lim_{n \rightarrow \infty} \frac{n_{A \cap B}}{n_B}$
where $n_{A \cap B}$ is the number of times event $A$ occurs in $n$ trials where event $B$ has occurred, and $n_B$ is the number of times event $B$ has occurred in $n$ trials.
The definition of conditional probability can be rewritten as $P(A \cap B) = P(A|B)P(B)$. This is called the product rule.
Independence: If the probability of event $A$ is not affected by the occurrence of event $B$, these two events are said to be independent. In terms of conditional probabilities we can describe this situation as $P(A|B) = P(A)$. Applied to the definition of conditional probability, this means that $A$ and $B$ are independent if and only if $P(A \cap B) = P(A)P(B)$.
Law of Total Probability: If $B_1, B_2, \dots, B_n$ is a partition of $\Omega$, i.e. $B_i \cap B_j = \emptyset$ for all $i \neq j$ and $\bigcup_{i=1}^n B_i = \Omega$, then $P(A) = \sum_{i=1}^n P(A|B_i)P(B_i)$.
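As a quick sanity check, the definition of conditional probability and the law of total probability can be verified on the die space sketched above (illustrative code again; cond is a hypothetical helper and prob is reused from the previous sketch):
def cond(A, B):
    # conditional probability P(A|B) = P(A & B) / P(B)
    return prob(A & B) / prob(B)

A = {2, 4, 6}                    # even outcome
B1, B2 = {1, 2, 3}, {4, 5, 6}    # a partition of the sample space
# law of total probability: P(A) = P(A|B1)P(B1) + P(A|B2)P(B2)
print(prob(A) == cond(A, B1) * prob(B1) + cond(A, B2) * prob(B2))  # True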
Bayes' Rule: $P(A|B) = \frac{P(B|A)P(A)}{P(B)}$. This can be derived from the definition of conditional probability as follows:
$P(A \cap B) = P(A|B)P(B) = P(B|A)P(A) \Rightarrow P(A|B) = \frac{P(B|A)P(A)}{P(B)}$.
While looking trivial at first glance, Bayes' rule has big implications for statistical inference, as well as machine learning. For instance, assume $H_1, H_2, \dots, H_n$ are mutually exclusive hypotheses that partition a hypothesis space $\mathcal{H}$, i.e. $H_i \cap H_j = \emptyset$ for all $i \neq j$ and $\bigcup_{i=1}^n H_i = \mathcal{H}$. Also assume that $D$ is the observed data. Then, Bayes' rule can be written as:
$P(H_i|D) = \frac{P(D|H_i)P(H_i)}{P(D)} = \frac{P(D|H_i)P(H_i)}{\sum_{j=1}^n P(D|H_j)P(H_j)}$.
Here,
- $P(H_i)$ is our prior belief in a hypothesis $H_i$,
- $P(H_i|D)$ is our posterior belief in $H_i$ after observing the data $D$,
- $P(D|H_i)$ is the likelihood of $H_i$, and $P(D)$ is the evidence.
The above concepts give a general framework for statistical inference: we start with a prior belief, collect new observations, and update our belief based on them. This approach has connections to how humans make decisions under uncertainty.
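For a small numeric illustration of this updating process (an example of our own, not from the text above), consider two hypotheses about a coin, a fair one and one biased towards heads, updated after observing three heads in a row:
# Hypotheses: the coin is fair (p = 0.5) or biased towards heads (p = 0.8)
priors = {"fair": 0.5, "biased": 0.5}
# Likelihood of the data D = "three heads in three tosses" under each hypothesis
likelihood = {"fair": 0.5 ** 3, "biased": 0.8 ** 3}
evidence = sum(likelihood[h] * priors[h] for h in priors)  # P(D)
posterior = {h: likelihood[h] * priors[h] / evidence for h in priors}
print(posterior)  # {'fair': ~0.196, 'biased': ~0.804}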
Random Variables¶
The probability measure we defined above maps sets to numbers. However, it is not always convenient to work with sets directly. We can make this easier by defining a random variable.
A random variable is a function $X: \Omega \rightarrow \Lambda$ that maps each elementary event $\omega \in \Omega$ to an element $\lambda$ of its range $\Lambda$. We can define a probability measure on $\Lambda$ as follows:
$P_X(A) := P(\{\omega \in \Omega: X(\omega) \in A\})$
where $A \subset \Lambda$. This is called the induced probability measure of $X$. In the simple case where $\Lambda = \{0,1,\ldots,C-1\}$, we have a discrete random variable. In this case, we can define a probability measure as follows:
$P_X(x) := P(\{\omega \in \Omega: X(\omega) = x\})$
where $x \in \{0,1,\ldots,C-1\}$. This is called the probability mass function of $X$.
Consider the experiment of tossing a fair coin three times and denote heads by $H$ and tails by $T$. The sample space for this experiment is $\Omega = \{HHH, HHT, HTH, HTT, THH, THT, TTH, TTT\}$. Because the coin is fair
$P(H) = P(T) = \frac{1}{2}$.
Because the coin tosses are independent events, we have
$P(HHH) = P(H)P(H)P(H) = \frac{1}{2} \cdot \frac{1}{2} \cdot \frac{1}{2} = \frac{1}{8}$
and likewise for all other outcomes. Let $X$ be the number of heads in a sequence. Then $X$ is a random variable with range $\Lambda = \{0,1,2,3\}$. The induced probability measure of $X$ is:
- $P_X(0) = P(\{TTT\}) = \frac{1}{8}$
- $P_X(1) = P(\{TTH, THT, HTT\}) = \frac{3}{8}$
- $P_X(2) = P(\{HTH, HHT, THH\}) = \frac{3}{8}$
- $P_X(3) = P(\{HHH\}) = \frac{1}{8}$
The notion of a random variable also allows us to query compound events easily, such as $P_X(X \geq 2) = P(\{HTH, HHT, THH, HHH\}) = \frac{1}{2}$.
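This whole example is small enough to verify by brute-force enumeration; the following sketch recomputes the probability mass function of $X$ and the compound event above:
from itertools import product
from fractions import Fraction
from collections import Counter

outcomes = list(product("HT", repeat=3))                   # the 8 equally likely sequences
counts = Counter("".join(w).count("H") for w in outcomes)  # X = number of heads
for x in sorted(counts):
    print(x, Fraction(counts[x], len(outcomes)))           # 1/8, 3/8, 3/8, 1/8
print(Fraction(sum(c for x, c in counts.items() if x >= 2),
               len(outcomes)))                             # P(X >= 2) = 1/2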
Let us give another example by defining two random variables from the outcome of the roll of a fair die:
- $X$ is the outcome of the die itself i.e. $\Lambda = \{1,2,3,4,5,6\}$.
- $Y$ is whether the outcome of the die is even or odd, i.e. $\Lambda = \{even, odd\}$.
Consider the case of the joint event $P(X \leq 4 \cap Y = even) = P(\{2,4\}) = \frac{2}{6}$. Compare it to the individual events $P(X \leq 4) = P(\{1,2,3,4\}) = \frac{4}{6}$ and $P(Y = even) = P(\{2,4,6\}) = \frac{3}{6}$. We see that $P(X \leq 4 \cap Y = even) = P(X \leq 4)P(Y = even)$. Hence, the events are independent. In words, if someone sees the outcome of the experiment and gives you the hint that the outcome is less than or equal to 4, this does not help you make a more accurate guess about whether it is even or odd. This is because there is an equal number of even and odd numbers less than or equal to 4.
Now consider the joint event $P(X \leq 3 \cap Y = even) = P(\{2\}) = \frac{1}{6}$. Compare it to the individual events $P(X \leq 3) = P(\{1,2,3\}) = \frac{3}{6}$ and $P(Y = even) = P(\{2,4,6\}) = \frac{3}{6}$. We see that $P(X \leq 3 \cap Y = even) \neq P(X \leq 3)P(Y = even)$. Hence, the events are dependent. Likewise in words, if someone sees the outcome of the experiment and gives you the hint that the outcome is less than or equal to 3, this helps you make a more accurate guess about whether it is even or odd. This is because there are more odd numbers less than or equal to 3 than even numbers.
Probabilities of joint events as exemplified above, $P(X = x \cap Y = y)$, collectively define the joint probability mass function. They are also denoted as $P(X=x, Y=y)$.
There are cases where some of the variables of a joint distribution are uninteresting. They are then called nuisance variables. One then drops them from the joint distribution using the law of total probability. This operation is called marginalization. In the above example, one would marginalize $Y$ out of the joint distribution to obtain the marginal distribution of $X$ as follows:
\begin{align*} P(X=x) &= \sum_{y \in \{even,odd\}} P(X=x, Y=y) \\ &= \sum_{y \in \{even,odd\}} P(X=x|Y=y)P(Y=y) \\ &= P(X=x | Y=even)P(Y=even) + P(X=x | Y=odd)P(Y=odd)\\ &= \frac{1}{2} P(X=x | Y=even) + \frac{1}{2} P(X=x | Y=odd). \end{align*}
Using $P(X=x)$ we can query events concerning only the random variable $X$. Its value will take into account all possible values of $Y$ by giving them weights proportional to their probability of occurrence.
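The two die examples and the marginalization above can likewise be checked by enumerating the joint distribution (a sketch; pr is a hypothetical helper that sums the joint pmf over a predicate):
from fractions import Fraction

# joint pmf of X (die outcome) and Y (parity) for a fair die
joint = {(x, "even" if x % 2 == 0 else "odd"): Fraction(1, 6) for x in range(1, 7)}

def pr(pred):
    return sum(p for (x, y), p in joint.items() if pred(x, y))

# {X <= 4} and {Y = even} are independent: the probabilities factorize...
print(pr(lambda x, y: x <= 4 and y == "even") ==
      pr(lambda x, y: x <= 4) * pr(lambda x, y: y == "even"))  # True
# ...but {X <= 3} and {Y = even} are dependent
print(pr(lambda x, y: x <= 3 and y == "even") ==
      pr(lambda x, y: x <= 3) * pr(lambda x, y: y == "even"))  # False
# marginalizing Y out recovers the pmf of X: six values of 1/6
print([pr(lambda x, y: x == v) for v in range(1, 7)])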
Expectation and Variance¶
One may wonder how the behavior of a random variable can be summarized by a single number. This is where the notion of expectation comes into play. The expectation (a.k.a. expected value) of a random variable $X$ is defined as:
$E[X] := \sum_{x \in \Lambda} x P_X(x)$
In the three coin tosses example above where the random variable $X$ indicates the number of heads, $E[X] = 1.5$ because $E[X] = 0 \cdot \frac{1}{8} + 1 \cdot \frac{3}{8} + 2 \cdot \frac{3}{8} + 3 \cdot \frac{1}{8} = 1.5$.
The expectation of a random variable is also called its mean or first moment. The expectation of a random variable is a measure of its central tendency. However, it does not tell us anything about the spread of the random variable. This can be measured by the variance of a random variable which is defined as:
$Var[X] := E[(X-E[X])^2] = E[X^2] - E[X]^2$.
In the above example, $Var[X] = 0.75$ because $Var[X] = E[X^2] - E[X]^2 = 0^2 \cdot \frac{1}{8} + 1^2 \cdot \frac{3}{8} + 2^2 \cdot \frac{3}{8} + 3^2 \cdot \frac{1}{8} - 1.5^2 = 0.75$.
The square root of the variance is called the standard deviation of a random variable. Standard deviation is commonly denoted by $\sigma$. In the above example, $\sigma(X) = \sqrt{0.75} \approx 0.866$.
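These summary statistics are easy to reproduce numerically; the following sketch evaluates the definitions on the coin-toss pmf directly:
import torch

xs = torch.tensor([0., 1., 2., 3.])                # values of X
ps = torch.tensor([1., 3., 3., 1.]) / 8.           # pmf of X
mean = (xs * ps).sum()                             # E[X] = 1.5
var = ((xs - mean) ** 2 * ps).sum()                # Var[X] = E[(X - E[X])^2] = 0.75
print(mean.item(), var.item(), var.sqrt().item())  # 1.5 0.75 ~0.866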
Variance is also known as the second central moment of a random variable. Generally speaking, the $k$-th central moment of a random variable is defined as:
$E[(X-E[X])^k]$
where $k$ is a positive integer. (The expectation itself is the first raw moment $E[X]$; the first central moment is always zero.) The second central moment is the variance. The third central moment, normalized by $\sigma^3$, is called the skewness of a random variable. It is a measure of the asymmetry of the distribution of a random variable. The fourth central moment, normalized by $\sigma^4$, is called the kurtosis of a random variable. It is a measure of the heaviness of the tails of the distribution of a random variable.
When we have a joint distribution of two random variables $X$ and $Y$, we may be interested in their influence on each other's spread. We can quantify this influence by the covariance of $X$ and $Y$ which is defined as:
$Cov[X,Y] := E[(X-E[X])(Y-E[Y])] = E[XY] - E[X]E[Y]$.
Note that we recover the variance of $X$ when $Y=X$:
$Cov[X,X] = E[(X-E[X])^2] = Var[X]$.
Continuous random variables¶
Now consider the case where $\Lambda = \mathbb{R}$. In this case, we have a continuous random variable with the induced probability measure:
$P_X(A) = P(\{\omega \in \Omega: X(\omega) \in A\})$
where $A \subset \mathbb{R}$. This probability measure takes the pre-image of $A$ under $X$ as its argument, i.e. $P_X(A) = P(X^{-1}(A))$.
A commonplace situation is a real-valued random variable $X: \Omega \rightarrow \mathbb{R}$ where events are intervals $(a,b)$ on the range of $X$. In this case, we can define a probability measure on $\mathbb{R}$ as follows:
$P_X(a < x < b) := P(\{\omega \in \Omega: X(\omega) \in (a,b)\})$
where $a,b \in \mathbb{R}$ and $a < b$. The $\sigma$-algebra of $\mathbb{R}$ generated by the intervals of the form $(a,b)$ is called the Borel $\sigma$-algebra. A counterintuitive fact is that it is not possible to assign a probability to every subset of $\mathbb{R}$. Hence, $\sigma(\mathbb{R}) \subsetneq 2^{\mathbb{R}}$, meaning that there are subsets of $\mathbb{R}$ to which we cannot assign a probability. This is a consequence of the fact that we need the probability of a union of countably many disjoint events to equal the sum of their probabilities, and this cannot be guaranteed for all subsets of $\mathbb{R}$.
We may wonder about the probability that a random variable is smaller than or equal to a certain value. This is given by the cumulative distribution function of $X$, defined as:
$F_X(x) := P(X \leq x)$ for all $x \in \mathbb{R}$.
Notably, $F_X(x)$ is a non-decreasing function. The probability of an event can be described in terms of the cumulative distribution function as follows:
$P(a < X < b) = P(X \leq b) - P(X \leq a) = F_X(b) - F_X(a)$.
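Numerical libraries expose cumulative distribution functions directly; for instance, with torch one can compute an interval probability for a standard Gaussian (introduced formally below) as $F_X(b) - F_X(a)$:
import torch

d = torch.distributions.Normal(0.0, 1.0)
a, b = torch.tensor(-1.0), torch.tensor(1.0)
print((d.cdf(b) - d.cdf(a)).item())   # P(-1 < X < 1) ~ 0.6827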
In many applications, we are interested in interpreting the behavior of a continuous distribution by investigating the probability density it assigns around each point of the sample space. The function that gives this information is called the probability density function of $X$ and is defined as the derivative of $F_X(x)$ with respect to $x$:
$f_X(x) := \frac{d}{dx} F_X(x)$ for all $x \in \mathbb{R}$.
Then, from the fundamental theorem of calculus, we have:
$F_X(a) = \int_{-\infty}^a f_X(x) dx$.
Hence an event can be described in terms of the probability density function as follows:
$P(a < X < b) = F_X(b) - F_X(a) = \int_{-\infty}^b f_X(x) dx - \int_{-\infty}^a f_X(x) dx = \int_{a}^b f_X(x) dx$.
The definition of the probability density function makes full intuitive sense: the probability mass around a point stems from an infinitesimal change in the accumulated probability mass. The probability density function of a continuous random variable is non-negative and integrates to 1:
$\int_{-\infty}^{\infty} f_X(x) dx = 1$.
However, keep in mind that the probability density function can take values greater than 1, since its value is not a probability but a probability density. Only the integral of the density over a set of outcomes yields a probability; indeed, any single point has probability zero:
$P_X(X=x) = P_X(x < X < x) = \int_{x}^{x} f_X(u) du = 0$.
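The following sketch illustrates both points: a Gaussian with a small standard deviation has density values well above 1, yet its density still integrates to 1 over the real line (here approximated numerically on a grid):
import torch

d = torch.distributions.Normal(0.0, 0.1)
print(d.log_prob(torch.tensor(0.0)).exp().item())    # ~3.99: a density, not a probability
xs = torch.linspace(-1., 1., 10001)
print(torch.trapz(d.log_prob(xs).exp(), xs).item())  # ~1.0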
The cumulative distribution function of two jointly distributed random variables $X$ and $Y$ is defined as:
$F_{X,Y}(x,y) := P(X \leq x, Y \leq y) = \int_{-\infty}^x \int_{-\infty}^y f_{X,Y}(u,v) dv du$
where $f_{X,Y}(x,y)$ is the joint probability density function of $X$ and $Y$. It can be recovered from the joint cumulative distribution function by taking the mixed partial derivative with respect to $x$ and $y$:
$f_{X,Y}(x,y) := \frac{\partial^2}{\partial x \, \partial y} F_{X,Y}(x,y)$ for all $x,y \in \mathbb{R}$.
The expectation of a continuous random variable is defined as:
$E[X] := \int_{-\infty}^{\infty} x f_X(x) dx$.
The definition of its variance and standard deviation are the same as in the discrete case.
Common Distributions¶
Bernoulli Distribution¶
The Bernoulli distribution is a discrete distribution with range $\Lambda = \{0,1\}$. It is defined as:
$P_X(x) = p^x (1-p)^{1-x}$ for $x \in \{0,1\}$
where $p \in [0,1]$ is called a parameter of the distribution. This parameter determines the degree of bias of the experiments towards one of the outcomes. The Bernoulli distribution is used to model the outcome of a single coin toss. The expectation of a Bernoulli random variable is $E[X] = p$ and its variance is $Var[X] = p(1-p)$.
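A quick empirical check of these formulas with torch (the parameter and sample size are chosen arbitrarily):
import torch

p = 0.3
bern = torch.distributions.Bernoulli(probs=p)
print(bern.mean.item(), bern.variance.item())       # p = 0.3, p(1-p) = 0.21
samples = bern.sample((100000,))
print(samples.mean().item(), samples.var().item())  # close to 0.3 and 0.21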
Beta distribution¶
The beta distribution is a continuous distribution with range $\Lambda = [0,1]$. It is defined as:
$f_X(x) = \frac{\Gamma(\alpha + \beta)}{\Gamma(\alpha)\Gamma(\beta)} x^{\alpha-1} (1-x)^{\beta-1}$ for $x \in [0,1]$
where $\alpha, \beta > 0$ are parameters and $\Gamma(x)$ is the gamma function defined as:
$\Gamma(x) = \int_0^{\infty} t^{x-1} e^{-t} dt$.
The beta distribution is used to model the probability of success in a Bernoulli trial. The expectation of a beta random variable is $E[X] = \frac{\alpha}{\alpha + \beta}$ and its variance is $Var[X] = \frac{\alpha \beta}{(\alpha + \beta)^2(\alpha + \beta + 1)}$. It is, so to speak, a factory of coins in a coin toss experiment. The parameters $\alpha$ and $\beta$ determine the confidence in the outcome being heads and tails, respectively. They can be interpreted as the number of heads and tails observed prior to a target experiment. The fairness of the coin to be produced is determined only by the ratio $\frac{\alpha}{\alpha + \beta}$. However, the spread in the fairness of the coins produced is determined by the magnitudes of $\alpha$ and $\beta$: the larger the values of $\alpha$ and $\beta$, the smaller the spread.
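The effect of the concentration can be visualized by plotting beta densities that share the same mean $\frac{\alpha}{\alpha + \beta} = 0.5$ but have increasing $\alpha + \beta$ (a sketch using torch; the parameter values are arbitrary):
import torch
import matplotlib.pyplot as plt

xs = torch.linspace(0.01, 0.99, 200)
for a, b in [(1., 1.), (5., 5.), (50., 50.)]:   # same mean 0.5, growing concentration
    beta = torch.distributions.Beta(a, b)
    plt.plot(xs.numpy(), beta.log_prob(xs).exp().numpy(), label=f"alpha = beta = {a:g}")
plt.legend()
plt.show()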
Multi-noulli Distribution¶
The multi-noulli distribution, a.k.a. categorical distribution, is a discrete distribution with range $\Lambda = \{1,\dots,n\}$. Encoding an outcome $x$ as a one-hot vector $(x_1, \dots, x_n)$ with $x_i = 1$ if $x = i$ and $x_i = 0$ otherwise, it is defined as:
$P_X(x) = p_1^{x_1} p_2^{x_2} \dots p_n^{x_n}$, which reduces to $P_X(x) = p_x$ for $x \in \{1,\dots,n\}$
where $p_1, p_2, \dots, p_n \in [0,1]$ are probabilities assigned to the outcome categories. They satisfy $\sum_{i=1}^n p_i = 1$. Treating the categories as integers, the expectation of a multi-noulli random variable is $E[X] = \sum_{i=1}^n i p_i$ and its variance is $Var[X] = \sum_{i=1}^n i^2 p_i - \left(\sum_{i=1}^n i p_i\right)^2$.
Dirichlet Distribution¶
The Dirichlet distribution is a continuous distribution with range $\Lambda = \{x \in \mathbb{R}^d: x_i \geq 0, \sum_{i=1}^d x_i = 1\}$ where $x=[x_1, x_2, \dots, x_d]$. It is defined as:
$f_X(x) = \frac{\Gamma(\sum_{i=1}^d \alpha_i)}{\prod_{i=1}^d \Gamma(\alpha_i)} \prod_{i=1}^d x_i^{\alpha_i - 1}$ for $x \in \Lambda$
where $\alpha_1, \alpha_2, \dots, \alpha_d > 0$. The Dirichlet distribution is used to model the probability of success in a multi-noulli trial. It is, so to speak, a factory of dice in a dice roll experiment. The expectation of a Dirichlet random variable is, componentwise, $E[X_i] = \frac{\alpha_i}{\sum_{j=1}^d \alpha_j}$ and its variance is $Var[X_i] = \frac{\alpha_i (\sum_{j=1}^d \alpha_j - \alpha_i)}{(\sum_{j=1}^d \alpha_j)^2(\sum_{j=1}^d \alpha_j + 1)}$.
Uniform distribution¶
The uniform distribution is a continuous distribution with range $\Lambda = [a,b]$. The probability density function of a uniform random variable is:
$f_X(x) = \frac{1}{b-a}$ for $x \in [a,b]$
where $a,b \in \mathbb{R}$ and $a < b$. The uniform distribution is used to model the outcome of a measurement where all outcomes are equally likely. The expectation of a uniform random variable is $E[X] = \frac{a+b}{2}$ and its variance is $Var[X] = \frac{(b-a)^2}{12}$.
Gaussian Distribution¶
The Gaussian distribution, a.k.a. normal distribution, is a continuous distribution with range $\Lambda = \mathbb{R}$. The probability density function of a Gaussian random variable is:
$f_X(x) = \mathcal{N}(x|\mu, \sigma^2) = \frac{1}{\sqrt{2 \pi \sigma^2}} e^{-\frac{(x-\mu)^2}{2 \sigma^2}}$ for $x \in \mathbb{R}$
where $\mu \in \mathbb{R}$ and $\sigma > 0$. The Gaussian distribution is used to model the outcome of a measurement. The expectation of a Gaussian random variable is $E[X] = \mu$ and its variance is $Var[X] = \sigma^2$.
The mean of the Gaussian distribution determines the location of its peak, while its variance determines its spread. The Gaussian distribution is a very important distribution because of the central limit theorem, which states that the (suitably normalized) sum of a large number of independent random variables with finite variance is approximately Gaussian. This is the reason why the Gaussian distribution is ubiquitous in nature.
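The central limit theorem is easy to observe in simulation; for instance, sums of thirty independent uniform variables already look bell-shaped (an illustrative sketch with arbitrary sample sizes):
import torch
import matplotlib.pyplot as plt

sums = torch.rand(100000, 30).sum(dim=1)      # each entry: sum of 30 Uniform(0,1) draws
plt.hist(sums.numpy(), bins=100, density=True)
plt.show()
print(sums.mean().item(), sums.var().item())  # close to 15 and 30/12 = 2.5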
The multivariate Gaussian distribution¶
The multivariate Gaussian distribution is a continuous distribution with range $\Lambda = \mathbb{R}^n$ for some dimensionality $n$. It is defined as:
$f_X(x) = \mathcal{N}(x|\mu, \Sigma) = \frac{1}{\sqrt{(2 \pi)^n |\Sigma|}} e^{-\frac{1}{2} (x-\mu)^T \Sigma^{-1} (x-\mu)}$ for $x \in \mathbb{R}^n$
where $\mu \in \mathbb{R}^n$ and $\Sigma \in \mathbb{R}^{n \times n}$ is a positive definite matrix. The multivariate Gaussian distribution is used to model the outcome of a measurement with multiple dimensions. The expectation of a multivariate Gaussian random variable is $E[X] = \mu$ and its covariance matrix is $Cov[X] = \Sigma$.
The Gaussian distribution has some nice properties. For instance, the marginal distribution of any subset of the variables of a multivariate Gaussian distribution is also Gaussian. Likewise, the conditional distribution of a subset of variables given the rest is also Gaussian. Consider a multivariate normal distribution with two groups of variables $X$ and $Y$. Given the joint density function:
$$\mathcal{N} \left ( \begin{bmatrix} X \\ Y \end{bmatrix} \middle | \begin{bmatrix} \mu_X \\ \mu_Y \end{bmatrix}, \begin{bmatrix} \Sigma_{XX} & \Sigma_{XY} \\ \Sigma_{YX} & \Sigma_{YY} \end{bmatrix} \right )$$
the marginal distribution of $X$ is:
$$\mathcal{N} \left ( X \middle | \mu_X, \Sigma_{XX} \right )$$
and the marginal distribution of $Y$ is:
$$\mathcal{N} \left ( Y \middle | \mu_Y, \Sigma_{YY} \right )$$
The conditional distribution of $X$ given $Y$ is:
$$\mathcal{N} \left ( X \middle | \mu_X + \Sigma_{XY} \Sigma_{YY}^{-1} (Y-\mu_Y), \Sigma_{XX} - \Sigma_{XY} \Sigma_{YY}^{-1} \Sigma_{YX} \right )$$
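For the bivariate case, these formulas reduce to scalar arithmetic. The sketch below evaluates the conditional mean and variance of $X$ given $Y = 1$ for the parameters used in the plot that follows:
mu_x, mu_y = 0.0, 0.0
S_xx, S_xy, S_yy = 2.0, 1.0, 2.0              # entries of the covariance matrix below
y = 1.0
cond_mean = mu_x + S_xy / S_yy * (y - mu_y)   # 0.5
cond_var = S_xx - S_xy / S_yy * S_xy          # 1.5
print(cond_mean, cond_var)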
Let us next visualize the density function of a bivariate Gaussian distribution with parameters $\mu = [0,0]^T$ and $\Sigma = \begin{bmatrix} 2 & 1 \\ 1 & 2 \end{bmatrix}$ side by side with its marginals for the first and second dimensions, respectively.
import torch
import matplotlib.pyplot as plt
import seaborn as sns
import matplotlib.gridspec as gridspec
# Create a 2D Gaussian distribution with mean vector [0, 0]
# and covariance matrix [[2, 1], [1, 2]]
norm2d = torch.distributions.MultivariateNormal(loc=torch.zeros(2),
                                                covariance_matrix=torch.eye(2) + 1.)
# Create a 2D grid of points in the range [-3, 3]
# with 100 steps in each direction
xs = torch.linspace(-3., 3., steps=100)
ys = torch.linspace(-3.,3., steps=100)
xx, yy = torch.meshgrid(xs, ys, indexing="xy")
# Compute the density of the multivariate Gaussian at each point on the grid
norm2d_densities = norm2d.log_prob(torch.vstack((xx.ravel(),
                                                 yy.ravel())).t()).reshape(xx.shape).exp()
# Compute the marginal density of the Gaussian for each variable
# (Normal expects the standard deviation, i.e. the square root of the variance)
marginal_x = torch.distributions.Normal(norm2d.loc[0],
                                        norm2d.covariance_matrix[0, 0].sqrt())
marginal_y = torch.distributions.Normal(norm2d.loc[1],
                                        norm2d.covariance_matrix[1, 1].sqrt())
marginal_x_vals = marginal_x.log_prob(xs).exp().numpy()
marginal_y_vals = marginal_y.log_prob(ys).exp().numpy()
# Plot the results
fig = plt.figure(figsize=(8, 8))
gs = gridspec.GridSpec(3, 3)
ax_main = plt.subplot(gs[1:3, :2])
ax_xDist = plt.subplot(gs[0, :2], sharex=ax_main)
ax_yDist = plt.subplot(gs[1:3, 2], sharey=ax_main)
contours = ax_main.contour(xx, yy, norm2d_densities,
                           6, colors="black")
ax_main.clabel(contours, inline=True, fontsize=8)
ax_main.imshow(norm2d_densities,
               extent=[-3, 3, -3, 3], origin="lower",
               cmap="Purples", alpha=0.3)
ax_xDist.plot(xs, marginal_x_vals, color="k")
ax_yDist.plot(marginal_y_vals, ys, color="k")
ax_xDist.fill_between(xs, marginal_x_vals, 0, color='purple', alpha=0.3)
ax_xDist.set_ylim((0, 0.3))
ax_yDist.fill_betweenx(ys, marginal_y_vals, 0, color='purple', alpha=0.3)
ax_yDist.set_xlim((0, 0.3))
sns.despine();
Let us next take samples from the same distribution. Play with the sample size in the code below and observe how it affects the accuracy of the resulting mean and variance estimates compared to the true values.
samples = norm2d.sample((500,))
print("Mean: {0}".format(samples.mean(0)))
print("Covariance:")
print(samples.T.cov())
plt.scatter(samples[:, 0], samples[:, 1])
plt.show()
Mean: tensor([0.0398, 0.0600])
Covariance:
tensor([[1.8607, 1.0072],
        [1.0072, 2.0132]])
Let us next see how the Dirichlet distribution behaves.
import torch
import matplotlib.pyplot as plt
import seaborn as sns
import matplotlib.gridspec as gridspec
dir1 = torch.distributions.Dirichlet(torch.tensor([1., 1., 1.]))
samples1 = dir1.sample([10000, ])
dir10 = torch.distributions.Dirichlet(torch.tensor([10., 10., 10.]))
samples10 = dir10.sample([10000, ])
# Only the relative proportions determine the mean
print("Means:")
print(samples1.mean(0))
print(samples10.mean(0))
print("Variances:")
# The variance is inversely proportional to the concentration parameter
print(samples1.var(0))
print(samples10.var(0))
Means:
tensor([0.3336, 0.3284, 0.3380])
tensor([0.3320, 0.3344, 0.3336])
Variances:
tensor([0.0557, 0.0550, 0.0559])
tensor([0.0072, 0.0073, 0.0075])
# Source: https://gist.github.com/tboggs/8778945
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.tri as tri

_corners = np.array([[0, 0], [1, 0], [0.5, 0.75**0.5]])
_AREA = 0.5 * 1 * 0.75**0.5
_triangle = tri.Triangulation(_corners[:, 0], _corners[:, 1])
# For each corner of the triangle, the pair of other corners
_pairs = [_corners[np.roll(range(3), -i)[1:]] for i in range(3)]
# The area of the triangle formed by point xy and another pair of points
tri_area = lambda xy, pair: 0.5 * np.linalg.norm(np.cross(*(pair - xy)))

def xy2bc(xy, tol=1.e-4):
    '''Converts 2D Cartesian coordinates to barycentric.

    Arguments:
        `xy`: A length-2 sequence containing the x and y value.
    '''
    coords = np.array([tri_area(xy, p) for p in _pairs]) / _AREA
    return np.clip(coords, tol, 1.0 - tol)

class Dirichlet(object):
    def __init__(self, alpha):
        '''Creates Dirichlet distribution with parameter `alpha`.'''
        from math import gamma
        self._alpha = np.array(alpha)
        self._coef = gamma(np.sum(self._alpha)) / \
            np.multiply.reduce([gamma(a) for a in self._alpha])

    def pdf(self, x):
        '''Returns pdf value for `x`.'''
        return self._coef * np.multiply.reduce([xx ** (aa - 1)
                                                for (xx, aa) in zip(x, self._alpha)])

    def sample(self, N):
        '''Generates a random sample of size `N`.'''
        return np.random.dirichlet(self._alpha, N)

def draw_pdf_contours(dist, border=False, nlevels=200, subdiv=8, **kwargs):
    '''Draws pdf contours over an equilateral triangle (2-simplex).

    Arguments:
        `dist`: A distribution instance with a `pdf` method.
        `border` (bool): If True, the simplex border is drawn.
        `nlevels` (int): Number of contours to draw.
        `subdiv` (int): Number of recursive mesh subdivisions to create.
        kwargs: Keyword args passed on to `plt.triplot`.
    '''
    refiner = tri.UniformTriRefiner(_triangle)
    trimesh = refiner.refine_triangulation(subdiv=subdiv)
    pvals = [dist.pdf(xy2bc(xy)) for xy in zip(trimesh.x, trimesh.y)]
    plt.tricontourf(trimesh, pvals, nlevels, cmap='jet', **kwargs)
    plt.axis('equal')
    plt.xlim(0, 1)
    plt.ylim(0, 0.75**0.5)
    plt.axis('off')
    if border is True:
        plt.triplot(_triangle, linewidth=1)

def plot_points(X, barycentric=True, border=True, **kwargs):
    '''Plots a set of points in the simplex.

    Arguments:
        `X` (ndarray): A 2xN array (if in Cartesian coords) or 3xN array
            (if in barycentric coords) of points to plot.
        `barycentric` (bool): Indicates if `X` is in barycentric coords.
        `border` (bool): If True, the simplex border is drawn.
        kwargs: Keyword args passed on to `plt.plot`.
    '''
    if barycentric is True:
        X = X.dot(_corners)
    plt.plot(X[:, 0], X[:, 1], 'k.', ms=1, **kwargs)
    plt.axis('equal')
    plt.xlim(0, 1)
    plt.ylim(0, 0.75**0.5)
    plt.axis('off')
    if border is True:
        plt.triplot(_triangle, linewidth=1)

if __name__ == '__main__':
    f = plt.figure(figsize=(8, 6))
    alphas = [[0.999] * 3,
              [5] * 3,
              [2, 5, 15]]
    for (i, alpha) in enumerate(alphas):
        plt.subplot(2, len(alphas), i + 1)
        dist = Dirichlet(alpha)
        draw_pdf_contours(dist)
        title = r'$\alpha$ = (%.3f, %.3f, %.3f)' % tuple(alpha)
        plt.title(title, fontdict={'fontsize': 8})
        plt.subplot(2, len(alphas), i + 1 + len(alphas))
        plot_points(dist.sample(5000))
Estimators and bias¶
Estimator: A function $f$ that maps a sample $S$ to a value $\hat{\theta} = f(S)$ is called an estimator of the parameter $\theta$. For instance, the sample mean $\widehat{X} = \frac{1}{n} \sum_{i=1}^n X_i$ is an estimator of the mean $\mu$ of a random variable $X$.
Estimator Bias: The bias of an estimator $f$ is defined as $B(f) = E[f(S)] - \theta$. An estimator is said to be unbiased if $B(f) = 0$.
For example, the sample mean $\widehat{X}$ is an unbiased estimator of the mean $\mu$ of a random variable $X$ because:
\begin{align*} B(\widehat{X}) &= E[\widehat{X}] - \mu \\ &= E\left[\frac{1}{n} \sum_{i=1}^n X_i \right] - \mu \\ &= \frac{1}{n} \sum_{i=1}^n E[X_i] - \mu \\ &= \frac{1}{n} \sum_{i=1}^n \mu - \mu \\ &= 0. \end{align*}
However, the sample variance $S^2 = \frac{1}{n} \sum_{i=1}^n (X_i - \widehat{X})^2$ is a biased estimator of the variance $\sigma^2$ of a random variable $X$. That is why it is common to use the unbiased sample variance $\frac{1}{n-1} \sum_{i=1}^n (X_i - \widehat{X})^2$ instead of the sample variance $S^2$. The change made in the denominator is called Bessel's correction.
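Bessel's correction can be observed empirically by averaging both estimators over many small samples (a sketch with arbitrary sample sizes; the true variance is 1):
import torch

n, trials = 5, 100000
samples = torch.randn(trials, n)                          # many samples of size n from N(0, 1)
print(samples.var(dim=1, unbiased=False).mean().item())   # ~ (n-1)/n = 0.8, biased low
print(samples.var(dim=1, unbiased=True).mean().item())    # ~ 1.0, unbiased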
Consistency: An estimator $f$ is said to be consistent if $\lim_{n \to \infty} P(|f(S) - \theta| \geq \epsilon) = 0$ for any $\epsilon > 0$. That is, the probability of the estimator being far from the true value goes to zero as the sample size increases.
Concentration of measure inequalities¶
Theorem 5.1 (Markov's inequality) Let $X$ be a non-negative random variable. Then for any $\epsilon > 0$, the following inequality holds:
$P(X \geq \epsilon) \leq \frac{E[X]}{\epsilon}$.
Example: Consider ten Bernoulli random variables $X_1, \ldots, X_{10}$ with $P(X_i = 1) = P(X_i = 0) = 0.5$. Since $E[\sum_{i=1}^{10} X_i] = 5$, Markov's inequality only gives us the bound $P(\sum_{i=1}^{10} X_i \geq 3) \leq 5/3$, which is trivial. Such bounds are called vacuous.
Theorem 5.2 (Chebyshev's inequality) Let $X$ be a random variable with finite mean $\mu$ and variance $\sigma^2$. Then for any $\epsilon > 0$, the following inequality holds:
$P(|X - \mu| \geq \epsilon) \leq \frac{\sigma^2}{\epsilon^2}$.
Consider the sample $S=\{X_1, \ldots, X_n\}$ of i.i.d. Bernoulli distributed random variables with sample average $\widehat{\mu}_n = \frac{1}{n} \sum_{i=1}^n X_i$. We may wonder how much $\widehat{\mu}_n$ deviates from the mean $\mu$ of $X$. Markov's inequality would give us only:
\begin{align*} P(\widehat{\mu}_n - E[\widehat{\mu}_n] \geq \epsilon) &= P(\widehat{\mu}_n \geq E[\widehat{\mu}_n] + \epsilon) \\ &= P(\widehat{\mu}_n \geq \mu + \epsilon) \\ &\leq \frac{E[\widehat{\mu}_n]}{\mu + \epsilon} \\ &= \frac{\mu}{\mu + \epsilon}. \end{align*}
Remarkably, this inequality will not get tighter no matter how large $n$ is. In order to analyze machine learning algorithms, we need bounds that get tighter as $n$ increases, i.e. the learning agent collects more experience. Chebyshev's inequality does exactly that:
\begin{align*} P(|\widehat{\mu}_n - E[\widehat{\mu}_n]| \geq \epsilon) &\leq \frac{Var[\widehat{\mu}_n]}{\epsilon^2} \\ &= \frac{Var\left[\frac{1}{n}\sum_{i=1}^n X_i\right]}{\epsilon^2} \\ &= \frac{1}{n^2}\frac{\sum_{i=1}^n Var[X_i]}{\epsilon^2} \\ &= \frac{1}{n^2}\frac{n \sigma^2}{\epsilon^2} \\ &= \frac{\sigma^2}{n \epsilon^2}. \end{align*}
The derivation uses the following two properties of variance:
$Var[\sum_{i=1}^n X_i] = \sum_{i=1}^n Var[X_i]$ for independent random variables $X_i$,
$Var[aX] = a^2 Var[X]$ for any random variable $X$ and constant $a$.
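A Monte Carlo check of this bound for the mean of $n$ fair Bernoulli variables (here $\sigma^2 = 0.25$; the sample sizes below are arbitrary):
import torch

n, eps, trials = 100, 0.1, 100000
mu_hat = torch.bernoulli(0.5 * torch.ones(trials, n)).mean(dim=1)
print(((mu_hat - 0.5).abs() >= eps).float().mean().item())  # empirical: ~0.06
print(0.25 / (n * eps ** 2))                                # Chebyshev bound: 0.25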
An immediate consequence of this inequality is that the sample mean $\widehat{\mu}_n$ converges to the true mean $\mu$ as the sample size $n$ increases. This is called the weak law of large numbers. Formally it is stated as follows.
Theorem 5.3 (Weak law of large numbers) Let $X_1, \ldots, X_n$ be i.i.d. random variables with finite mean $\mu$ and variance $\sigma^2$. Then for any $\epsilon > 0$, the following inequality holds:
$\lim_{n \to \infty} P(|\widehat{\mu}_n - \mu| \geq \epsilon) = 0$
where $\widehat{\mu}_n = \frac{1}{n} \sum_{i=1}^n X_i$.
Via the law of large numbers, we conclude that the sample mean $\widehat{\mu}_n$ is a consistent estimator of the mean $\mu$ of a random variable $X$. In other words, the sample mean converges to the true mean as the sample size increases.
Chebyshev's inequality gets tighter at the rate $1/n$. By making further assumptions on the random variables, we can make the bound tighter at a faster rate. For instance, if the random variables are bounded, we can use Hoeffding's inequality to get a bound that decreases exponentially with $n$.
Theorem 5.4 (Hoeffding's inequality) Let $X_1, \ldots, X_n$ be i.i.d. random variables such that $P(a_i \leq X_i \leq b_i) = 1$ for all $i$. Then for any $\epsilon > 0$, the following inequality holds:
$P(\frac{1}{n} \sum_{i=1}^n X_i - E[\frac{1}{n} \sum_{i=1}^n X_i] \geq \epsilon) \leq e^{-2n\epsilon^2/\sum_{i=1}^n(b_i-a_i)^2}$.
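Comparing the two bounds for the fair-Bernoulli setting above shows the exponential improvement (here using the one-sided Hoeffding bound for variables in $[0,1]$):
import math

n, eps = 100, 0.1
print(0.25 / (n * eps ** 2))         # Chebyshev: 0.25
print(math.exp(-2 * n * eps ** 2))   # Hoeffding: exp(-2) ~ 0.135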
We aim to use these inequalities to bound the generalization performances of learning algorithms. Imagine that $X_i$ is the loss of the $i$-th training example. Then $\widehat{\mu}_n = \frac{1}{n} \sum_{i=1}^n X_i$ is the empirical risk of the learning algorithm and $\mu = E[\widehat{\mu}_n]$ is the expected risk. For simplicity let us consider the case where $X_i \in [0,1]$ for all $i$. Then we have
$P(\mu \geq \widehat{\mu}_n + \epsilon) \leq e^{-2n\epsilon^2}$.
We would like to express the deviation $\epsilon$ between the empirical and expected risks in terms of a confidence level. Denoting $\delta := e^{-2n\epsilon^2}$ and solving for $\epsilon$ yields
\begin{align*} \epsilon = \sqrt{\dfrac{\log \frac{1}{\delta}}{2n}} \end{align*}
Plugging this value of $\epsilon$ into the inequality above we have
$P \left(\mu \geq\widehat{\mu}_n + \sqrt{\dfrac{\log \frac{1}{\delta}}{2n}} \right ) \leq \delta$.
Later on we will allocate $\mu$ for generalization performance and $\widehat{\mu}_n$ for training performance. Hence we will be more interested in the complementary event:
$P \left(\mu \leq\widehat{\mu}_n + \sqrt{\dfrac{\log \frac{1}{\delta}}{2n}} \right ) \geq 1 - \delta$.
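To get a feel for the rate, the following sketch evaluates the confidence term $\sqrt{\log(1/\delta)/(2n)}$ at $\delta = 0.05$ for a few sample sizes:
import math

delta = 0.05
for n in [100, 1000, 10000]:
    print(n, math.sqrt(math.log(1 / delta) / (2 * n)))
# 100 -> ~0.122, 1000 -> ~0.039, 10000 -> ~0.012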
Concentration inequalities of this form are the basis of statistical learning theory. They are also called generalization bounds because they bound the generalization performance of learning algorithms. We will cover them in more detail in the next chapter.