In this notebook we will work through some basic manipulations of probability distributions, e.g. marginalization and conditioning. We'll use a bivariate Gaussian distribution because so many manipulations one might do are analytic, which provides a cross-check.
By the end of the notebook, you should be able to:
Here is some information about multivariate Gaussians, and in particular identities for conditional and marginal distributions: https://en.wikipedia.org/wiki/Multivariate_normal_distribution#Joint_normality
Potentially useful definitions for univariate probability distributions:
Note: Equations in markdown cells are coded in LaTeX, between $'s. Examine this cell in edit mode (double click it) to see. If you're not yet a LaTeX magician, don't worry; you'll probably see everything you need for the moment as we go. When in doubt, the appendices of this guide list many helpful math commands.
Note 2: This is one of very few times in the course when you will be asked to do math. Looking up and reporting the answer, or resorting to a program like Mathematica (except for things you might find in a table of integrals), are therefore not ok. Either some working out or argumentation (see below) should be shown.
It is possible to solve all of the analytic stuff in this notebook without once carrying out an integral by hand, and you are strongly encouraged to do so. The key is to use the properties of PDFs. When we work with probability densities, we are in a tiny and specialized corner of the space of all calculus, and there are loads of shortcuts. Of note here:
These are REALLY helpful shortcuts to get comfortable with.
To provide a little more motivation, the solutions in part 1 can be written down essentially immediately using the properties of PDFs covered in the notes. With a little algebraic manipulation, the joint PDF in part 2 can be rearranged into something recognizable as either a product $p(x)p(y|x)$ or $p(y)p(x|y)$, depending how you group terms. There is no need to do any actual calculus here.
Import packages
TutorialName = 'essential_probability'
exec(open('tbc.py').read()) # define TBC and TBC_above
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
We start with a simple 2D uncorrelated Gaussian probability distribution: $x$ and $y$ are independent. The function below defines this distribution (you can also find a 2D Gaussian in `scipy.stats`, but for now we'll write our own). When $x$ and $y$ are uncorrelated, their joint 2D Gaussian distribution is nothing more than the product of a 1D Gaussian over $x$ and a 1D Gaussian over $y$.
# dict of parameter values: the means and standard deviations for x and y
unc = {'mx':1.0, 'my':2.3, 'sx':1.0, 'sy':0.5}
def unc_p_xy(x, y, mx, my, sx, sy):
    '''returns pdf of 2D uncorrelated gaussian distribution evaluated at (x,y)'''
    return np.exp(-0.5 * ( ((x-mx)/sx)**2 + ((y-my)/sy)**2 )) / (2*np.pi * sx * sy)
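As a quick sanity check (not part of the assignment), the density at the mean should equal the normalizing constant $1/(2\pi\sigma_x\sigma_y)$, since the exponential factor is 1 there. The function and parameter dict are repeated here so the snippet stands alone:

```python
import numpy as np

def unc_p_xy(x, y, mx, my, sx, sy):
    '''returns pdf of 2D uncorrelated gaussian distribution evaluated at (x,y)'''
    return np.exp(-0.5 * ( ((x-mx)/sx)**2 + ((y-my)/sy)**2 )) / (2*np.pi * sx * sy)

unc = {'mx':1.0, 'my':2.3, 'sx':1.0, 'sy':0.5}

# at (mx, my) the exponent vanishes, so the pdf equals the prefactor
peak = unc_p_xy(unc['mx'], unc['my'], **unc)
expected = 1.0 / (2*np.pi * unc['sx'] * unc['sy'])
print(np.isclose(peak, expected))  # True
```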
Let's start with analytic manipulations. First write down the marginal probability distributions for $p(x)$ and $p(y)$.
Note: you will want to change the mode of the cell below, and in subsequent non-code responses, to Markdown to use LaTeX mode and/or insert images.
TBC()
Now, using properties of conditional distributions, work out $p(x|y)$ and $p(y|x)$:
TBC()
Now that you have the equations, code them up as functions in the cell below. Replace the TBC() calls with your solution, and delete the TBC_above() command outright. We will use these functions to compare our analytic and numerical results in later sections of this notebook.
Aside: If the `**kwargs` syntax below is unfamiliar, have a look here. In brief, in an argument list this is shorthand for any number of keyword arguments the user might pass. If we called `unc_p_x_given_y(1, 2, mx=3)` later on, then within the `unc_p_x_given_y` function scope we would have access to a dictionary called `kwargs`, which would be `{'mx':3}`. We can (and will) also make calls like `unc_p_x(1, **unc)`; this is executed as if it were `unc_p_x(1, mx=1.0, my=2.3, sx=1.0, sy=0.5)` (see the definition of `unc` above). You're obviously not required to use this syntax in your own code, but it's convenient enough that you'll be seeing a lot of it in these notebooks. (Incidentally, the fact that we used `**kwargs` in some of the prototypes below is a pretty heavy hint, once you're fluent with the syntax.)
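To make the mechanics concrete, here is a minimal illustration with a toy function (the names are purely illustrative, not from this notebook):

```python
def show_kwargs(a, **kwargs):
    '''returns the positional argument and the dict of extra keyword arguments'''
    return a, kwargs

params = {'mx': 1.0, 'sx': 2.0}

# extra keyword arguments are collected into the kwargs dict...
print(show_kwargs(1, mx=3))      # (1, {'mx': 3})
# ...and a dict can be unpacked into keyword arguments with **
print(show_kwargs(1, **params))  # (1, {'mx': 1.0, 'sx': 2.0})
```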
def unc_p_x(x, mx, my, sx, sy):
    '''returns p(x) for uncorrelated 2D Gaussian distribution'''
    TBC()

def unc_p_y(y, mx, my, sx, sy):
    '''returns p(y) for uncorrelated 2D Gaussian distribution'''
    TBC()

def unc_p_x_given_y(x, y, **kwargs):
    '''returns p(x|y) for uncorrelated 2D Gaussian distribution'''
    TBC()

def unc_p_y_given_x(y, x, **kwargs):
    '''returns p(y|x) for uncorrelated 2D Gaussian distribution'''
    TBC()

TBC_above()
For our numerical calculations we will use a grid. This has been implemented for you in the next cell using the handy `np.meshgrid()` function.
The grid resolution is deliberately chosen to be different relative to the distribution widths in $x$ and $y$. That way, if we ever get confused about which index corresponds to $x$ and which to $y$, we just need to look at the shape of the grid. The bounds are chosen to contain most of $p(x,y)$. Of course, you can play with all of these things and see what changes (or doesn't) as a result!
# x bounds
xmin = -4.0
xmax = 6.0
dx = 0.1
# y bounds
ymin = -0.2
ymax = 4.8
dy = 0.1
# define the x and y values and the meshgrid
xvalues = np.arange(xmin, xmax+dx, dx)
yvalues = np.arange(ymin, ymax+dy, dy)
grid_x, grid_y = np.meshgrid(xvalues, yvalues, indexing='ij')
Note the `indexing='ij'` option to `meshgrid`. This makes it return arrays where the first index corresponds to $x$ and the second to $y$, instead of vice versa. The result is a much better convention in terms of generalizing to higher dimensions (and it corresponds to our usual mathematical notation), but it means we will need to transpose arrays before plotting them if we want $x$ to appear on the horizontal axis and $y$ to appear on the vertical axis.
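A tiny self-contained example of the difference (toy arrays; the variable names here are illustrative only):

```python
import numpy as np

xv = np.array([0.0, 1.0, 2.0])  # 3 x values
yv = np.array([10.0, 20.0])     # 2 y values

gx_ij, gy_ij = np.meshgrid(xv, yv, indexing='ij')
gx_xy, gy_xy = np.meshgrid(xv, yv)  # default indexing='xy'

print(gx_ij.shape)  # (3, 2): first index runs over x
print(gx_xy.shape)  # (2, 3): first index runs over y
```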
# plot the x and y grids as a sanity check
plt.rcParams['figure.figsize'] = (14.0, 5.0)
fig, ax = plt.subplots(1,2);
ax[0].imshow(grid_x.T, cmap='gray', origin='lower', extent=[xmin, xmax, ymin, ymax]);
ax[1].imshow(grid_y.T, cmap='gray', origin='lower', extent=[xmin, xmax, ymin, ymax]);
Let's evaluate $p(x,y)$ on this grid and visualize the probability distribution:
# evaluate p(x,y)
ugrid_p_xy = unc_p_xy(grid_x, grid_y, **unc)
plt.rcParams['figure.figsize'] = (7.0, 5.0)
plt.imshow(ugrid_p_xy.T, origin='lower', extent=[xmin, xmax, ymin, ymax]);
plt.xlabel('x');
plt.ylabel('y');
The above plot shows $p(x,y)$; we want to marginalize over $y$ to find $p(x)$. It may help to write the equation down before jumping straight into code. How would you do this marginalization on a discrete grid?
$p(x)$ =
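In general, marginalizing a gridded density amounts to a Riemann sum over the marginalized axis. Here is a generic sketch on a toy uniform density (deliberately not using this notebook's variables, so the exercise above is still yours to do):

```python
import numpy as np

dx, dy = 0.5, 0.25
# toy joint density, constant over a 4x8 grid (first index = x, per indexing='ij'),
# normalized so that it sums to 1 when weighted by the cell area dx*dy
p_xy = np.ones((4, 8)) / (4*dx * 8*dy)

# approximate the integral over y with a sum over axis=1, weighted by dy
p_x = p_xy.sum(axis=1) * dy

print(np.allclose(p_x.sum() * dx, 1.0))  # True: the marginal is still normalized
```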
# Marginalize over y. The result should be a 1D array, since it is still a function of x.
# As you might guess, the comment below indicates that the remaining notebook cells assume your answer is stored
# in a variable named ugrid_p_x.
TBC()
# ugrid_p_x = ...
Let's have a look. The grid calculation above should match the analytic result very closely.
plt.rcParams['figure.figsize'] = (7.0, 5.0)
plt.plot(xvalues, ugrid_p_x, 'bo', label='grid calculation');
plt.plot(xvalues, unc_p_x(xvalues, **unc), 'r-', label='analytic expression');
plt.xlabel('x');
plt.ylabel('p(x)');
plt.legend();
One of the defining features of a probability distribution is that it integrates to 1. Verify by a quick calculation that our discrete approximation for $p(x)$, `ugrid_p_x`, is indeed normalized:
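As a generic illustration (on a standalone 1D standard normal, not `ugrid_p_x` itself), a discrete normalization check is just a Riemann sum over the grid:

```python
import numpy as np

dx = 0.01
xs = np.arange(-5.0, 5.0 + dx, dx)
p = np.exp(-0.5 * xs**2) / np.sqrt(2*np.pi)  # standard normal pdf

# the sum times the grid spacing approximates the integral, which should be ~1
# (not exactly 1, since the grid is finite and truncated at +/-5 sigma)
print(abs(p.sum() * dx - 1.0) < 1e-3)  # True
```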
# verify that it's normalized (within reasonable numerical error)
TBC()
# print(...)
We'll repeat the above steps to perform the marginalization over $x$ instead of $y$. Make sure to verify the distribution is properly normalized.
# marginalize p(x,y) over x and verify that it's normalized
TBC()
# ugrid_p_y = ...
# print(...)
plt.rcParams['figure.figsize'] = (7.0, 5.0)
plt.plot(yvalues, ugrid_p_y, 'bo', label='grid calculation');
plt.plot(yvalues, unc_p_y(yvalues, **unc), 'r-', label='analytic expression');
plt.xlabel('y');
plt.ylabel('p(y)');
plt.legend();
Now we would like to get a conditional distribution: given some value of $x$ (or $y$), what is the probability distribution for $y$ (or $x$)? In our example, this is most straightforward if we condition on a grid value. Otherwise, we would probably do some interpolation. Here we choose a couple particular values for fixing; feel free to play around with them.
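Conditioning on a grid value amounts to taking a slice of the joint grid and renormalizing it; here is a generic toy sketch (again not using the notebook's arrays, so the exercises below remain yours):

```python
import numpy as np

dx = 0.5
# toy joint density on a 4x3 grid (first index = x, per indexing='ij')
p_xy = np.array([[1., 2., 1.],
                 [2., 4., 2.],
                 [2., 4., 2.],
                 [1., 2., 1.]])

yi = 1                 # condition on the y value at grid index 1
slice_x = p_xy[:, yi]  # proportional to p(x, y=fixed), i.e. p(x|y) up to a constant

# renormalize so the conditional sums to 1 on the x grid
p_x_given_y = slice_x / (slice_x.sum() * dx)

print(np.isclose(p_x_given_y.sum() * dx, 1.0))  # True
```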
xi = 30 # index into the grid of x's
fixed_x = xvalues[xi]
print(fixed_x)
yi = 40 # similarly for y
fixed_y = yvalues[yi]
print(fixed_y)
Calculate the conditional probability $p(x|y=$ fixed_y$)$, and verify its normalization.
# p(x,y) = p(x|y) p(y)
# ugrid_p_x_given_y = ...
# verify that it's normalized
# print(...)
TBC()
plt.rcParams['figure.figsize'] = (7.0, 5.0)
plt.plot(xvalues, ugrid_p_x_given_y, 'bo', label='grid calculation');
plt.plot(xvalues, unc_p_x_given_y(xvalues, fixed_y, **unc), 'r-', label='analytic expression');
plt.xlabel('x');
plt.ylabel('p(x|y=' + str(fixed_y) + ')');
plt.legend();
Now condition on $x=$ fixed_x instead.
# ugrid_p_y_given_x = ...
# verify that it's normalized
# print(...)
TBC()
plt.rcParams['figure.figsize'] = (7.0, 5.0)
plt.plot(yvalues, ugrid_p_y_given_x, 'bo', label='grid calculation');
plt.plot(yvalues, unc_p_y_given_x(yvalues, fixed_x, **unc), 'r-', label='analytic expression');
plt.xlabel('y');
plt.ylabel('p(y|x=' + str(fixed_x) + ')');
plt.legend();
Now that we've gotten the hang of some of these manipulations, we'll add a bit of complexity. For the second half of the notebook, we'll go through the same exercises as above, but we've removed our assumption of the independence of $x$ and $y$.
The new parameter below, $r$, is the correlation coefficient of $x$ and $y$ (cf. the expression for the bivariate normal density on Wikipedia).
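For reference, the joint density encoded in the function below is the standard bivariate normal density (transcribed here; check it against the Wikipedia page linked above):

$$ p(x,y) = \frac{1}{2\pi\sigma_x\sigma_y\sqrt{1-r^2}} \exp\left\{ -\frac{1}{2(1-r^2)} \left[ \left(\frac{x-\mu_x}{\sigma_x}\right)^2 + \left(\frac{y-\mu_y}{\sigma_y}\right)^2 - 2r\,\frac{(x-\mu_x)(y-\mu_y)}{\sigma_x\sigma_y} \right] \right\} $$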
cor = {'mx':1.0, 'my':2.3, 'sx':1.0, 'sy':0.5, 'r':-0.5} # parameter values
def cor_p_xy(x, y, mx, my, sx, sy, r):
    '''returns pdf of 2D correlated gaussian distribution evaluated at (x,y)'''
    return np.exp(-0.5/(1.0-r**2)*( ((x-mx)/sx)**2 + ((y-my)/sy)**2
                                    - 2.0*r*(x-mx)/sx*(y-my)/sy )) / (2*np.pi*sx*sy*np.sqrt(1.0-r**2))
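A quick consistency check (a sketch, not required for the assignment): with $r=0$ this density should reduce to the uncorrelated one from earlier in the notebook. Both functions are repeated here so the snippet stands alone:

```python
import numpy as np

def unc_p_xy(x, y, mx, my, sx, sy):
    '''pdf of 2D uncorrelated gaussian'''
    return np.exp(-0.5*( ((x-mx)/sx)**2 + ((y-my)/sy)**2 )) / (2*np.pi*sx*sy)

def cor_p_xy(x, y, mx, my, sx, sy, r):
    '''pdf of 2D correlated gaussian'''
    return np.exp(-0.5/(1.0-r**2)*( ((x-mx)/sx)**2 + ((y-my)/sy)**2
                                    - 2.0*r*(x-mx)/sx*(y-my)/sy )) / (2*np.pi*sx*sy*np.sqrt(1.0-r**2))

pars = {'mx':1.0, 'my':2.3, 'sx':1.0, 'sy':0.5}

# with r=0 the cross term and the sqrt(1-r^2) factor both drop out
print(np.isclose(cor_p_xy(0.3, 2.0, r=0.0, **pars), unc_p_xy(0.3, 2.0, **pars)))  # True
```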
As before, work out the analytic solutions first, including the marginal distributions $p(x)$ and $p(y)$ and the conditional distributions $p(x|y)$ and $p(y|x)$.
TBC()
Then fill in the functions below.
# marginal distributions
def cor_p_x(x, mx, my, sx, sy, r):
    '''returns p(x) for correlated 2D Gaussian distribution'''
    TBC()

def cor_p_y(y, mx, my, sx, sy, r):
    '''returns p(y) for correlated 2D Gaussian distribution'''
    TBC()

# conditional distributions
def cor_p_x_given_y(x, y, mx, my, sx, sy, r):
    '''returns p(x|y) for correlated 2D Gaussian distribution'''
    TBC()

def cor_p_y_given_x(y, x, mx, my, sx, sy, r):
    '''returns p(y|x) for correlated 2D Gaussian distribution'''
    TBC()

TBC_above()
We'll use the same grid definition as in 1b.
cgrid_p_xy = cor_p_xy(grid_x, grid_y, **cor)
Visualize the correlated pdf:
plt.rcParams['figure.figsize'] = (7.0, 5.0)
plt.imshow(cgrid_p_xy.T, origin='lower', extent=[xmin, xmax, ymin, ymax]);
plt.xlabel('x');
plt.ylabel('y');
# cgrid_p_x = ...
# print(...)
TBC()
Here we'll compare the marginal $p(x)$ of the correlated and uncorrelated distributions $p(x,y)$. Do the similarities or differences make sense?
plt.rcParams['figure.figsize'] = (14.0, 5.0)
fig, ax = plt.subplots(1,2);
ax[0].plot(xvalues, cgrid_p_x, 'bo');
ax[0].plot(xvalues, cor_p_x(xvalues, **cor), 'r-');
ax[0].set_xlabel('x');
ax[0].set_ylabel('p(x)');
ax[0].set_title('correlated p(x,y)');
ax[1].plot(xvalues, ugrid_p_x, 'bo');
ax[1].plot(xvalues, unc_p_x(xvalues, **unc), 'r-');
ax[1].set_xlabel('x');
ax[1].set_ylabel('p(x)');
ax[1].set_title('uncorrelated p(x,y)');
Marginalize over $x$ (remember to check the normalization)
# cgrid_p_y = ...
# print(...)
TBC()
plt.rcParams['figure.figsize'] = (14.0, 5.0)
fig, ax = plt.subplots(1,2);
ax[0].plot(yvalues, cgrid_p_y, 'bo');
ax[0].plot(yvalues, cor_p_y(yvalues, **cor), 'r-');
ax[0].set_xlabel('y');
ax[0].set_ylabel('p(y)');
ax[0].set_title('correlated p(x,y)');
ax[1].plot(yvalues, ugrid_p_y, 'bo');
ax[1].plot(yvalues, unc_p_y(yvalues, **unc), 'r-');
ax[1].set_xlabel('y');
ax[1].set_ylabel('p(y)');
ax[1].set_title('uncorrelated p(x,y)');
# cgrid_p_x_given_y = ...
# print(...)
TBC()
Once again we'll compare this calculation with what we got for the uncorrelated case. Do the similarities or differences make sense?
plt.rcParams['figure.figsize'] = (14.0, 5.0)
fig, ax = plt.subplots(1,2);
ax[0].plot(xvalues, cgrid_p_x_given_y, 'bo');
ax[0].plot(xvalues, cor_p_x_given_y(xvalues, fixed_y, **cor), 'r-');
ax[0].set_xlabel('x');
ax[0].set_ylabel('p(x|y=' + str(fixed_y) + ')');
ax[0].set_title('correlated p(x,y)');
ax[1].plot(xvalues, ugrid_p_x_given_y, 'bo');
ax[1].plot(xvalues, unc_p_x_given_y(xvalues, fixed_y, **unc), 'r-');
ax[1].set_xlabel('x');
ax[1].set_ylabel('p(x|y=' + str(fixed_y) + ')');
ax[1].set_title('uncorrelated p(x,y)');
Condition on $x=$ fixed_x:
# cgrid_p_y_given_x = ...
# print(...)
TBC()
plt.rcParams['figure.figsize'] = (14.0, 5.0)
fig, ax = plt.subplots(1,2);
ax[0].plot(yvalues, cgrid_p_y_given_x, 'bo');
ax[0].plot(yvalues, cor_p_y_given_x(yvalues, fixed_x, **cor), 'r-');
ax[0].set_xlabel('y');
ax[0].set_ylabel('p(y|x=' + str(fixed_x) + ')');
ax[0].set_title('correlated p(x,y)');
ax[1].plot(yvalues, ugrid_p_y_given_x, 'bo');
ax[1].plot(yvalues, unc_p_y_given_x(yvalues, fixed_x, **unc), 'r-');
ax[1].set_xlabel('y');
ax[1].set_ylabel('p(y|x=' + str(fixed_x) + ')');
ax[1].set_title('uncorrelated p(x,y)');
You reached the end! We'll be making frequent use of these basic probability manipulations, not to mention many of the python operations above, as we go on.