Tutorial: Working with Samples

In practice, we almost always work with samples from probability distributions rather than analytic expressions or evaluations on a grid. Here we'll see how to do all the fun probability manipulations you previously did (analytically and with grids) in the Essential Probability tutorial, this time with Monte Carlo samples.

Specifically, you will learn to:

  1. generate samples from a joint distribution by sampling a marginal and then a conditional distribution;
  2. estimate marginal and conditional distributions from samples;
  3. use importance weighting to fold in an additional PDF without generating new samples.

Warning: This notebook comes a little out of order. We will be doing things that are covered conceptually in the Monte Carlo Sampling notes, so you may want to jump ahead and read their short Motivation section. Or you could just take our word for a lot of things. This isn't ideal, but we think it's important to get you working with samples relatively early, even if the reasons why aren't fully apparent until later.

1. Produce some samples

Recalling our Essential Probability tutorial, let's jump right into the case of 2 correlated Gaussian variables.

First we need some samples to work with. In this bivariate Gaussian case, scipy has a function that could generate samples for us, but instead let's test your understanding of what we've already covered.

First, let's specify the parameters of the distribution, as before:

Now, make an $N\times2$ table with each row being an $(x,y)$ pair, and $N$ being some large number of samples. Instead of using some fancy function to directly obtain samples of $(x,y)$, do this:

  1. Fill the first column of the table ($x$) with samples from the marginal distribution, $p(x)$.
  2. Fill the second column ($y$) with samples from the conditional distribution, $p(y|x)$.

You should have expressions for these two distributions already from the previous notebook.
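For concreteness, here is one possible sketch, assuming the parameters above are stored as mu_x, mu_y, sigma_x, sigma_y and rho (hypothetical names; adapt them to whatever you actually defined). For a bivariate Gaussian, $p(x)$ is Gaussian with mean $\mu_x$ and standard deviation $\sigma_x$, and $p(y|x)$ is Gaussian with mean $\mu_y + \rho\,(\sigma_y/\sigma_x)(x-\mu_x)$ and standard deviation $\sigma_y\sqrt{1-\rho^2}$.

```python
import numpy as np

# Assumes mu_x, mu_y, sigma_x, sigma_y, rho were defined in the parameter
# cell above (hypothetical names - substitute your own).
N = 100000
rng = np.random.default_rng()
samples = np.empty((N, 2))

# 1. x ~ p(x): Gaussian with mean mu_x and standard deviation sigma_x
samples[:, 0] = rng.normal(mu_x, sigma_x, size=N)

# 2. y|x ~ p(y|x): Gaussian with mean mu_y + rho*(sigma_y/sigma_x)*(x - mu_x)
#    and standard deviation sigma_y*sqrt(1 - rho^2)
cond_mean = mu_y + rho * (sigma_y / sigma_x) * (samples[:, 0] - mu_x)
cond_std = sigma_y * np.sqrt(1.0 - rho**2)
samples[:, 1] = rng.normal(cond_mean, cond_std)
```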

Let's have a look. Qualitatively compare the plot below with the heatmap of $p(x,y)$ you made in the previous tutorial, for the case of correlated variables.
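A plain scatter plot of the samples (reusing the names from the sketch above) is enough for this eyeball comparison; the density of points plays the role of the heatmap.

```python
import matplotlib.pyplot as plt

# Scatter plot of the joint samples; denser regions correspond to higher p(x,y)
plt.figure(figsize=(5, 4))
plt.plot(samples[:, 0], samples[:, 1], '.', markersize=1, alpha=0.2)
plt.xlabel('x')
plt.ylabel('y');
```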

2. Marginalization

Next, we'll look at estimates of the 1D marginal distributions from our samples. First, copy your implementations of the analytic solutions for these distributions from the previous notebook, so we have a known answer to compare to.

If you read ahead to the Monte Carlo Sampling notes, you've seen that the way we estimate a PDF from samples is by making a histogram (which simply records the density of the samples). Furthermore, the way we marginalize over a variable is incredibly simple - we just ignore it. So, estimating the marginal distribution of $x$ (or $y$) is as simple as making a histogram of the first (or second) column of samples.

To get a normalized histogram, we use the density=True option below - this simply divides the number of samples in each histogram bin by the bin width and the total number of samples. Notice that we don't have one of the sanity checks here that we did previously, namely the ability to numerically check that our expression for the marginal PDF was normalized. (We can, however, plot it over our normalized histogram to check that it looks ok.)

Below we plot the density of samples generated above, using hist, and compare with your analytic solution from the previous notebook.
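A sketch of what that comparison might look like, reusing the assumed names above and the fact that the marginals of a bivariate Gaussian are themselves Gaussian with the corresponding means and standard deviations:

```python
import scipy.stats as st

fig, ax = plt.subplots(1, 2, figsize=(10, 4))

# Marginal of x: histogram the first column, ignoring y entirely
ax[0].hist(samples[:, 0], bins=50, density=True, label='samples')
xgrid = np.linspace(samples[:, 0].min(), samples[:, 0].max(), 200)
ax[0].plot(xgrid, st.norm.pdf(xgrid, mu_x, sigma_x), label='analytic $p(x)$')
ax[0].set_xlabel('x')
ax[0].legend()

# Marginal of y: the same trick with the second column
ax[1].hist(samples[:, 1], bins=50, density=True, label='samples')
ygrid = np.linspace(samples[:, 1].min(), samples[:, 1].max(), 200)
ax[1].plot(ygrid, st.norm.pdf(ygrid, mu_y, sigma_y), label='analytic $p(y)$')
ax[1].set_xlabel('y')
ax[1].legend()
```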

3. Conditioning

Again, pull in your analytic solutions from the previous notebook.

Conditioning is a little less straightforward than marginalization. In principle, if we want to condition on $x=x_0$, we would want to make a histogram of $y$ values for samples that have $x=x_0$. But we'd have to be incredibly lucky for any of our samples of $p(x,y)$ to satisfy $x=x_0$ exactly!

One natural (and necessarily approximate) solution is to work with samples that are close to $x=x_0$, within some window. To that end, store in j_fixed_x a list of row indices into samples for which $|y-y_0|<\epsilon$, where $y_0$ is fixed_y, above, and $\epsilon$ is a threshold of your choice; the $x$ values of those rows, samples[j_fixed_x,0], then approximately sample $p(x|y=y_0)$. Do the equivalent for $x$ and fixed_x also, as sketched below.
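One possible implementation, using np.where (eps is arbitrary, and the name j_fixed_y for the second index list is just our guess):

```python
eps = 0.1  # window half-width; a choice to experiment with

# Rows whose y lies within eps of fixed_y; samples[j_fixed_x, 0] then
# approximately samples p(x|y=fixed_y)
j_fixed_x = np.where(np.abs(samples[:, 1] - fixed_y) < eps)[0]

# The equivalent selection for conditioning on x=fixed_x; samples[j_fixed_y, 1]
# then approximately samples p(y|x=fixed_x). (Variable name is our guess.)
j_fixed_y = np.where(np.abs(samples[:, 0] - fixed_x) < eps)[0]
```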

Now let's see how histograms of the samples you selected compare with the analytic solution in each case. Feel free to fiddle with the value of $\epsilon$ (and also the bins option to hist, below). How does it look?
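For example, for the $x|y$ case (the conditional of a bivariate Gaussian is again Gaussian, with the mean and width written out below; names follow the sketches above):

```python
# Analytic conditional p(x|y=fixed_y) for a bivariate Gaussian
cmean = mu_x + rho * (sigma_x / sigma_y) * (fixed_y - mu_y)
cstd = sigma_x * np.sqrt(1.0 - rho**2)

plt.hist(samples[j_fixed_x, 0], bins=20, density=True, label='selected samples')
xg = np.linspace(cmean - 4.0*cstd, cmean + 4.0*cstd, 200)
plt.plot(xg, st.norm.pdf(xg, cmean, cstd), label='analytic $p(x|y)$')
plt.xlabel('x')
plt.legend();
```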

One obvious issue with this approach is that we end up with potentially many fewer samples in our estimate of the conditional distribution than we started with, so these conditional histograms will not look as smooth as the marginal ones above. However, in this case, there are more than enough samples that the agreement with the analytic curve should be clear. Checkpoint: if the agreement is not clear, go back and check your work.

Let's see what fraction of the samples are actually used in the conditional histograms:
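Something like this, using the index lists from the sketch above:

```python
# Fraction of all samples that fall within the conditioning windows
print('fraction used for p(x|y):', len(j_fixed_x) / samples.shape[0])
print('fraction used for p(y|x):', len(j_fixed_y) / samples.shape[0])
```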

There's not much one can do about this "waste" of samples, other than to take the time to generate samples directly from the conditional distribution, if we care that much.

However, we might get slightly better (or smoother) results by changing the nature of the window used to select samples. For example, instead of completely throwing away samples that are farther than $\epsilon$ from a value we want to condition on, we could use all the samples, weighted in such a way that the samples far from $x_0$ or $y_0$ contribute much less than those that are nearby. To that end, compute Gaussian weights for each sample based on their distance from $y_0$ (or $x_0$), with a standard deviation that you again get to pick.
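One way to compute such weights with scipy.stats (smooth_std and the weight-array names are our choices):

```python
smooth_std = 0.1  # width of the weighting kernel; another knob to turn

# Weight for each sample when conditioning on y=fixed_y ...
w_fixed_x = st.norm.pdf(samples[:, 1], fixed_y, smooth_std)
# ... and when conditioning on x=fixed_x
w_fixed_y = st.norm.pdf(samples[:, 0], fixed_x, smooth_std)
```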

Again, fiddle with the standard deviation and/or display binning to see what you can do. (Note the use of the weights option.)
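For instance, for the $x|y$ case again, reusing the analytic curve from the earlier sketch:

```python
# All samples contribute, but those far from fixed_y carry tiny weights
plt.hist(samples[:, 0], bins=50, density=True, weights=w_fixed_x,
         label='weighted samples')
plt.plot(xg, st.norm.pdf(xg, cmean, cstd), label='analytic $p(x|y)$')
plt.xlabel('x')
plt.legend();
```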

Chances are that neither of these options looks great, so if we really cared about having the conditional PDF mapped well we would either want more samples, or we would need to sample from the conditional PDF directly instead of dealing with the conditioning this way.

On the other hand, if we just wanted to estimate something simple about the conditional PDF, say its mean, this might be good enough. Using the Gaussian-weighting method, the estimated mean of $x|y=3.8$ is:
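One way to compute this estimate (the exact number you get will depend on your samples and on the smoothing width):

```python
# Weighted mean of x, with weights concentrating on samples near y=fixed_y
np.average(samples[:, 0], weights=w_fixed_x)
```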

... compared with the exact mean of $-0.5$.

4. Importance weighting

Let's go a little farther and think more generally about the marginal distribution of $y$ from the product of $p(x,y)$ and some other PDF, $q(x)$. Imagine that we have samples of $p(x,y)$ that were expensive to get, while $q(x)$ is straightforward to evaluate for any $x$. Then, instead of investing a lot of time in generating new samples from $p(x,y)\,q(x)$, we might want to do something like the weighting procedure above, which is called importance weighting.

We can think of conditioning as importance weighting with a PDF that says that $x$ must be really close to $x_0$, for example. But now, let's consider a different case. To keep it simple, let's say that $q(x) = \mathrm{Normal}(x|4,1)$. The weights for each sample are:
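That is, something along these lines, where w_q is just our name for the weight array:

```python
# q(x) = Normal(x|4,1) evaluated at each sample's x value
w_q = st.norm.pdf(samples[:, 0], 4.0, 1.0)
```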

Looking at the marginal distributions below, you can see how the marginal distribution of $x$ is, naturally, pulled to larger $x$, but also the PDF of $y$ is pulled to lower $y$ due to the negative correlation of $p(x,y)$.

The plots above also include analytic versions of the weighted distributions. We won't derive them here, but you can work it out with a little patience (see the Gaussians and Least Squares notebook). If you do, note that we've thrown away a constant, since we want to compare to the weighted histogram of samples, which is normalized when plotted above, whereas e.g. $\int dy \, p(x,y)\,q(x)$ is not automatically normalized the way that $\int dy \, p(x,y)$ is.

It looks like the weighting of the samples worked just about perfectly, to the extent that we can tell by eye. This is because the original set of $p(x,y)$ samples has good coverage of the region where the product $p(x,y) \, q(x)$ is large (i.e. there are a lot of samples there, thanks to producing a much larger number of samples initially). If we changed things so that the $q(x)$ pulled us farther into the tails of $p(x,y)$, the PDF estimate would get noisier, and eventually there would be no samples in the relevant region left to re-weight! On the other hand, if $q(x)$ had been skinnier, or if its mean had been closer to the mean of $p(x)$, we would still see the weighted samples matching the analytic solution well.

With this in mind, contrive a $q_2(x)$ such that the procedure above fails... badly.
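One possible choice (ours, not the only one) is a narrow $q_2$ centered far out in the tail of $p(x)$, where the samples run out:

```python
# A q2(x) sitting ~10 sigma out in the tail of p(x): almost no samples carry
# appreciable weight, so the re-weighted histogram becomes extremely noisy
w_q2 = st.norm.pdf(samples[:, 0], mu_x + 10.0*sigma_x, 0.5*sigma_x)
plt.hist(samples[:, 1], bins=50, density=True, weights=w_q2)
plt.xlabel('y');
```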

The lesson: Importance weighting should only be used if the samples you have are sufficient to cover the region where the resulting PDF is significantly non-zero!