Tutorial: Bayes' Law

In this problem, we'll work through a simple application of Bayes' Law, both analytically and numerically (on a grid).

You will learn to:

  * write down Bayes' Law for an inference with binomial data;
  * find and use a conjugate prior, and verify the conjugacy relation;
  * evaluate the posterior analytically and by brute force on a grid;
  * summarize the posterior with a median and percentile-based interval;
  * update the posterior with additional data; and
  * check the goodness of fit with the posterior predictive distribution.

Background

We'll re-examine the first example in the Generative Models tutorial. We're interested in knowing what fraction, $f$, of galaxy clusters in the Universe are morphologically relaxed (hence relatively close to equilibrium). We can think of $f$ equivalently as the a priori probability that a randomly chosen, or newly discovered, cluster is relaxed.

From X-ray imaging of 361 clusters, which we will assume are representative, 57 were found to be morphologically relaxed according to our metric. We will use this information to constrain $f$. Our data could be laboriously written as

$X_1,X_2,\ldots,X_{361}$,

where 57 $X$'s are 1 (relaxed) and 304 are 0 (unrelaxed). Equivalently we can just speak of $s=57$ "successes" out of $n=361$ trials. Let's go ahead and put that into code:
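A minimal version of that cell might look like this (the variable names s and n are assumptions, chosen to match the math above):

```python
# Data: 57 morphologically relaxed clusters out of 361 imaged
s = 57   # number of successes (relaxed clusters)
n = 361  # number of trials (clusters examined)
```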

Thus, we write Bayes' Law for this application as

$p(f|s) = \frac{p(f)P(s|f)}{P(s)}$.

First, as always, we choose a prior. Clearly, by definition, $0\leq f \leq 1$. Without thinking too hard about it, let's take $p(f)$ to be uniform over this interval.

As the problem is defined, the sampling distribution, $P(s|f)$, is binomial:

$P(s|f) = {n \choose s} f^s (1-f)^{n-s}$.

Solution and implementation

It's always nice to have a simple, analytic way of expressing our solution, and this problem happens to provide one. Consult Wikipedia to see whether this sampling distribution has a conjugate prior, and determine whether that conjugate distribution can be used to express the uniform prior chosen above. (Note: it does, and it can.) Find the parameters of the conjugate prior that reproduce the uniform distribution on [0,1].

The conjugate form of the prior is $f \sim \ldots$

This is equivalent to $f \sim \mathrm{Uniform}(0,1)$ for prior hyperparameters ...

Before continuing on, prove the conjugacy relation that you looked up above. Multiply $p(f)$ and $P(s|f)$, and simplify until you obtain a normalized posterior distribution expressed in a standard form. Note that you are allowed to multiply by any constants you want; by definition, whatever constant you need to multiply by to produce a normalized PDF must be $1/P(s)$.

$p(f) \, P(s|f) = \ldots$ what you claimed above
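For checking your work afterwards: with a Beta prior, $p(f) = \mathrm{Beta}(f|\alpha,\beta) \propto f^{\alpha-1}(1-f)^{\beta-1}$ (the standard conjugate choice for a binomial likelihood), keeping only the factors that depend on $f$ gives

$p(f) \, P(s|f) \propto f^{\alpha+s-1} (1-f)^{\beta+n-s-1} \propto \mathrm{Beta}(f|\alpha+s, \beta+n-s)$,

and whatever constant normalizes this Beta density must, by the argument above, be $1/P(s)$. Setting $\alpha=\beta=1$ recovers the uniform prior on [0,1].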

Prior

Fill in the cells below to provide the function that evaluates the prior (you can call the scipy.stats implementation of the distribution, or spell out the density) and define prior hyperparameter values that make the prior uniform.
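One possible fill-in, sketched under the assumption that the Beta family was your answer above; the names prior_pdf and prior_params are hypothetical:

```python
import scipy.stats as st

def prior_pdf(f, alpha, beta):
    """Evaluate the conjugate (Beta) prior density at f."""
    return st.beta.pdf(f, alpha, beta)

# hyperparameter values that make Beta(alpha, beta) uniform on [0, 1]
prior_params = {'alpha': 1.0, 'beta': 1.0}
```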

Excellent! Let's now plot the prior with your chosen parameters, to verify that it's the same as a uniform distribution.

Likelihood

Next, code up the likelihood function. Recall that this is just the sampling distribution evaluated as a function of the model parameters, with the data fixed.
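A sketch of such a function, with the hypothetical name likelihood and the data from above baked in as defaults:

```python
import scipy.stats as st

def likelihood(f, s=57, n=361):
    """Binomial sampling distribution P(s|f), evaluated as a function of f."""
    return st.binom.pmf(s, n, f)
```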

Again, let's take a look.

Hold on! You didn't (necessarily) make a mistake. Remember that the likelihood function is not a PDF - it is not normalized over $f$ for a given $s$. So there is no reason the normalizations of the two curves above should be comparable.

In fact, run the cell below to numerically verify that $P(s|f)$ is not normalized over $f$.
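Such a check might look like the sketch below; the integral works out to exactly $1/(n+1) \approx 0.0028$, regardless of $s$ - nowhere near 1:

```python
import scipy.stats as st
from scipy.integrate import quad

s, n = 57, 361
integral, err = quad(lambda f: st.binom.pmf(s, n, f), 0.0, 1.0)
print(integral)  # ~0.00276 = 1/(n+1), i.e. not normalized over f
```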

On the other hand, in its guise as the sampling distribution, it is normalized over $s$ for a given $f$. Verify this for the arbitrary choice of $f$ below, or some other value(s) of your choice.
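A sketch of this check, summing the PMF over $s = 0, 1, \ldots, n$:

```python
import numpy as np
import scipy.stats as st

f_test = 0.2  # arbitrary choice; try others
n = 361
print(st.binom.pmf(np.arange(n + 1), n, f_test).sum())  # should print 1.0
```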

Just for fun, here is what $P(s|f)$ looks like as a function of $s$ (i.e. as a sampling distribution) for a few different $f$'s.

Posterior

Moving on, code up the posterior distribution. Since its functional form is the same as that of the prior, we can go ahead and use the same Python function. Then all we need is a function that determines the posterior distribution's parameters given the prior and data.
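A sketch of that function, using the Beta-binomial update derived above (the name get_post_params matches its use later in this tutorial; the dict interface is an assumption):

```python
def get_post_params(prior_params, s, n):
    """Beta parameters of the posterior, given Beta prior hyperparameters
    and binomial data (s successes in n trials)."""
    return {'alpha': prior_params['alpha'] + s,
            'beta': prior_params['beta'] + n - s}

post_params = get_post_params({'alpha': 1.0, 'beta': 1.0}, 57, 361)
# -> {'alpha': 58.0, 'beta': 305.0}
```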

See what this looks like:

Comparison with brute force

Just to drive the point home, let's imagine we didn't recognize this problem as conjugate. Evaluate the posterior over fgrid by brute force (i.e. by multiplying the likelihood and prior), and we'll compare it with the conjugate solution. Don't forget to normalize.
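One way this might look, as a sketch (the grid resolution and the simple Riemann-sum normalization are arbitrary choices):

```python
import numpy as np
import scipy.stats as st

fgrid = np.linspace(0.0, 1.0, 1000)
post_grid = st.beta.pdf(fgrid, 1.0, 1.0) * st.binom.pmf(57, 361, fgrid)  # prior * likelihood
post_grid /= post_grid.sum() * (fgrid[1] - fgrid[0])  # normalize to unit integral
```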

Plot it along with the conjugate solution:

You might be thinking that all this messing around with conjugacy relations is silly, and in this simple case, which takes very little time to evaluate numerically, that's fair enough. While conjugacy doesn't apply to every problem, there are a few reasons it's worth knowing about for those times that it is a viable strategy:

  1. Since the posterior has a well-known functional form, we instantly know its mean, median, mode, variance, skewness, kurtosis, etc., etc., etc. to arbitrary precision - things we might be interested in that would be more annoying to estimate numerically. They are simple functions of the distribution's parameters that we can look up.
  2. When dealing with multi-parameter distributions and/or large amounts of data, leaping straight to the final answer (after, at most, some linear algebra) can sometimes represent a significant speed-up over more brute-force methods.

Summarizing the constraint on $f$

While the posterior for $f$, evaluated in one of the ways above, is in principle the entire answer, we normally want to summarize the constraint in terms of a best value and an interval. You'll see more about this in the Credible Region notes and tutorial. For now, we'll go ahead and summarize the constraint according to one convention for doing so.

Write a function that finds the median, 15.85th percentile and 84.15th percentile of the posterior distribution for $f$. Do this based on the parameters of the conjugate posterior, which will let you take advantage of scipy functions (e.g. scipy.stats.<distribution>.median).
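A sketch, using scipy.stats.beta's median and ppf methods (the function name summarize is hypothetical):

```python
import scipy.stats as st

def summarize(post_params):
    """Median and ~68.3% central interval of a Beta(alpha, beta) posterior."""
    a, b = post_params['alpha'], post_params['beta']
    med = st.beta.median(a, b)
    lo, hi = st.beta.ppf([0.1585, 0.8415], a, b)
    return med, lo, hi

print(summarize({'alpha': 58.0, 'beta': 305.0}))  # roughly 0.16, +/- about 0.02
```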

Compare what you found with this pre-computed solution.

Updating with new data

Suppose we get more data:

Use your get_post_params function to compute the posterior parameters (a sketch follows the list) for

  1. the second data set combined with the original prior (not using the first data set), and
  2. the combination of both data sets and the original prior.
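A sketch of both calls, reusing the get_post_params sketch above; the values s2 and n2 are hypothetical placeholders, since the actual data2 is defined in the notebook:

```python
# hypothetical second data set (placeholders; use the actual data2 from above)
s2, n2 = 10, 60

prior_params = {'alpha': 1.0, 'beta': 1.0}

# 1. the second data set alone, starting from the original prior
post_params_2 = get_post_params(prior_params, s2, n2)

# 2. both data sets with the original prior: for binomial data sharing a single f,
#    combining data sets just means adding successes and adding trials
post_params_both = get_post_params(prior_params, 57 + s2, 361 + n2)
```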

Here's how the posteriors from the individual data sets compare with the prior:

This visualizes the accumulation of data as we add first one and then the second data set to the prior information:

Finally, compare the constraints:

Check the goodness of fit

Because we have absorbed the pointed lessons in the notes so well, we will finish by comparing posterior predictions of the fitted model with the data. That is, we want to make sure that the model, for the posterior distribution we've ended up with, could plausibly have produced the observed data. We'll use the posterior as updated by data2 above, i.e. parametrized by post_params_both. Because the binomial distribution is additive (for the same $f$ parameter), we can compare this with the combined data:

What we want to do in this case is predict the distribution of $s'$ marginalized over the posterior distribution of $f$, where $s'$ represents an equivalent measurement to $s$ (i.e. from the same total number $n$, but obviously not actually the same clusters). In other words, we should compute

$P(s'|s) = \int df \, p(f|s) \, P(s'|f)$

and see how plausible $s$ is compared with this PDF.

In conjugate problems, this posterior predictive distribution is often also a standard PDF that can be arrived at analytically (it's on the Wikipedia page above, if you want to add a comparison below), but let's instead go through a procedure that will work more generally. Namely, just like in the Bayes' Law notes, we will use the generative model as, well, a generative model, and produce a list of potential data $s'$ from an equally long list of values of $f$ drawn from the posterior distribution. Fill in the code below (you can use scipy.stats.<distribution>.rvs functions to generate random numbers from a PDF).
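A sketch of this procedure; the posterior parameters below follow from the hypothetical s2 and n2 used earlier, so substitute your actual post_params_both and combined $n$:

```python
import scipy.stats as st

# posterior parameters and total trial count for the combined data
# (these numbers assume the hypothetical s2=10, n2=60 from above)
alpha, beta = 68.0, 355.0
n_both = 361 + 60

# draw f's from the posterior, then one s' from the sampling distribution for each f
f_samples = st.beta.rvs(alpha, beta, size=100000)
s_prime = st.binom.rvs(n_both, f_samples)  # Monte Carlo samples of P(s'|s)
```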

Below we compare this distribution to the measured $s$:

It should look very consistent. Of course, this was an extremely simple model - is it even possible for us to get a "bad fit", where the distribution of $s'$ does not comfortably include $s$? The only circumstance I can think of where that would happen is if data and data2 had not come from the same model, that is, if they had somehow been generated by significantly different values of $f$. In that case we might see the distribution above being less consistent, or inconsistent, with the value of $s$ in data_both, and conclude that our model with a single $f$ doesn't adequately describe all the data. We would hopefully also be able to identify the issue when comparing the two individual posteriors above. We'll cover more quantitative ways to define "consistency" later on, but for now we have a simple, visual check of how acceptable the fit is.