TutorialName = 'toy_grid'
# Run tbc.py in this namespace so that TBC and TBC_above are defined.
# The context manager closes the file handle as soon as its contents are read.
with open('tbc.py') as tbc_source:
    exec(tbc_source.read()) # define TBC and TBC_above
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
import scipy.stats as st
from scipy.optimize import minimize
import incredible as cr


TBC() # answer in Markdown


# Parameter values used as the "truth" throughout: they are passed by keyword
# (x0, y0, mu0, sigma) to the prior, likelihood and mean-image functions below.
truth = {'x0':17.1, 'y0':12.75, 'mu0':50.0, 'sigma':3.0}


# Image size in pixels along x and y.
dim_x = 32
dim_y = 32


# Start from an empty image; note the (y, x) ordering of the array axes.
mock_image = np.zeros((dim_y, dim_x))

# Use the generative model to put some photons in mock_image.
# Each value in the array should equal the number of photons that land in that pixel.
# Remember that the indexing goes like mock_image[y_index, x_index], as above!
TBC()


# Display the image; origin='lower' puts array row 0 at the bottom of the plot.
plt.imshow(mock_image, origin='lower');


# Replace the mock image built above with the one stored on disk.
mock_image = np.loadtxt('data/toy_photometry.dat')


plt.imshow(mock_image, origin='lower');


class Image:
    """
    Bundle a 2D image array with matching arrays of pixel indices.

    im:  the array passed in (stored by reference, not copied)
    imx: array of the same shape as `im`; imx[y, x] == x
    imy: array of the same shape as `im`; imy[y, x] == y
    """
    def __init__(self, image):
        self.im = image
        # Axis 0 of the image is y (rows) and axis 1 is x (columns).
        column_indices = range(image.shape[1])
        row_indices = range(image.shape[0])
        x_grid, y_grid = np.meshgrid(column_indices, row_indices)
        self.imx = x_grid
        self.imy = y_grid

# Wrap the image together with its pixel-index grids.
data = Image(mock_image)


# Show the counts next to the x- and y-index arrays, one panel each.
plt.rcParams['figure.figsize'] = (12.0, 4.0)
fig, ax = plt.subplots(1,3)
panels = (('data.im', data.im), ('data.imx', data.imx), ('data.imy', data.imy))
for axes, (title, array) in zip(ax, panels):
    axes.imshow(array, origin='lower')
    axes.set_title(title)


def log_prior(x0, y0, mu0, sigma):
    """
    Log-prior for the model parameters x0, y0, mu0 and sigma.

    The body is still a TBC placeholder. NOTE(review): log_posterior tests the
    return value with np.isfinite before adding the likelihood, so an
    implementation presumably returns -inf for disallowed parameter values --
    confirm when filling this in.
    """
    TBC()
    
TBC_above()


# Evaluate the prior at the true parameter values as a quick check.
log_prior(**truth)


def mean_img(x0, y0, mu0, sigma):
    '''
    Return an array with the expected mean counts in each pixel for these model parameters

    The body is still a TBC placeholder. NOTE(review): the function receives no
    image argument, so the pixel grid presumably comes from the module-level
    `data` (data.imx, data.imy) -- confirm when implementing.
    '''
    TBC()

def log_likelihood(data, **params):
    '''
    `data` is an Image object, as defined above
    `params` are the model parameters, forwarded by keyword to mean_img
    (x0, y0, mu0, sigma)

    The mean image `mu` is computed here; the remainder of the body is still a
    TBC placeholder.
    '''
    mu = mean_img(**params)
    TBC()
    
TBC_above()


# check that it works
log_likelihood(data, **truth)


# Display the mean image evaluated at the true parameter values.
plt.imshow(mean_img(**truth), origin='lower');


# Sum of the mean image over all pixels, at the true parameter values.
mean_img(**truth).sum()


def log_posterior(data, **params):
    """
    Return log_prior(**params) + log_likelihood(data, **params).

    When the log-prior is not finite it is returned as is, and the likelihood
    is not evaluated at all.
    """
    total = log_prior(**params)
    if not np.isfinite(total):
        return total
    total += log_likelihood(data, **params)
    return total


## check that it works
log_posterior(data, **truth)


# Parameter names in the order used wherever parameters are stored positionally
# (e.g. the array passed to mlnpost).
paramnames = ['x0', 'y0', 'mu0', 'sigma'] # the canonical parameter order, because I said so


def mlnpost(p, data):
    """
    p: a numpy array of parameter values in the order x0, y0, mu0, sigma
       (the same order as the `paramnames` list)
    data: handed to this function by `minimize` through its `args` argument;
       presumably the Image object to forward to log_posterior -- confirm
       when implementing
    Return value: minus the log-posterior

    The body is still a TBC placeholder.
    """
    TBC()
    
TBC_above()


# Starting guess for the optimizer, keyed by parameter name.
params = {'x0':16.0, 'y0':16.0, 'mu0':data.im.sum(), 'sigma':5.0}


TBC() # bounds = [..., ..., ..., (0.0001,None)] # sigma=0 precisely would yield division by zero


# Minimize minus the log-posterior, starting from `params` arranged in the
# canonical parameter order. `args` is the tuple of extra positional arguments
# passed on to mlnpost; the trailing comma matters, because `(data)` without it
# is just `data` rather than a 1-tuple.
bestfit = minimize(mlnpost, [params[k] for k in paramnames], args=(data,), bounds=bounds)
bestfit


TBC()

# Lower and upper grid limits for each parameter, to be filled in:
#x0_min = 
#x0_max = 
#y0_min = 
#y0_max = 
#mu0_min = 
#mu0_max = 
#sigma_min = 
#sigma_max =


# 100 evenly spaced grid values per parameter, spanning the limits above.
dim = 100
x0_values = np.linspace(x0_min, x0_max, dim)
y0_values = np.linspace(y0_min, y0_max, dim)
mu0_values = np.linspace(mu0_min, mu0_max, dim)
sigma_values = np.linspace(sigma_min, sigma_max, dim)


%%time
# Time 1000 evaluations of the log-posterior at the true parameter values.
for i in range(1000):
    log_posterior(data, **truth)


# Rebuild the parameter grids with only 10 values per parameter
# (this overrides the dim = 100 grids defined earlier).
dim = 10
x0_values = np.linspace(x0_min, x0_max, dim)
y0_values = np.linspace(y0_min, y0_max, dim)
mu0_values = np.linspace(mu0_min, mu0_max, dim)
sigma_values = np.linspace(sigma_min, sigma_max, dim)


%%time
lnpost_grid = np.empty((len(x0_values), len(y0_values), len(mu0_values), len(sigma_values)))
for i,x0 in enumerate(x0_values):
    for j,y0 in enumerate(y0_values):
        for k,mu0 in enumerate(mu0_values):
            for l,sigma in enumerate(sigma_values):
                lnpost_grid[i,j,k,l] = log_posterior(data, x0=x0, y0=y0, mu0=mu0, sigma=sigma)


# Exponentiate after subtracting the maximum, so that the largest value of
# post_grid is exp(0) = 1; the result is not normalized.
post_grid = np.exp(lnpost_grid - lnpost_grid.max())

TBC()
# One dictionary per parameter: 'x' holds the grid values and 'density' the
# corresponding 1D marginal posterior (to be filled in).
#marg1d = [{'x':x0_values, 'density': ... },
#          {'x':y0_values, 'density': ... },
#          {'x':mu0_values, 'density': ... },
#          {'x':sigma_values, 'density': ... }]


# One panel per parameter: cr.whist_ci draws each 1D marginal on its axes and
# its return values are collected in ci1d; the true value is overplotted.
plt.rcParams['figure.figsize'] = (20.0, 4.0)
fig, ax = plt.subplots(1,4)
ci1d = []
for marg, axes in zip(marg1d, ax):
    ci1d.append(cr.whist_ci(marg, plot=axes))
for name, axes in zip(paramnames, ax):
    axes.set_xlabel(name)
    axes.axvline(truth[name], color='C1', label='truth')
ax[0].legend();


#mu0_min = 
#mu0_max = 
#sigma_min = 
#sigma_max =


%%time
dim = 100
mu0_values = np.linspace(mu0_min, mu0_max, dim)
sigma_values = np.linspace(sigma_min, sigma_max, dim)
lnpost_grid = np.empty((len(mu0_values), len(sigma_values)))
for k,mu0 in enumerate(mu0_values):
    for l,sigma in enumerate(sigma_values):
        lnpost_grid[k,l] = log_posterior(data, x0=truth['x0'], y0=truth['y0'], mu0=mu0, sigma=sigma)
post_grid = np.exp(lnpost_grid - lnpost_grid.max())


TBC()
# One dictionary per gridded parameter: 'x' holds the grid values and 'density'
# the corresponding 1D marginal posterior (to be filled in).
#marg1d = [{'x':mu0_values, 'density': ... },
#          {'x':sigma_values, 'density': ... }]


# One panel each for mu0 and sigma (the last two entries of paramnames), with
# the true value overplotted.
plt.rcParams['figure.figsize'] = (12.0, 4.0)
fig, ax = plt.subplots(1,2)
ci1d = []
for marg, axes in zip(marg1d, ax):
    ci1d.append(cr.whist_ci(marg, plot=axes))
for name, axes in zip(paramnames[2:], ax):
    axes.set_xlabel(name)
    axes.axvline(truth[name], color='C1', label='truth')
ax[0].legend();


plt.rcParams['figure.figsize'] = (5.0, 5.0)
# post_grid is indexed [mu0, sigma] and is passed transposed as 'z'.
# NOTE(review): presumably whist2d_ci expects 'z' indexed [y, x] -- confirm
# against the `incredible` documentation.
cr2d = cr.whist2d_ci({'x':mu0_values, 'y':sigma_values, 'z':post_grid.T}, sigmas=np.array([1,2,3]));
plt.xlabel('mu0');
plt.ylabel('sigma');


# Display the 1D results returned by cr.whist_ci above.
ci1d


# Side by side: the data, and the mean image evaluated at the true x0, y0 and
# the (mu0, sigma) values stored in cr2d['mode'].
plt.rcParams['figure.figsize'] = (12.0, 4.0)
fig, ax = plt.subplots(1,2)
data_axes, model_axes = ax[0], ax[1]
data_axes.imshow(data.im, origin='lower')
data_axes.set_title('data')
mode_mu0, mode_sigma = cr2d['mode'][0], cr2d['mode'][1]
mode_image = mean_img(truth['x0'], truth['y0'], mode_mu0, mode_sigma)
model_axes.imshow(mode_image, origin='lower')
model_axes.set_title(r'$\mu(x,y)$ of posterior mode');


# Draw 10000 grid nodes with probability proportional to post_grid, then look
# up the (mu0, sigma) pair at each drawn node. indexing='ij' makes the
# coordinate arrays share post_grid's [mu0, sigma] layout.
grid_probs = post_grid.flatten() / post_grid.sum()
mu0_values2,sigma_values2 = np.meshgrid(mu0_values, sigma_values, indexing='ij')
j = np.random.choice(post_grid.size, size=10000, p=grid_probs)
mu0_ppd = mu0_values2.flatten()[j]
sigma_ppd = sigma_values2.flatten()[j]


TBC() # N_ppd = ...


plt.rcParams['figure.figsize'] = (5.0, 4.0)
# Histogram of N_ppd, with the total counts in the data image marked for comparison.
plt.hist(N_ppd, label='PPD');
plt.axvline(data.im.sum(), color='C1', label='data');
plt.legend();
plt.xlabel('N');


TBC() # dxy_ppd = ...


def find_offsets(image, x0, y0):
    """
    Offsets of the non-empty pixels of `image` from the point (x0, y0).

    image: an object with array attributes im, imx and imy (e.g. an Image)
    Return value: a tuple (offsets, weights). `offsets` holds the x offsets of
    all pixels with im > 0 followed by their y offsets; `weights` holds the
    values of those pixels, repeated once for each half of `offsets`.
    """
    # A boolean mask selects pixels in the same row-major order as flattening.
    occupied = image.im > 0
    counts = image.im[occupied]
    dx = image.imx[occupied] - x0
    dy = image.imy[occupied] - y0
    return (np.concatenate((dx, dy)), np.concatenate((counts, counts)))

# Offsets of the data's non-empty pixels from the true center, plus the counts
# in those pixels (used as histogram weights below).
dxy_data = find_offsets(data, truth['x0'], truth['y0'])


# Compare the normalized histogram of PPD offsets with the count-weighted
# histogram of offsets in the data.
plt.hist(dxy_ppd, density=True, label='PPD');
plt.hist(dxy_data[0], weights=dxy_data[1], density=True, histtype='step', lw=2, label='data');
plt.xlabel(r'$\Delta x$, $\Delta y$');
plt.legend();


from cashstatistic import cash_mod, cash_mod_expectations


# Sum of cash_mod over the image, comparing data.im with the mean image at the
# true x0, y0 and the (mu0, sigma) values stored in cr2d['mode'].
C = cash_mod(mean_img(truth['x0'], truth['y0'], cr2d['mode'][0], cr2d['mode'][1]), data.im).sum()


# NOTE(review): judging by the print below, cexp[0] and cexp[1] are presumably
# per-pixel means and variances of the statistic -- confirm in cashstatistic.
cexp = cash_mod_expectations( mean_img(truth['x0'], truth['y0'], cr2d['mode'][0], cr2d['mode'][1]) )


# C was already summed when it was computed, so C.sum() here should leave the
# value unchanged (assuming that sum produced a scalar).
print('Actual C:', C.sum())
print('Gaussian prediction for C (mean and stdev):', cexp[0].sum(), '+/-', np.sqrt(cexp[1].sum()))

Tutorial: Toy Photometry Model on a Grid

Problem definition

Generate data

Implementation

Evaluating the posterior

Finding credible regions

Curbing our ambition

Goodness of fit

Parting thoughts