Tutorial: Approximate Methods
In this notebook, you'll practice using the approximate methods covered in the notes. To make it as straightforward as possible, we'll start with the contrived problem of fitting a line to data under conditions where Ordinary Least Squares (OLS) provides an exact solution to compare to. Then we'll move on to the contrived problem of fitting a line and scatter, where suddenly that simple exact solution no longer works.
You will
- implement the simplest possible version of Approximate Bayes,
- see how it works (or doesn't) for different choices of summary statistics and distance metrics,
- perform the Laplace Approximation for comparison,
- perform a frequentist bootstrap with the same model and data
from os import getcwd
from os.path import exists as file_exists
from yaml import safe_load
import numpy as np
from scipy.optimize import minimize
import scipy.stats as st
import statsmodels.api as sm
import matplotlib.pyplot as plt
%matplotlib inline
import incredible as cr
import lrgs
thisTutorial = 'approximate_methods'
if getcwd() == '/content':
# assume we are in Colab, and the user's data directory is linked to their drive/Physics267_data
from google.colab import drive
drive.mount('/content/drive')
datapath = '/content/drive/MyDrive/Physics267_data/' + thisTutorial + '/'
else:
# assume we are running locally somewhere and have the data under ./data/
datapath = 'data/'
Case: ordinary least squares
The classic OLS problem corresponds to the following scenario and assumptions:
- We have data in the form of a list of $(x,y)$ pairs.
- The $x$ values are fixed (we assume no uncertainty in their generation).
- Each $y$ value is independently generated from a linear model: $y_i = a + b x_i + \varepsilon_i$, where $\varepsilon_i$ follows the standard normal distribution (zero mean and unit variance).
- Priors on $a$ and $b$ are both uniform over the real line.
You've probably already done it in a previous exercise, but draw the PGM and write down the generative model for this setup.
Space for your PGM and expressions
As usual, read in your very own data set to work with, stored below as 1D x
and y
arrays.
table = np.loadtxt(datapath+'data.txt')
x = table[:,0]
y = table[:,1]
They look like this:
plt.rcParams['figure.figsize'] = (4.0, 3.0)
plt.plot(x, y, '.');
plt.xlabel("x"); plt.ylabel("y");
As you might know, the strong assumptions behind OLS mean that the posterior can be computed algebraically. This is convenient, as we can easily compute the exact posterior and compare our approximate results to it. The calculation is not especially hard to implement manually, but we will nevertheless let the statsmodels
package do them for us.
model = sm.OLS(y, sm.add_constant(x))
ols = model.fit()
The posterior, $p(a,b|x,y)$, is a 2D Gaussian with mean
ols.params
array([-2.75994154, 0.69626281])
and covariance matrix
ols.normalized_cov_params
array([[ 0.11651851, -0.01751249],
       [-0.01751249,  0.0038586 ]])
np.sqrt(ols.normalized_cov_params.diagonal())
array([0.34134808, 0.06211765])
Below we codify this by storing frozen st.norm
objects representing the 1D marginalized posteriors, and ellipses delineating the 2D credible regions, for ease of comparison later.
param_names = ['a', 'b']
true_post = {'1D':{'a':st.norm(ols.params[0], np.sqrt(ols.normalized_cov_params[0,0])),
'b':st.norm(ols.params[1], np.sqrt(ols.normalized_cov_params[1,1]))},
'2D':{'68.3':cr.cov_ellipse(ols.normalized_cov_params, center=ols.params, level=0.68268949),
'95.4':cr.cov_ellipse(ols.normalized_cov_params, center=ols.params, level=0.95449974)}
}
Laplace Approximation
In this excruciatingly simple example, the true posterior is Gaussian, and so the Laplace Approximation should give us the exact posterior! Let's see.
Recall that to implement the LA, you will need to
- find the maximum of the posterior, and
- estimate the matrix of second derivatives of the log-posterior at that point.
For OLS, statsmodels
effectively did this for us algebraically. Since that isn't an option in general, below you will use scipy.optimize.minimize
to accomplish the same thing. First, we will need a function returning $-\ln p(a,b|x,y)$; minimizing it accomplishes the first step above.
def minus_lnp(params, x, y):
# return -ln(posterior) given params, a 1D np.array [a,b]
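If you get stuck, here is one possible implementation (a sketch): with the improper uniform priors assumed above and unit-variance Gaussian errors, the negative log-posterior is just the negative Gaussian log-likelihood, up to an additive constant that doesn't affect the fit.
def minus_lnp(params, x, y):
    a, b = params
    # unit-variance Gaussian errors; the uniform priors contribute only a constant
    return -np.sum(st.norm.logpdf(y, loc=a + b*x, scale=1.0))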
We also need a guess at the parameter values, for the minimizer to use as a starting point. You could choose something by inspection of the plot above. Or, being confident that the fitter will manage this problem well enough, we could just start at $(0,0)$, which is not a million miles away.
guess = [0.0, 0.0]
Now we turn things over to scipy
. If you're not familiar, there are a handful of algorithms that minimize
can use. We'd like one that internally estimates and uses the second derivatives of the function being minimized, since it means we can just get those derivatives about the minimum from the fitter instead of estimating them ourselves. The default algorithm does this, though note that this is not true of all the options, and the specific method for accessing the derivatives varies (see the documentation for minimize
for details).
LA = minimize(minus_lnp, guess, args=(x,y))
LA
  message: Optimization terminated successfully.
  success: True
   status: 0
      fun: 43.40431004851482
        x: [-2.760e+00  6.963e-01]
      nit: 3
      jac: [ 0.000e+00  4.768e-07]
 hess_inv: [[ 1.165e-01 -1.751e-02]
            [-1.751e-02  3.859e-03]]
     nfev: 15
     njev: 5
The posterior mode is stored in LA.x
, and should be extremely close to the algebraic solution.
assert np.allclose(LA.x, ols.params)
The inverse-Hessian, which is the posterior covariance matrix of the parameters, is helpfully provided in LA.hess_inv
, and shown above. It, too, should be extremely close to the OLS calculation.
assert np.allclose(LA.hess_inv, ols.normalized_cov_params)
Let's go ahead and visualize the usual 2D credible regions.
plt.rcParams['figure.figsize'] = (4.0, 3.0)
plt.plot(true_post['2D']['68.3'][0], true_post['2D']['68.3'][1], '-', color='b', label='OLS');
plt.plot(true_post['2D']['95.4'][0], true_post['2D']['95.4'][1], '-', color='b');
cr.cov_ellipse(LA.hess_inv, center=LA.x, level=0.68268949, plot=plt, fmt='--', color='r', label="LA");
cr.cov_ellipse(LA.hess_inv, center=LA.x, level=0.95449974, plot=plt, fmt='--', color='r');
plt.xlabel("a"); plt.ylabel("b");
plt.legend();
Approximate Bayesian Computation
Next, we turn to ABC. Below, you'll implement the simplest version of this algorithm:
- Choose a set of summary statistics that encode important features of the data.
- Choose a distance function providing a metric for comparing summary statistics computed from different data, and a distance threshold.
- For many iterations,
- sample a set of parameters from the prior;
- simulate a mock data set from those parameters using the generative model;
- compute the summary statistics from those mock data;
- if the distance between that summary and the summary statistics computed on the real data is smaller than the threshold, accept the parameter sample.
Needless to say, this is not the most efficient version of ABC, but it will serve. However, there is an immediate, practical issue, namely that we chose infinite, uniform priors above in order to make the problem equivalent to OLS. Clearly we can't sample from the full interval $(-\infty,\infty)$. In any case, the credible regions above are tiny compared with the range of finite numbers that we can, in principle, draw from. So a naive implementation can be expected to take an exceptionally long time to produce even a single acceptable sample. (This is a good argument for choosing sensible priors, if you needed another one.)
We will inelegantly work around this issue by remembering that, for parameter estimation, we only really need to consider the prior over the region of parameter space where the posterior will be non-tiny. Seeing how we have an approximate posterior from LA, let's use it to sneakily redefine the functional bounds of the priors for this exercise. Truncating $p(a)$ and $p(b)$ at the 0.0001 and 0.9999 quantiles of their respective marginalized posteriors seems to work well in this case.
As we've done before, store the priors for $a$ and $b$ as frozen scipy.stats
distributions in a dictionary.
# priors = {'a':..., 'b':...}
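For example, one way to build such truncated priors (a sketch, using the LA marginal posteriors from above and uniform distributions between the quoted quantiles):
priors = {}
for i, p in enumerate(param_names):
    marg = st.norm(LA.x[i], np.sqrt(LA.hess_inv[i, i]))  # LA marginal for this parameter
    lo, hi = marg.ppf([0.0001, 0.9999])                  # truncation limits
    priors[p] = st.uniform(loc=lo, scale=hi - lo)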
To make it simpler to try out different summary statistics or distance metrics, we'll use classes and inheritance to package up reusable code. The cell below has just one method for you to complete, namely the one that performs the loop in the pseudocode above. Do not include an accept/reject step here (that is, accept all samples); instead, record the distance for each sample. That way, we can easily look at how the choice of distance threshold affects our results later. (A completed sketch of the loop appears just after the class definition, if you want to check your version against it.)
Also, try to make your code general enough that we can reuse it with another generative model and data set later on; that is, don't reference variables at global scope if they're stored in the ABC
object already by its constructor.
class ABC:
def __init__(self, x, ytrue, priors):
self.x = x
self.y = ytrue
self.s_true = self.summaries(x, ytrue)
self.priors = priors
self.param_names = [p for p in priors.keys()]
# derived classes must define the following
def summaries(self, x, y):
# return summary statistics as a 1D np.array
raise Exception('ABC::summaries should be defined by a deriving class')
def distance(self, s1, s2):
# return scalar distance between 2 sets of summary statistics
raise Exception('ABC::distance should be defined by a deriving class')
def simulate(self):
# return a simulated 1D array y, given self.x and additional parameter arguments (with default values)
raise Exception('ABC::simulate should be defined by a deriving class')
# the important part
def run(self, Nsim):
self.samples = np.full((Nsim, len(self.param_names)), np.nan)
self.distances = np.full(Nsim, np.nan)
for i in range(Nsim):
params = {p:self.priors[p].rvs() for p in self.param_names}
ysim = self.simulate(**params)
# compute summaries and distance from self.s_true
# store params in the ith row of self.samples
# store distance in the ith entry of self.distances
# useful visualizations
def distance_hist(self):
plt.rcParams['figure.figsize'] = (4.0, 3.0)
plt.hist(self.distances);
plt.xlabel("d");
def select_distances(self, eps):
self.selection = np.flatnonzero(self.distances < eps)
self.samples2 = self.samples[self.selection,:]
print('Acceptance rate:', self.samples2.shape[0]/self.samples.shape[0], '(', self.samples2.shape[0], 'accepted samples )')
def plot_acceptances(self, truth=None, truth_tri=None, size=8.0, show_rejects=True):
plt.rcParams['figure.figsize'] = (size, size)
n = len(self.param_names)
fig = plt.figure()
axes = []
for i,p in enumerate(self.param_names):
axes.append([])
ax = fig.add_subplot(n, n, (i*n)+i+1)
ax0 = ax
ax.hist(self.samples2[:,i], density=True, label='ABC');
if truth is not None:
aa = np.linspace(*self.priors[p].ppf([0.0001,0.9999]), 100)
ax.plot(aa, truth['1D'][p].pdf(aa), label='truth');
if i==n-1:
ax.set_xlabel(p);
else:
ax.get_xaxis().set_ticklabels([])
ax.get_yaxis().set_ticklabels([])
for j,q in enumerate(self.param_names):
if j == i:
break
ax = fig.add_subplot(n, n, (i*n)+j+1)
axes[-1].append(ax)
if show_rejects:
ax.plot(self.samples[:,j], self.samples[:,i], ',', color='C2');
ax.plot(self.samples2[:,j], self.samples2[:,i], '.');
if truth is not None:
for k in truth['2D'].keys():
ax.plot(truth['2D'][k][0], truth['2D'][k][1], color='C1', label='truth');
if i==n-1:
ax.set_xlabel(q);
else:
ax.get_xaxis().set_ticklabels([])
if j==0:
ax.set_ylabel(p);
else:
ax.get_yaxis().set_ticklabels([])
axes[-1].append(ax0)
if truth_tri is not None:
cr.whist_triangle_plot(truth_tri, axes=axes, linecolor1D='C1', linecolor2D='C1', fill2D=False);
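For reference, here is a sketch of how the missing steps in run
could be completed (one possibility; the name _abc_run is a hypothetical stand-in so it doesn't clobber your own version):
def _abc_run(self, Nsim):
    # mirrors ABC.run above, with the loop body filled in
    self.samples = np.full((Nsim, len(self.param_names)), np.nan)
    self.distances = np.full(Nsim, np.nan)
    for i in range(Nsim):
        params = {p:self.priors[p].rvs() for p in self.param_names}
        ysim = self.simulate(**params)
        s_sim = self.summaries(self.x, ysim)                        # summaries of the mock data
        self.samples[i,:] = [params[p] for p in self.param_names]   # record the prior draw
        self.distances[i] = self.distance(s_sim, self.s_true)       # distance to the real-data summaries
# optionally, patch it in with: ABC.run = _abc_run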
Arbitrary summary statistics
Next, we need to choose summary statistics and a distance function. Given that this problem has an algebraic solution, it's very tempting to use that solution to inform both of these choices, and we will do so below. First, however, pretend that we didn't have an exact solution to this problem to consult. In class, we will jointly decide on summary statistics and a distance function to use in this part. (The public solutions use Euclidean distance throughout this notebook.)
# Any notes about these decisions can go here
We can define a derived class of ABC
that implements these choices by specifying just the 3 functions that were left out above:
# class ABC_ours(ABC):
# def summaries(self, x, y):
# # return summary statistics as a 1D np.array
# def distance(self, s1, s2):
# # return scalar distance between 2 sets of summary statistics
# def simulate(self, a=0.0, b=0.0):
# # return a simulated 1D array y, given self.x and additional parameters arguments (with default values)
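If you want something concrete to compare against, here is one illustrative (and deliberately simple, not necessarily good) choice, just to show the structure: the mean of y and the x-y correlation coefficient as summaries, with Euclidean distance. Your class may well settle on something different.
class ABC_ours(ABC):
    def summaries(self, x, y):
        # two simple summaries: the mean of y and the x-y correlation coefficient
        return np.array([np.mean(y), np.corrcoef(x, y)[0, 1]])
    def distance(self, s1, s2):
        # Euclidean distance between summary vectors
        return np.sqrt(np.sum((s1 - s2)**2))
    def simulate(self, a=0.0, b=0.0):
        # linear model with unit Gaussian scatter, evaluated at self.x
        return a + b*self.x + st.norm.rvs(size=len(self.x))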
abc = ABC_ours(x, y, priors)
Check that it doesn't crash when trying to run:
abc.run(1)
print(abc.samples)
print(abc.distances)
[[-2.7244331 0.50411893]] [0.66515504]
If so, let's produce a good number of samples and associated distances (this takes <10s on my aging laptop):
%time abc.run(20000)
CPU times: user 7.41 s, sys: 40.4 ms, total: 7.45 s Wall time: 7.52 s
You might be wondering why we haven't said anything about the distance threshold for accepting samples yet. The reason is, simply, that the absolute magnitude of the threshold that makes sense depends on both the choice of summary statistics (and their dimensionality) and the choice of distance function. For most sensible distance definitions, zero is the ideal value, but it makes sense to first take a look at the distribution of distances corresponding to our simulated data sets so far (using this handy provided function!).
abc.distance_hist();
The cells below visualize how the accepted samples change as we reduce the threshold from the median of the distribution above to the first percentile. Each one shows a "triangle" plot comparing the exact posterior (orange) to the distribution of accepted samples (blue). The rejected samples are shown in green in the off-diagonal panel, just to verify that they fill the space uniformly.
eps = np.quantile(abc.distances, 0.5)
print("eps =", eps)
abc.select_distances(eps)
abc.plot_acceptances(truth=true_post, size=4.0)
eps = 0.6959394234143433 Acceptance rate: 0.5 ( 10000 accepted samples )
eps = np.quantile(abc.distances, 0.1)
print("eps =", eps)
abc.select_distances(eps)
abc.plot_acceptances(truth=true_post, size=4.0)
eps = 0.14008944453157685 Acceptance rate: 0.1 ( 2000 accepted samples )
eps = np.quantile(abc.distances, 0.01)
print("eps =", eps)
abc.select_distances(eps)
abc.plot_acceptances(truth=true_post, size=4.0)
eps = 0.038449764295854 Acceptance rate: 0.01 ( 200 accepted samples )
Depending on the choices of summary statistic (especially) and distance function, you may or may not see the ABC samples converging to the truth as the threshold is reduced. Comment on the outcome, and how it might motivate different choices.
Space to respond
I_have_recorded_my_thoughts = False # change to True when it is true
assert I_have_recorded_my_thoughts
Optimal summary statistics
Depending on what summaries we decided to use above, the previous section's ABC may have worked extremely poorly. If so, this hopefully impresses on you the importance of thinking these decisions through. If not, have a look at the web version of this solved notebook to see how a deliberately poor choice works out.
Either way, we will now run an ABC using the optimal summary statistics for this particular problem, which are the OLS estimators of $a$ and $b$ (surprise!). We will not change the distance function initially.
In code, we can derive a new class from ABC_ours
(which has appropriate distance
and simulate
methods already), and overload (i.e. replace) only the summaries
method.
# class ABC_OLS(ABC_ours):
# def summaries(self, x, y):
# # return summary statistics, the OLS estimators of a and b, as a 1D np.array
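A minimal sketch of this class (assuming the same statsmodels call used at the top of the notebook):
class ABC_OLS(ABC_ours):
    def summaries(self, x, y):
        # OLS estimators of the intercept and slope
        return sm.OLS(y, sm.add_constant(x)).fit().params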
abc1 = ABC_OLS(x, y, priors)
As a quick check, this object should give us back the OLS estimators we got at the beginning of the notebook if we run summaries
on the real data.
assert all(ols.params == abc1.summaries(x,y))
Let's run and see how these results converge as the threshold is reduced.
%time abc1.run(20000)
CPU times: user 11.7 s, sys: 44.4 ms, total: 11.7 s Wall time: 11.8 s
abc1.distance_hist();
eps = np.quantile(abc1.distances, 0.5)
print("eps =", eps)
abc1.select_distances(eps)
abc1.plot_acceptances(truth=true_post, size=4.0)
eps = 0.6545126265864643 Acceptance rate: 0.5 ( 10000 accepted samples )
eps = np.quantile(abc1.distances, 0.1)
print("eps =", eps)
abc1.select_distances(eps)
abc1.plot_acceptances(truth=true_post, size=4.0)
eps = 0.19439434899714933 Acceptance rate: 0.1 ( 2000 accepted samples )
eps = np.quantile(abc1.distances, 0.05)
print("eps =", eps)
abc1.select_distances(eps)
abc1.plot_acceptances(truth=true_post, size=4.0)
eps = 0.1347688101494705 Acceptance rate: 0.05 ( 1000 accepted samples )
eps = np.quantile(abc1.distances, 0.01)
print("eps =", eps)
abc1.select_distances(eps)
abc1.plot_acceptances(truth=true_post, size=4.0)
eps = 0.05867312084143261 Acceptance rate: 0.01 ( 200 accepted samples )
Unless we've chosen a particularly strange distance function, you should see the ABC samples converging to the truth, but not equally quickly in both parameters. We can do better than this! If we have a guess of the width of the posterior in each parameter, it would make sense to incorporate those scales into the distance function. That is, we could redefine the distance such that
$d(\Delta \hat{a}, \Delta \hat{b}) \rightarrow d\left(\frac{\Delta\hat{a}}{\sigma_a}, \frac{\Delta\hat{b}}{\sigma_b}\right)$.
Here $\hat{a}$ and $\hat{b}$ are our summary statistics, and $\sigma_a$ and $\sigma_b$ are estimates of the width of the posterior in each parameter (the marginalized standard deviations of our posterior estimate). Even better would be to use the 2D covariance estimate, but this simpler modification will suffice (not to mention, we're already using a lot of information we might not have in general).
Put this modification into code by deriving a new class inheriting from ABC_OLS
and overriding the distance
method.
# class ABC_OLS2(ABC_OLS):
# def distance(self, s1, s2):
# # return scalar distance between 2 sets of summary statistics
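One way to implement the rescaled distance (a sketch, taking the $\sigma_a$ and $\sigma_b$ estimates from the OLS covariance computed earlier):
class ABC_OLS2(ABC_OLS):
    def distance(self, s1, s2):
        # scale each summary difference by its estimated posterior standard deviation
        sigmas = np.sqrt(ols.normalized_cov_params.diagonal())
        return np.sqrt(np.sum(((s1 - s2) / sigmas)**2))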
abc2 = ABC_OLS2(x, y, priors)
Quick check for crashes:
abc2.run(1)
Again, let's produce a bunch of samples and see how the convergence looks as the distance threshold is reduced.
%time abc2.run(20000)
CPU times: user 11.5 s, sys: 45.5 ms, total: 11.5 s Wall time: 11.5 s
abc2.distance_hist();
eps = np.quantile(abc2.distances, 0.5)
print("eps =", eps)
abc2.select_distances(eps)
abc2.plot_acceptances(truth=true_post, size=4.0)
eps = 3.057937865615461 Acceptance rate: 0.5 ( 10000 accepted samples )
eps = np.quantile(abc2.distances, 0.1)
print("eps =", eps)
abc2.select_distances(eps)
abc2.plot_acceptances(truth=true_post, size=4.0)
eps = 1.3243872565570287 Acceptance rate: 0.1 ( 2000 accepted samples )
eps = np.quantile(abc2.distances, 0.05)
print("eps =", eps)
abc2.select_distances(eps)
abc2.plot_acceptances(truth=true_post, size=4.0)
eps = 0.9501546177624834 Acceptance rate: 0.05 ( 1000 accepted samples )
eps = np.quantile(abc2.distances, 0.01)
print("eps =", eps)
abc2.select_distances(eps)
abc2.plot_acceptances(truth=true_post, size=4.0)
eps = 0.4210760671844682 Acceptance rate: 0.01 ( 200 accepted samples )
You should now see a progression that plausibly looks like it's smoothly approaching the true posterior.
Yes_I_totally_see_that = False # change to True when true
assert Yes_I_totally_see_that
Case: linear model with unknown scatter
Now that you have some experience with the nuts and bolts of LA and ABC, we'll apply them to a situation that's only slightly more complex, but doesn't have a pretty exact solution. Namely,
- We have data in the form of a list of $(x,y)$ pairs.
- The $x$ values are fixed (we assume no uncertainty in their generation).
- Each $y$ value is independently generated from a linear model: $y_i = a + b x_i + \varepsilon_i$, where $\varepsilon_i$ follows a normal distribution with zero mean and unknown variance, $\sigma^2$, that we will fit for.
- Priors on $a$ and $b$ are both uniform over the real line; the prior on $\sigma^2$ is uniform over non-negative values.
Comparing with above, the key difference here is that the scatter of $y$ about the linear model is a free parameter that we will fit for, in addition to the slope and intercept.
param_names2 = param_names + ['s2']
As always, draw and write down the generative model.
Space for the generative model
To keep things from being too boring, we will read in a second data set for which $\sigma^2 \neq 1$.
table2 = np.loadtxt(datapath+'data2.txt')
x2 = table2[:,0]
y2 = table2[:,1]
plt.rcParams['figure.figsize'] = (4.0, 3.0)
plt.plot(x2, y2, '.');
plt.xlabel("x"); plt.ylabel("y");
While there isn't a simple exact solution for this scenario, it would still be nice to compare to a solution we're confident in. Fortunately, this model, for data like those we're using, is easily handled with conjugate Gibbs sampling. So we'll do that quickly before moving on.
We are extremely confident that LRGS
can handle this problem without oversight, but since your data are randomly generated there is no 100% guarantee. If things look weird below and you want to look closer, the commented cell below will show the traces. Without further commentary,
par = lrgs.Parameters(np.matrix([x2]).T, np.matrix([y2]).T, M_inv=[np.asmatrix(np.zeros(2)) for i in range(len(x2))], Sigma_prior=(-2., np.matrix(np.zeros((1,1)))))
chain = lrgs.Chain(par, 15000)
%time chain.run(fix='y') # <10s on an old laptop
CPU times: user 9.26 s, sys: 80 ms, total: 9.34 s Wall time: 9.47 s
chdict = chain.to_dict(['B','Sigma'])
charr = np.array([chdict[p] for p in ['B_0_0','B_1_0','Sigma_0_0']]).T
#plt.rcParams['figure.figsize'] = (12.0, 2.0*len(param_names2))
#fig, ax = plt.subplots(len(param_names2), 1);
#cr.plot_traces(charr, ax, labels=param_names2);
charr = charr[10:,:]
tri = cr.whist_triangle(charr, bins=50, smooth2D=1);
cr.whist_triangle_plot(tri, paramNames=param_names2);
Laplace Approximation
Now that we hopefully have a reliable posterior from MCMC to compare to, let's try the LA for this problem. As before, write a function to return minus the log-posterior:
def minus_lnp2(params, x, y):
# return -ln(posterior) given params, a 1D np.array [a,b,s2]
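One possible implementation (a sketch, assuming the uniform priors above; the guard against non-positive s2 keeps the optimizer from evaluating an undefined likelihood):
def minus_lnp2(params, x, y):
    a, b, s2 = params
    if s2 <= 0.0:
        return np.inf  # outside the prior support
    return -np.sum(st.norm.logpdf(y, loc=a + b*x, scale=np.sqrt(s2)))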
Again, a very crude guess should work for us.
guess2 = [0.0, 0.0, 1.0]
Find the posterior maximum! Note that we need to use the bounds
argument so that minimize
knows that the s2
parameter may not be negative. This causes it to internally choose a different algorithm than it would have used by default otherwise, with the upshot that we need to do something slightly different to access the inverse-Hessian (see below).
LA2 = minimize(minus_lnp2, guess2, bounds=[(None,None), (None,None), (0.0,None)], args=(x2, y2))
LA2
  message: CONVERGENCE: NORM_OF_PROJECTED_GRADIENT_<=_PGTOL
  success: True
   status: 0
      fun: 59.8988630297158
        x: [-2.718e+00  5.945e-01  2.791e+00]
      nit: 15
      jac: [ 7.105e-07  0.000e+00 -7.105e-07]
     nfev: 72
     njev: 18
 hess_inv: <3x3 LbfgsInvHessProduct with dtype=float64>
LA2_mean = LA2.x
LA2_cov = LA2.hess_inv.todense()
print("mean:", LA2_mean)
print("cov:", LA2_cov)
mean: [-2.71795238  0.59450388  2.7914622 ]
cov: [[ 0.19321949 -0.0404238  -0.05339119]
 [-0.0404238   0.02055936  0.05755932]
 [-0.05339119  0.05755932  0.80633199]]
The cell below will compare the LA (red/dashed curves) with our MCMC posterior (blue/solid curves):
fig,ax = cr.whist_triangle_plot(tri, paramNames=param_names2, linecolor1D='b', linecolor2D='b', fill2D=False);
for i,p in enumerate(param_names2):
aa = np.linspace(LA2_mean[i]-4*np.sqrt(LA2_cov[i,i]), LA2_mean[i]+4*np.sqrt(LA2_cov[i,i]), 100)
ax[i][i].plot(aa, st.norm.pdf(aa, LA2_mean[i], np.sqrt(LA2_cov[i,i])), '--', color='r');
ax[i][i].set_xlim(min(ax[i][i].get_xlim()[0], LA2_mean[i]-4*np.sqrt(LA2_cov[i,i])), max(ax[i][i].get_xlim()[1], LA2_mean[i]+4*np.sqrt(LA2_cov[i,i])))
ax[i][i].set_ylim(0.0, max(ax[i][i].get_ylim()[1], st.norm.pdf(aa, LA2_mean[i], np.sqrt(LA2_cov[i,i])).max()*1.1))
for j,q in enumerate(param_names2):
if i==j:
break
cr.cov_ellipse(LA2_cov[np.ix_([j,i],[j,i])], center=LA2_mean[[j,i]], level=0.68268949, plot=ax[i][j], fmt='--', color='r')
cr.cov_ellipse(LA2_cov[np.ix_([j,i],[j,i])], center=LA2_mean[[j,i]], level=0.95449974, plot=ax[i][j], fmt='--', color='r')
ax[i][j].set_xlim(min(ax[i][j].get_xlim()[0], LA2_mean[j]-4*np.sqrt(LA2_cov[j,j])), max(ax[i][j].get_xlim()[1], LA2_mean[j]+4*np.sqrt(LA2_cov[j,j])))
ax[i][j].set_ylim(min(ax[i][j].get_ylim()[0], LA2_mean[i]-4*np.sqrt(LA2_cov[i,i])), max(ax[i][j].get_ylim()[1], LA2_mean[i]+4*np.sqrt(LA2_cov[i,i])))
For our data, the LA gets close to the posterior mode, but its estimate of the covariance leaves something to be desired. Note that, for this setup, we have found something of a phase change when the data set gets small enough that the scatter is tough to distinguish from zero: the LA covariance in that case suddenly becomes much larger. For bigger data sets than the one here, the approximation, including the covariance, gets better. We've deliberately aimed in the middle for this demonstration, which is to say that you might see any of this behaviour in your own randomly generated data set. (It's also possible that some of this is due to the specific way the Hessian is estimated within minimize
, and a more careful estimate of the second derivatives would do better; we haven't investigated.)
Approximate Bayes
As before, let's functionally redefine the range of our priors based on what you see above. In real life, you can imagine doing this based on the LA in the first place, and iterating if you find that the resulting approximate posterior doesn't become tiny before hitting the edge of the prior. We won't mind if you cheat a little and use the MCMC result to motivate the refined priors in this case, but keep in mind that they should include at least the entire volume of parameter space where the chain has samples.
# priors2 = {'a':..., 'b':..., 's2':...}
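For example (a sketch of one possible choice): uniform priors spanning the range of the MCMC samples, padded by half that range on each side, with the scatter variance kept non-negative.
priors2 = {}
for i, p in enumerate(param_names2):
    lo, hi = charr[:, i].min(), charr[:, i].max()
    pad = 0.5 * (hi - lo)
    lo, hi = lo - pad, hi + pad
    if p == 's2':
        lo = max(lo, 0.0)  # the scatter variance cannot be negative
    priors2[p] = st.uniform(loc=lo, scale=hi - lo)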
What summary statistics and distance function would you use for this problem? Note: in class we will reach a consensus for what to implement below.
# class ABC_scat(ABC):
# def summaries(self, x, y):
# # return summary statistics as a 1D np.array
# def distance(self, s1, s2):
# # return scalar distance between 2 sets of summary statistics
# def simulate(self, a=0.0, b=0.0, s2=1.0):
# # return a simulated 1D array y, given self.x and additional parameters arguments (with default values)
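Again, here is one illustrative choice to compare against (a sketch, not necessarily the class consensus): the OLS intercept and slope plus the residual variance as summaries, with each summary difference scaled by a rough width taken from the LA covariance above before computing the Euclidean distance.
class ABC_scat(ABC):
    def summaries(self, x, y):
        fit = sm.OLS(y, sm.add_constant(x)).fit()
        # intercept, slope, and residual variance
        return np.append(fit.params, np.var(fit.resid))
    def distance(self, s1, s2):
        # scale by rough parameter widths from the Laplace Approximation above
        scales = np.sqrt(LA2_cov.diagonal())
        return np.sqrt(np.sum(((s1 - s2) / scales)**2))
    def simulate(self, a=0.0, b=0.0, s2=1.0):
        # linear model with Gaussian scatter of variance s2
        return a + b*self.x + st.norm.rvs(scale=np.sqrt(s2), size=len(self.x))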
abc3 = ABC_scat(x2, y2, priors2)
As always, we next check for obvious code bugs:
abc3.run(1)
print(abc3.samples)
print(abc3.distances)
[[-2.94627433 0.86675959 12.19002481]] [9.7587713]
Given the additional free parameter, we expect to need to run for longer to get a useful number of accepted samples.
%time abc3.run(20000)
CPU times: user 15.1 s, sys: 95.3 ms, total: 15.2 s Wall time: 15.5 s
Let's see what that gave us:
abc3.distance_hist();
eps = np.quantile(abc3.distances, 0.5)
print("eps =", eps)
abc3.select_distances(eps)
abc3.plot_acceptances(truth_tri=tri, size=6.0, show_rejects=False)
eps = 5.974735324540064 Acceptance rate: 0.5 ( 10000 accepted samples )
eps = np.quantile(abc3.distances, 0.1)
print("eps =", eps)
abc3.select_distances(eps)
abc3.plot_acceptances(truth_tri=tri, size=6.0, show_rejects=False)
eps = 2.8341680811343344 Acceptance rate: 0.1 ( 2000 accepted samples )
eps = np.quantile(abc3.distances, 0.05)
print("eps =", eps)
abc3.select_distances(eps)
abc3.plot_acceptances(truth_tri=tri, size=6.0, show_rejects=False)
eps = 2.183490628701815 Acceptance rate: 0.05 ( 1000 accepted samples )
eps = np.quantile(abc3.distances, 0.01)
print("eps =", eps)
abc3.select_distances(eps)
abc3.plot_acceptances(truth_tri=tri, size=6.0, show_rejects=False)
eps = 1.2939580058803228 Acceptance rate: 0.01 ( 200 accepted samples )
Hopefully you can see indications that ABC is working, although chances are you would also need to run longer and decrease the acceptance threshold even more before the comparison to the MCMC results really starts to look good. We stress that there are more intelligent, adaptive implementations of ABC than our simplistic version, which one would turn to in practice.
Yes_this_all_checks_out = False # change to True when true
assert Yes_this_all_checks_out
Bootstrap
We conclude this notebook with a quick implementation of the bootstrap. Recall that this is a frequentist method for "robustly" estimating uncertainties in estimates when the sampling distribution is not well known enough to do maximum likelihood (for example). The procedure is
- randomly sample from the data with replacement,
- compute the estimator(s) from the sampled data,
- repeat many times, and look at the distribution of estimates.
Let's go ahead and do this using the summary statistics from the above exercise (with free scatter) as our estimators. In this context, to be clear, resampling the data means resampling the pairs $(x,y)$, not sampling $x$s and $y$s independently.
Below, complete a function that resamples the given data and returns it in a tuple. (This hardly seems worth making an exercise, which says something about the simplicity of implementing the bootstrap.)
def bootstrap(x, y):
# i = list of indices into x and y encoding the resampling; see np.random.choice
return x[i],y[i]
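In case it's useful, a minimal sketch of the completed function:
def bootstrap(x, y):
    # draw len(x) indices uniformly, with replacement
    i = np.random.choice(len(x), size=len(x), replace=True)
    return x[i], y[i]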
Let's run it...
%%time
boot = np.full((20000,3), np.nan)
for i in range(boot.shape[0]):
xb,yb = bootstrap(x2, y2)
boot[i,:] = abc3.summaries(xb, yb)
CPU times: user 9.47 s, sys: 56.3 ms, total: 9.53 s Wall time: 9.77 s
... and compare to the MCMC posterior for this problem. Below, the bootstrap distribution is red/dashed curves, and the MCMC posterior is blue/solid.
boot_tri = cr.whist_triangle(boot, bins=50, smooth2D=1);
fig,ax = cr.whist_triangle_plot(boot_tri, paramNames=param_names2, linecolor1D='r', linecolor2D='r', linestyle1D='--', linestyle2D='--', fill2D=False);
cr.whist_triangle_plot(tri, linecolor1D='b', linecolor2D='b', fill2D=False, axes=ax);
With our data, the bootstrap was a little too optimistic for $a$ and $b$, but not bad, while producing a much tighter distribution for $\sigma^2$. In principle, it should do better for larger data sets, where more information is available from resampling, but we haven't explicitly checked (exercise for the reader!). On the other hand, for our particular data set, the bootstrap actually looks to be doing a slightly better job than the Laplace Approximation for the intercept and slope parameters.
Parting thoughts
We hope you have gained an appreciation for and understanding of some of the approximate methods covered in the notes. Possibly, you're now more motivated to avoid using them whenever possible. Still, while a little ingenuity can go a long way in making MCMC and related methods more tractable, it's nice to know that there are approximate methods that still live in the realm of principled inference.