Tutorial: Microlensing Lightcurve¶
In this notebook, we'll be looking at data from the Optical Gravitational Lensing Experiment (OGLE), which monitors stars in our galaxy in the hopes of detecting gravitational microlensing events that occur when a compact mass (e.g. a fainter star) passes in front of the monitored star. Data are available through the OGLE Early Warning System, which can be fun to browse through.
We will use this exercise as an excuse to work through calculation of the evidence using nested sampling, with the idea that we will use it for detection - that is, we will compare a model where there is a microlensing event with one where there is not. This is a little hacky, since the lightcurves available have already been selected to contain lensing events (using a different method), but we'll do it anyway. This is also a case where everyone will be using real rather than simulated data, with all of the interesting features that sometimes implies.
You will
- perform a standard MCMC fit of a microlensing model, as a baseline;
- use nested sampling to find constraints on the model parameters and compute the evidence;
- perform nested sampling on a lensing-free (i.e. constant) model, and compare the posterior probability of the two models.
from os import getcwd
from os.path import exists as file_exists
from yaml import safe_load
import numpy as np
from scipy.optimize import minimize
import scipy.stats as st
import matplotlib.pyplot as plt
%matplotlib inline
import dynesty
from dynesty import plotting as dyplot
import emcee
import incredible as cr
from pygtc import plotGTC
thisTutorial = 'microlensing'
if getcwd() == '/content':
# assume we are in Colab, and the user's data directory is linked to their drive/Physics267_data
from google.colab import drive
drive.mount('/content/drive')
datapath = '/content/drive/MyDrive/Physics267_data/' + thisTutorial + '/'
else:
# assume we are running locally somewhere and have the data under ./data/
datapath = 'data/'
Data¶
Let's first read in your data and take a look at it. The data are provided in the form of a simple table.
dat = np.loadtxt(datapath+'phot.dat.gz')
dat.shape
(4062, 5)
As described on the OGLE page, the columns of this text file are
Hel.JD, I magnitude, magnitude error, seeing estimation (in pixels - 0.26"/pixel), sky level
Heliocentric Julian Date. This is time, measured in days, since a fixed reference. The "heliocentric" part means that it has been corrected to the reference frame of the Sun, i.e. the few minutes of light travel time by which photon arrival times would shift at different points in the Earth's orbit have been subtracted off.
Measurements of magnitude in the $I$ band (a near infrared band). If you're not already familiar (lucky you): astronomical apparent magnitude, relative to a given reference source, is given by the relationship $m = m_\mathrm{ref} - 2.5\,\log_{10}\left(\frac{F}{F_\mathrm{ref}}\right)$, where $F$ is flux. So apparent magnitude is a logarithmic measure of flux, with the very annoying bonus feature that higher fluxes correspond to lower magnitudes. (A short numerical sanity check of this relation appears just after this list.)
Measurement uncertainty on the $I$ magnitude, defined in some unspecified way (digging through papers might elucidate this).
Some estimate of the seeing (the width of the PSF) during the observation. (Since these are ground-based observations, the PSF varies with time, depending on the weather.)
An estimate of the brightness of the sky (the primary background) in $I$ band during the observation.
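As promised above, here is a quick numerical sanity check of the magnitude convention (nothing below is needed later in the notebook, and the helper name flux_ratio is just for illustration). Inverting the definition gives $F/F_\mathrm{ref} = 10^{-0.4(m - m_\mathrm{ref})}$.
def flux_ratio(m, m_ref):
    # flux relative to the reference source, from the magnitude definition above
    return 10.0**(-0.4 * (m - m_ref))
print(flux_ratio(15.0, 16.0))  # a source 1 magnitude brighter has ~2.512 times the flux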
Let's extract the first 3 columns. We'll ignore the others, since the seeing and sky background have been accounted for already in the magnitude measurements, according to the OGLE site.
As you can see by inspection, or in any of the lightcurve figures on the OGLE website, HJD is a huge number. Let's follow their lead by subtracting a big constant from it, so that we're left with a number of order only thousands. We'll also organize the useful columns of the table into a dictionary for later convenience.
data = {'t':dat[:,0], # date
'I':dat[:,1], # I magnitude
'Ierr':dat[:,2], # I magnitude uncertainty
't0':2450000.} # reference time
data['t'] -= data['t0']
This should produce a plot similar to those shown on the webpage for each event. Note the inverted Y axis, such that higher means brighter (smaller $I$).
plt.rcParams['figure.figsize'] = (20.0, 4.0)
plt.errorbar(data['t'], data['I'], yerr=data['Ierr'], fmt='.');
plt.xlabel('HJD - '+str(data['t0']));
plt.ylabel('I magnitude');
plt.gca().invert_yaxis();
Details vary, but you should see a lightcurve with some gaps in it, and some indication of a transient increase (usually these show up near the end, for some reason). The points tend to be jumbled together, but it's probably clear that there's a bit of variation in the measurements, even when the lightcurve is essentially constant. You might also see one or a few points that are scattered very far away from all of their neighbors. That is, some points seem unlikely to be explicable by a smooth model with added noise, microlensing or not. If you're not sure you can see any of these in your data, consider the lightcurve below, which is used in the public solutions.
So, assuming there are such outliers, what are we going to do about them?
- The purist (and purest) approach would be to leave the data alone and adjust the model such that it can produce occasional outliers like those seen. That is, the sampling distribution would need to have heavy tails or be a mixture model of some kind, and we would learn something about how common and how extreme the outliers are. The downside is that we might spend a lot of time doing model comparison to come up with something that fits the data, and if we don't have many outliers then we probably won't learn very much about them. We'll have just gone to great effort to remove the influence of a few points that we could probably have identified and deleted by eye unambiguously enough.
- The opposite approach would correspond to saying something like: I know that this point (or these points) is obviously wrong, and I will just remove it. You can think of this as the previous strategy, but with a really strong prior that bypasses the modeling process. There are clear objections one could make to this, on the grounds that it is so ad hoc/subjective/not independently reproducible.
You can imagine other approaches, e.g. iteratively fitting and throwing away points that are "too far away" (as in sigma clipping), as living somewhere between these two extremes.
Because we will normally have plenty of data covering the time that the star being observed is essentially constant, I suggest that the practical option is to leave in any weird looking data points, even if we don't quite believe that our model sampling distribution is a perfect description... except for any that are really, egregiously, unambiguously, in no uncertain terms and without argument unrepresentative of the models we're fitting. Like the one at time ~6800 in the OGLE figure above.
Programmatically, one way to implement this is by creating a mask. This will be a boolean array of the same length as the data, with False meaning we should use a given point and True meaning it should be ignored (note that the true/false convention varies, but this is consistent with how we'll use the mask array below). Then we just need a logical expression that isolates the points we want to keep. For example, I used ~np.logical_and(data['t'] > 6700, data['I'] < 16.6) for 2014-BLG-0017, above. (The ~ is a logical NOT.) Define a mask below; if you don't want to remove any data, it's fine for the mask to be all False values.
# bad_data = ...
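If you don't see any egregious outliers in your lightcurve, a mask that keeps every point is perfectly fine. Here is a minimal placeholder along those lines; replace it with a logical expression tailored to your own data, along the lines of the np.logical_and example above, if needed.
bad_data = np.zeros(len(data['t']), dtype=bool)  # all False: no points masked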
Let's plot your data again, showing the points you decided to mask as big red diamonds:
plt.rcParams['figure.figsize'] = (20.0, 4.0)
plt.errorbar(data['t'][~bad_data], data['I'][~bad_data], yerr=data['Ierr'][~bad_data], fmt='.');
plt.errorbar(data['t'][bad_data], data['I'][bad_data], yerr=data['Ierr'][bad_data], fmt='rD');
plt.xlabel('HJD - '+str(data['t0']));
plt.ylabel('I magnitude');
plt.gca().invert_yaxis();
There are applications where we would want to keep the original data arrays as they are and use the mask to limit our likelihood calculations to the desired subset. Image analysis is one example, since we generally want the images to remain as 2D arrays, even if there are specific pixels we should ignore. However, in this case, it seems harmless to simply redefine the arrays in data to exclude the points we want to remove.
for k in ['I', 'Ierr', 't']:
data[k] = data[k][~bad_data]
# below is in principle a more elegant option, but it slowed down the notebook by a factor >2, so no
#data[k] = np.ma.masked_array(data=data[k], mask=bad_data)
Model¶
An excellent resource for gravitational lensing background (among other things) is Peter Schneider's Extragalactic Astronomy and Cosmology.$^1$ In the 2015 edition, the relevant section for Galactic microlensing is 2.5 (page 77), and the equations defining the microlensing model lightcurve are 2.92 and 2.93. You don't actually need to read all this, but it can be nice to get some intuition about what's underneath the data.
A source's flux as a function of time, as enhanced by a microlensing event, is given by
$F(t) = F_0 \frac{y(t)^2 + 2}{y(t)\sqrt{y(t)^2+4}}$,
where
$y(t) = \sqrt{p^2 + \left( \frac{t-t_\mathrm{max}}{t_\mathrm{E}} \right)^2}$.
The parameters can be broadly interpreted as follows:
- $F_0$ is the flux in the absence of microlensing;
- $p$ is the impact parameter (in projection) of the lens as it passes in front of the star, in units of its Einstein radius;
- $t_\mathrm{max}$ is the time of maximum magnification;
- $t_\mathrm{E}$ sets the width of the enhancement in the lightcurve.
In practice, you'll also need the transformation between flux and magnitude, given above. For convenience, let's parameterize the normalization of the model lightcurve in magnitudes rather than flux, transforming $F(t)$ to $I(t)$ using the conversion above (with $I$ rather than $m$). We'll have $I_0$ rather than $F_0$ as a normalization parameter; this way, all of the "ref" quantities in the magnitude definition are absorbed into this new parameter and we won't have to worry about them explicitly. With that substitution, the model parameters are $I_0$, $p$, $t_\mathrm{max}$ and $t_\mathrm{E}$.
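Written out explicitly (this is just the algebra implied by the paragraph above), the model lightcurve in magnitudes is
$I(t) = I_0 - 2.5\,\log_{10}\left[\frac{y(t)^2 + 2}{y(t)\sqrt{y(t)^2+4}}\right]$,
with $y(t)$ as defined previously.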
paramnames = ['I0', 'p', 'tmax', 'tE']
param_labels = [r'$I_0$', r'$p$', r'$t_{max}$', r'$t_E$']
Using the equations above, implement a function predicting the $I$-band magnitude for a microlensing event as a function of $t$ given $I_0$, $p$, $t_\mathrm{max}$ and $t_\mathrm{E}$.
def model_I(t, I0, p, tmax, tE):
"""
Return the model lightcurve in magnitude units, I(t), where t can be an array.
"""
Most of the parameters enter the model in an easily interpretable way. $I_0$ sets the constant level of the unlensed lightcurve, $t_\mathrm{max}$ translates the microlensing event in time, and $t_\mathrm{E}$ determines how long the event lasts. $p$ is a little less straightforward, so it helps to plot a few different values:
plt.rcParams['figure.figsize'] = (6.0, 4.0)
plt.xlabel(r'$(t-t_\mathrm{max})/t_\mathrm{E}$');
plt.ylabel(r'$I-I_0$');
plt.gca().invert_yaxis();
tgrid = np.linspace(-3.0, 3.0, 1000)
plt.plot(tgrid, model_I(tgrid, I0=0.0, p=0.1, tmax=0.0, tE=1.0), label='p=0.1');
plt.plot(tgrid, model_I(tgrid, I0=0.0, p=0.5, tmax=0.0, tE=1.0), label='p=0.5');
plt.plot(tgrid, model_I(tgrid, I0=0.0, p=1.0, tmax=0.0, tE=1.0), label='p=1.0');
plt.plot(tgrid, model_I(tgrid, I0=0.0, p=2.0, tmax=0.0, tE=1.0), label='p=2.0');
plt.plot(tgrid, model_I(tgrid, I0=0.0, p=10.0, tmax=0.0, tE=1.0), label='p=10.0');
plt.legend();
Remember that $p$ is proportional to the impact parameter, so smaller $p$ means that the lens passes closer to the star, and hence causes more magnification.
Now that the domain-specific calculations that we'll need are in hand, let's turn to specifying the generative model for these data. Lacking any better information, we'll assume that the sampling distributions for the magnitude measurements (the "magnitude" column) are Gaussian and independent, with means given by the model $I(t)$ and standard deviations given by the "magnitude error" column, and that the time stamps are exact. As usual, we will discuss and collectively decide on priors for the parameters in class. This includes prior probabilities for whether or not there is a microlensing event in the data, since we will do model selection to decide between these possibilities. (As mentioned above, this is a little silly because the OGLE pipeline has already decided the lightcurve has a probable event in it. Nevertheless, we will decide on prior probabilities and work through the exercise.)
Draw the PGM and write out the generative model here:
Space for your generative model
For simplicity, we will want independent prior distributions for each parameter - this is typical anyway, but it especially affects the implementation in this case. Below, specify the priors using scipy.stats distribution objects, or something with equivalent functionality:
#priors = {'I0':...,
# 'p':...,
# 'tmax':...,
# 'tE':...}
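Purely as an illustration of the expected format (the actual choices are whatever we agree on in class; the ranges below are placeholder assumptions tied loosely to the span of the data), independent uniform priors could be specified like this:
priors = {'I0': st.uniform(loc=data['I'].min()-1.0, scale=(data['I'].max()-data['I'].min())+2.0),
          'p': st.uniform(loc=0.0, scale=5.0),                                      # placeholder range
          'tmax': st.uniform(loc=data['t'].min(), scale=data['t'].max()-data['t'].min()),
          'tE': st.uniform(loc=0.0, scale=data['t'].max()-data['t'].min())}         # placeholder range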
Finally, the prior probability of a microlensing vs constant model:
# P_microlens = ...
P_constant = 1.0 - P_microlens
Fit the microlensing model using standard MCMC¶
The first thing we'll do is fit the microlensing model using methods you're already familiar with, to establish some results that we're confident in.
For both of the methods we'll use in this notebook, we will need a log-likelihood function defined in the usual way. For convenience, given the packages we'll be using, make it a function of a parameter array (in the order I0, p, tmax, tE), rather than a function with separate, explicit arguments, as we usually do. Remember that we will be computing the evidence, so we want all the normalizing factors correctly included in the sampling and prior distributions.
def log_like(params):
# params is a 1D array of values, whose order is given by paramnames
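A minimal sketch of one possible implementation, assuming the independent Gaussian sampling distributions described above (st.norm.logpdf includes the normalization we need for the evidence):
def log_like(params):
    # params is a 1D array of values, whose order is given by paramnames
    I0, p, tmax, tE = params
    mu = model_I(data['t'], I0, p, tmax, tE)  # model magnitude at each observation time
    return np.sum(st.norm.logpdf(data['I'], loc=mu, scale=data['Ierr']))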
Let's check that this gives us a finite answer for a bad (but not absurd) guess at the parameter values.
guess = [np.mean(data['I']), 1.0, np.mean(data['t']), 100.]
print(log_like(guess))
assert(np.isfinite(log_like(guess)))
-485883.1636646219
Here is our usual log-posterior function, using your definition of the priors and log-likelihood:
def log_posterior(pvec):
'''
Our usual log-posterior function, able to take a vector argument to satisfy emcee
'''
lnp = 0.0
for i,p in enumerate(paramnames):
lnp += priors[p].logpdf(pvec[i])
if lnp != -np.inf:
lnp += log_like(pvec)
return lnp
We'll be using emcee, which will work much better if we start it out near the posterior maximum. Define a parameter vector, start, that looks like a decent fit - it does not need to be perfect. You can use the commented code below to maximize the log-posterior using scipy.optimize.minimize, or just change values by hand until the curve in the figure below looks broadly reasonable. In the former case, you might still need to adjust the minimizer's starting point (guess) to get it to find the best fit.
# start = ...
# or, e.g.
# def objective(pvec):
# return -log_posterior(pvec)
# guess = ...
# opt = minimize(objective, guess, method='Nelder-Mead') # (I used Nelder-Mead because I was too lazy to encode the prior boundaries on the parameters)
# print(opt)
# assert opt.success
# start = opt.x
message: Optimization terminated successfully. success: True status: 0 fun: -7983.1021989030605 x: [ 1.673e+01 9.585e-01 6.700e+03 2.024e+01] nit: 219 nfev: 380 final_simplex: (array([[ 1.673e+01, 9.585e-01, 6.700e+03, 2.024e+01], [ 1.673e+01, 9.585e-01, 6.700e+03, 2.024e+01], ..., [ 1.673e+01, 9.585e-01, 6.700e+03, 2.024e+01], [ 1.673e+01, 9.585e-01, 6.700e+03, 2.024e+01]]), array([-7.983e+03, -7.983e+03, -7.983e+03, -7.983e+03, -7.983e+03]))
plt.rcParams['figure.figsize'] = (20.0, 4.0)
plt.errorbar(data['t'], data['I'], yerr=data['Ierr'], fmt='.', zorder=0);
tgrid = np.linspace(data['t'].min(), data['t'].max(), 1000)
plt.plot(tgrid, model_I(tgrid, *start));
plt.xlabel('HJD - '+str(data['t0']));
plt.ylabel('I magnitude');
plt.gca().invert_yaxis();
From here, the code to actually perform the MCMC is given. As always, you are responsible for tweaking things and/or adjusting the burn-in length etc. as needed. Note that I had to set the starting ensemble to be quite tight in parameter space to make this work (you can adjust this if necessary), which suggests that you may have trouble if the starting guess is not good enough.
npars = len(paramnames)
nwalkers = 2 * npars
esampler = emcee.EnsembleSampler(nwalkers, npars, log_posterior)
estart = np.array([np.array(start)*(1.0 + 0.001*np.random.randn(npars)) for j in range(nwalkers)])
%%time
esampler.run_mcmc(estart, 5000); # run for longer if you want/need
CPU times: user 38.1 s, sys: 170 ms, total: 38.3 s Wall time: 39.3 s
Don't forget the usual diagnostics!
plt.rcParams['figure.figsize'] = (16.0, 3.0*npars)
fig, ax = plt.subplots(npars, 1);
cr.plot_traces(esampler.chain[:min(8,nwalkers),:,:], ax, labels=param_labels);
burn = 500 # adjust as needed
echain = esampler.chain[:,burn:,:]
R = cr.GelmanRubinR(echain)
print(R)
assert R.max() < 1.1
[1.00187628 1.00778347 1.00208209 1.00602891]
neff = cr.effective_samples(echain, maxlag=750, throw=True)
print(neff)
assert neff.min() > 300 # this is fewer than we would normally like, but we only want these results to compare to nested sampling
[584.39707869 706.58364499 478.13198863 651.53018595]
We may as well have a look at the posterior, although we'll forgo computing credible intervals:
echain = np.concatenate(echain, axis=0)
plotGTC(echain, paramNames=param_labels, figureSize=6, customLabelFont={'size':10}, customTickFont={'size':10});
Fit the microlensing model using nested sampling¶
Now that we have an estimate of the posterior from a familiar, albeit not foolproof method, let's see how results from nested sampling compare. Recall that nested sampling is not MCMC, but it will provide what are effectively samples from the posterior, as well as an estimate of the evidence.
Rather than a log-posterior function, we will need to provide the sampler with a log-likelihood function (already done!) and a function that evaluates the quantiles of the prior distributions. This is why we particularly wanted the priors to be independent; one can do this with non-independent priors, but the implementation becomes more complicated.
To be more explicit, we need to write a function that, for each parameter, transforms a number between 0 and 1 to the corresponding quantile of the parameter's prior distribution. (Recall that the quantile function is the inverse of the cumulative distribution function, so it maps cumulative probability onto parameter values.) If your priors dictionary consists of scipy.stats distribution objects, the ppf method is your friend here.
def ptform(u):
'''
Input: a vector in the unit cube, 0 <= u[i] <= 1.
Output: a vector in our parameter space, output[i] = quantile_i(u[i]).
'''
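A minimal sketch, assuming priors is a dictionary of scipy.stats distribution objects as suggested above:
def ptform(u):
    # map each coordinate of the unit cube through the quantile function (ppf) of the corresponding prior
    return np.array([priors[name].ppf(u[i]) for i, name in enumerate(paramnames)])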
The lines below should respectively print the 25th, 50th and 75th percentiles of each parameter's prior, in order:
print(ptform([0.25]*len(paramnames)))
print(ptform([0.5]*len(paramnames)))
print(ptform([0.75]*len(paramnames)))
[np.float64(15.97275), np.float64(0.875), np.float64(5688.490447500022), np.float64(422.677937499946)] [np.float64(16.5795), np.float64(1.75), np.float64(6111.168384999968), np.float64(845.355874999892)] [np.float64(17.18625), np.float64(2.625), np.float64(6533.846322499914), np.float64(1268.033812499838)]
These cells show the basic setup and running of nested sampling using the dynesty package. This will probably take a few minutes, but pretty soon you should see the dlogz output steadily making its way towards zero.
sampler = dynesty.NestedSampler(log_like, ptform, len(paramnames))
%%time
sampler.run_nested()
CPU times: user 2min 48s, sys: 12.7 s, total: 3min 1s Wall time: 3min 2s
The cells below show some standard summaries of the dynesty results, which their documentation says a little more about. ($\ln X$ tracks the fraction of the prior volume that the algorithm is still working in, so you can read increasing $-\ln X$ as the nested sampler making its way towards the peak of the posterior.)
results = sampler.results
results.summary()
Summary ======= nlive: 500 niter: 16979 ncall: 93755 eff(%): 18.643 logz: 7966.879 +/- 0.443
try:
dynesty.plotting.runplot(results); # this sometimes fails for no identifiable reason; don't worry about it if so
except:
pass
/Users/amantz/miniconda3_2024/envs/p267/lib/python3.12/site-packages/dynesty/plotting.py:252: RuntimeWarning: overflow encountered in exp np.exp(logwt), logz if logplot else np.exp(logz)
/Users/amantz/miniconda3_2024/envs/p267/lib/python3.12/site-packages/dynesty/plotting.py:282: RuntimeWarning: overflow encountered in exp zspan = (0., 1.05 * np.exp(logz[-1] + 3. * logzerr[-1]))
It's not unusual in my limited experience for the evidence plot above to display a flat line, so we plot below the log evidence in the second half of the run. You should be able to see it climbing towards its final value.
plt.rcParams['figure.figsize'] = (12.0, 4.0)
Ndiscard = len(results['logz']) // 2
plt.plot(results['logz'][Ndiscard:]);
plt.xlabel("Iteration - "+str(Ndiscard), fontsize=12);
plt.ylabel("Log Evidence", fontsize=12);
Some more dynesty plots showing how the sampler evolves from exploring the entire prior space towards the posterior maximum.
fig, axes = dyplot.traceplot(results, quantiles=st.norm.cdf([-1,1]), labels=param_labels)
We can extract a set of "equally weighted" samples (i.e. samples we can treat the same way as MCMC samples) using results.samples_equal(). The cell below compares their distribution to the emcee chains. If everything is working well, they should look essentially identical, up to Monte Carlo noise.
dchain = results.samples_equal()
plotGTC([echain, dchain], paramNames=param_labels, figureSize=6, customLabelFont={'size':10}, customTickFont={'size':10});
Here is an unsophisticated check that nested sampling did, in fact, give us compatible results to MCMC:
assert np.allclose(echain.mean(axis=0), dchain.mean(axis=0), rtol=0.01)
assert np.allclose(echain.std(axis=0), dchain.std(axis=0), rtol=0.1)
Fit a constant model using nested sampling¶
Ok, we are halfway to being able to test whether the Bayesian evidence "detects" a microlensing event in these data. The logical model to compare to is a constant flux from the star, with all the variation attributed to the sampling distribution. Don't worry, this fit will take less time to run.
For our constant model, we have just one free parameter, $I_0$.
paramnames2 = paramnames[:1]
param_labels2 = param_labels[:1]
To make the evidence comparison fair, it makes sense for $I_0$ to have the same prior in both models.
priors2 = {k:priors[k] for k in paramnames2}
Your implementation for the prior quantile function can be completely analogous to the one you wrote earlier, but operating on this 1D parameter space:
def ptform2(u):
'''
Input: a vector in the unit cube, 0 <= u[i] <= 1.
Output: a vector in our parameter space, output[i] = quantile_i(u[i]).
'''
We also need a new likelihood function that compares the data to a constant model.
def log_like2(params):
# params is a 1D array of length 1, containing I0
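A possible sketch, mirroring log_like above but with the model replaced by a constant magnitude:
def log_like2(params):
    # params is a 1D array of length 1, containing I0
    return np.sum(st.norm.logpdf(data['I'], loc=params[0], scale=data['Ierr']))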
For completeness, let's do the same checks of these functions as above.
print(ptform2([0.25]))
print(ptform2([0.5]))
print(ptform2([0.75]))
assert np.isfinite(log_like2(guess[:1]))
[15.97275] [16.5795] [17.18625]
Let us patiently run the nested sampler for this model...
sampler2 = dynesty.NestedSampler(log_like2, ptform2, len(paramnames2))
%%time
sampler2.run_nested()
CPU times: user 25.3 s, sys: 3.39 s, total: 28.7 s Wall time: 27.8 s
... and gaze upon the results.
results2 = sampler2.results
results2.summary()
Summary ======= nlive: 500 niter: 5030 ncall: 24378 eff(%): 22.684 logz: -43307.463 +/- 0.236
try:
dynesty.plotting.runplot(results2);
except:
pass
/Users/amantz/miniconda3_2024/envs/p267/lib/python3.12/site-packages/dynesty/plotting.py:318: UserWarning: Attempting to set identical low and high ylims makes transformation singular; automatically expanding. axes[i].set_ylim([ymin, ymax])
dyplot.traceplot(results2, quantiles=st.norm.cdf([-1,1]), labels=param_labels2);
Let's extract the final evidence values from the two model fits and compare them:
print("Microlensing model: logz =", results.logz[-1], "+/-", results.logzerr[-1])
print("Constant model: logz =", results2.logz[-1], "+/-", results2.logzerr[-1])
print("Difference in logz =", results.logz[-1]-results2.logz[-1], "+/-", np.sqrt(results.logzerr[-1]**2+results2.logzerr[-1]**2))
Microlensing model: logz = 7966.879087988207 +/- 0.4428516123919006 Constant model: logz = -43307.462915090895 +/- 0.23606142794953755 Difference in logz = 51274.3420030791 +/- 0.5018391658327206
Chances are this difference will be an overwhelming evidence ratio when exponentiated. But maybe it isn't for one of the data sets! So let's go ahead and form the posterior ratio for the models (microlensing over constant), not being surprised if it turns out to be numerically infinite.
print("Prior ratio:", P_microlens / P_constant)
print("Evidence ratio:", np.exp(results.logz[-1]-results2.logz[-1]))
print("Posterior ratio:", np.exp(results.logz[-1]-results2.logz[-1]) * P_microlens / P_constant)
Prior ratio: 1.0 Evidence ratio: inf Posterior ratio: inf
/var/folders/94/15_9sbbs5d94bjspzjf0whj00000gn/T/ipykernel_19640/2187677686.py:2: RuntimeWarning: overflow encountered in exp print("Evidence ratio:", np.exp(results.logz[-1]-results2.logz[-1])) /var/folders/94/15_9sbbs5d94bjspzjf0whj00000gn/T/ipykernel_19640/2187677686.py:3: RuntimeWarning: overflow encountered in exp print("Posterior ratio:", np.exp(results.logz[-1]-results2.logz[-1]) * P_microlens / P_constant)
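If the overflow warning bothers you, the same comparison can be done entirely in log space; a minimal sketch using quantities already defined above:
log_prior_ratio = np.log(P_microlens) - np.log(P_constant)
log_evidence_ratio = results.logz[-1] - results2.logz[-1]
print("Log posterior ratio (microlensing over constant):", log_evidence_ratio + log_prior_ratio)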
Finally, let's compare the posterior mean models with the data. (Normally we would plot multiple parameter samples from each posterior, but in this problem the models are usually so tightly constrained that it's impossible to distinguish the curves.)
dchain2 = results2.samples_equal()
plt.rcParams['figure.figsize'] = (20.0, 4.0)
plt.errorbar(data['t'], data['I'], yerr=data['Ierr'], fmt='.', zorder=0, label='data');
plt.plot(tgrid, model_I(tgrid, *dchain.mean(axis=0)), label='microlensing');
plt.axhline(dchain2.mean(), color='C2', label='constant');
plt.xlabel('HJD - '+str(data['t0']));
plt.ylabel('I magnitude');
plt.gca().invert_yaxis();
plt.legend();
Visually, does the preference or lack of preference for the microlensing model make sense? Does the prior have any bearing on whether we would conclude that there is a microlensing event here?
I_have_answers_to_these_questions = False # change to True when true
assert I_have_answers_to_these_questions
Parting thoughts¶
Although the central question of whether lightcurves chosen to contain microlensing events do, in fact, contain microlensing events was a bit contrived, hopefully this tutorial has been useful for confronting the occasional ugliness of real data, and for introducing a package for nested sampling. We have some lingering questions about these data, namely whether the sampling distribution is well described by the "error bars" and whether a constant is actually a good description of the data apart from the lensing event.
Endnotes¶
Note 1¶
From within the Stanford network, it should be possible to download the PDF directly through the link above. From outside, you would need to use the Stanford libraries browser extension detailed on the Stanford library e-resources page (or VPN). Either way, you don't actually need to get the book; the key information is reproduced here.