Tutorial: X-ray Image Data¶
In which we introduce a real astronomical data set, namely an image produced from X-ray CCD data. There's a fair bit of domain-specific information here which is not strictly necessary for this class, but it's useful stuff to see if you haven't worked with imaging data before (regardless of wavelength). Do note that we are still glossing over some things, though, since a more rigorous analysis that accounts for all instrumental and systematic effects would be more involved than we want any tutorials in this class to be.
In terms of the statistical analysis, we will be sticking with things you've done before, just practicing in a more realistic context where we might want to use a few tricks to speed up our calculations. We will make a few pointed suggestions along those lines, including the use of numba
, which you don't have to take... but this is a problem where taking 20% off the run time is noticeable. Unlike previous notebooks, we won't prescribe a specific algorithm or package for you to use. Exactly how to carry out the fits is up to you, although you are expected to follow best practices (testing convergence, etc.). This is not a terribly difficult inference, but - warning! - it can be tricky to get chains to sample efficiently. It's good practice for situations that are not quite as nice as our pedagogical examples from earlier. It will probably take longer than typical to run (possibly quite a bit longer).
In more detail, you will
- be introduced to imaging data (specifically X-ray);
- fit a simple/symmetric model for the spatial distribution of emission from the gas in a cluster of galaxies, plus an instrumental background;
- fit a second model that includes a dense core of bright gas at the cluster center;
- compare the two for your own data, and (in conjunction with classmates) see how this varies among clusters.
from os import getcwd
from os.path import exists as file_exists
from yaml import safe_load, safe_dump
from astropy.io import fits
from astropy.visualization import LogStretch
from astropy.wcs import WCS
logstretch = LogStretch()
from numba import njit
import numpy as np
from regions import Regions
import scipy.stats as st
import matplotlib.pyplot as plt
%matplotlib inline
import incredible as cr
from pygtc import plotGTC
thisTutorial = 'xray_image'
if getcwd() == '/content':
    # assume we are in Colab, and the user's data directory is linked to their drive/Physics267_data
    from google.colab import drive
    drive.mount('/content/drive')
    datapath = '/content/drive/MyDrive/Physics267_data/' + thisTutorial + '/'
else:
    # assume we are running locally somewhere and have the data under ./data/
    datapath = 'data/'
Nature of the data¶
Modern X-ray CCDs are technologically similar to the CCDs used in optical astronomy: when a photon hits a pixel, one or more electrons are promoted into the conduction band and trapped there until being read out. The main practical difference is that X-ray photons are rarer and their energies much higher.
This means that:
- Only for exceptionally bright sources will we ever have $>1$ photon hit a given pixel in an integration, if we read out the CCD every few seconds.
- We do not get 1 electron promoted per photon, as is the case in visible wavelength CCDs. Instead, the number of electrons is roughly proportional to the photon's energy, which means that these imaging devices are actually imaging spectrometers.
- When we say "counts" in this context, we mean "pixel activation events" rather than number of electrons trapped, so that (as in optical astronomy) we're referring to the number of photons detected (or other events that look like photons to the detector).
For simplicity, we will not be dealing with "raw" data as described above, but with images that have been made from it. In particular, the spectral information has been thrown away, apart from limiting the counts in our image to a particular energy band (0.6-2.0 keV in this case). The images have also been binned by a factor of 4 to reduce the computational overhead (i.e. the number of image pixels) for this notebook. The original data are from the Chandra X-ray Observatory, and have been cleaned, filtered, and had other things done to them that are beyond the scope of this problem.
The 2 files we need are:
- the image, in units of counts per image pixel ($4\times4$ detector pixels)
- the exposure map
The latter is a little confusing, as it plays multiple roles. In particular, the exposure map encodes
- vignetting, which effectively decreases the telescope's sensitivity with increasing distance from the optical axis;
- the quantum efficiency of each detector pixel, including dead or damaged pixels (recorded like the flat field in optical bands);
- the effective collecting area of the telescope for the photon energies recorded in the image.
The first two of these are functionally like the flat field image used in optical astronomy. The third point means that the exposure map has units of area, specifically $\mathrm{cm}^2$. Oddly enough, in this case, the exposure map does not include the actual exposure time of the observation, so we will need to multiply that in ourselves later, after which the map will have units of $\mathrm{cm}^2\cdot\mathrm{s}$. This is exactly what we need to transform a model of the sky in $\mathrm{counts}\,\mathrm{s}^{-1}\,\mathrm{cm}^{-2}\,\mathrm{pixel}^{-1}$ into a prediction for the expected number of counts in each image pixel. (The model defined this way is in terms of surface brightness, i.e. counts or energy per unit area, time, and solid angle.) Note that, from here on out, "pixel" will refer to an entry in the data arrays (an image pixel), not a physical pixel in the detector.
Both files are in FITS image format, which we can read in using astropy.io.fits
.
imfits = fits.open(datapath + 'image_0.6-2.0keV.fits.gz')
exfits = fits.open(datapath + 'expmap_1.25kev.fits.gz')
Let's see what we've got:
imfits.info()
Filename: ../../data/public/xray_image/image_0.6-2.0keV.fits.gz
No.    Name      Ver    Type      Cards   Dimensions   Format
  0  PRIMARY       1 PrimaryHDU     983   (883, 883)   int16
exfits.info()
Filename: ../../data/public/xray_image/expmap_1.25kev.fits.gz
No.    Name      Ver    Type      Cards   Dimensions   Format
  0  PRIMARY       1 PrimaryHDU     173   (883, 883)   float32
In general, FITS files can contain multiple data structures, but each of these has only an image array and supporting header information. The image in imfits
is of integer type (remember, counts!), while exfits
is of floating point type.
Here we extract the actual array of data from each object into numpy
arrays.
im = imfits[0].data
ex = exfits[0].data
print(im.shape, im.dtype)
print(ex.shape, ex.dtype)
(883, 883) >i2
(883, 883) >f4
Note: If we wanted im
to be floating point for some reason, we would need to cast it, as in im = imfits[0].data.astype('float64')
. We'll use this type conversion below, but it's not necessary here.
As mentioned above, we will need the exposure time to convert a model for surface brightness into a prediction for the counts in each pixel. So let's go ahead and extract that information from the FITS header, and multiply it into the exposure map.
ex *= imfits[0].header['exposure']
Let's have a look at the image and exposure map. It's often helpful to stretch images on a logarithmic scale because some sources can vary spatially in brightness by orders of magnitude. (It's often still not easy to see any detail without manually adjusting the bias and contrast, but we'll see a simple way to do that interactively in a minute.) The exposure map varies much less, so a linear scale works better in that case.
plt.rcParams['figure.figsize'] = (12.0, 6.0)
fig, ax = plt.subplots(1,2);
ax[0].imshow(logstretch(im), cmap='gray', origin='lower');
ax[0].set_title('image (log scale)');
ax[1].imshow(ex, cmap='gray', origin='lower');
ax[1].set_title('exposure map');
Aside: An endless source of confusion and bugs is the fact that images are conventionally indexed by line and sample (vertical and horizontal position), while we conventionally order coordinates in 2 dimensions $x,y$ (horizontal and vertical). In addition, the usual convention for FITS images orders the lines from the bottom of the image up rather than the top down. Hence, to display the image the right way up, we need to use the
origin='lower'
option to imshow
above.
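For example (the pixel position below is arbitrary, purely for illustration), pulling out a single value while respecting these conventions looks like:

x, y = 500, 300  # an arbitrary example position
print('counts at (x=%d, y=%d):' % (x, y), im[y, x])  # first index is the line (y), second the sample (x)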
Note that information from multiple CCDs has been combined here, and that X and Y in the image arrays correspond to celestial coordinates (right ascension and declination) rather than X and Y on a given detector or in the focal plane. There are fancy packages that can display such images with celestial coordinates on the axes (the translation from image pixel position to celestial coordinates is encoded in the FITS header), but we won't need to deal with such things in this exercise.
In the image, we can see:
- A galaxy cluster (the big blob).
- Various other sources (smaller blobs). These are point-like sources - mostly active galactic nuclei (AGN) - that have been smeared out by the telescope's point spread function (PSF). You might even be able to see clearly how the size of the PSF increases with distance from the optical axis.
- A roughly uniform background, consisting of fainter AGN, diffuse X-rays from the Galactic halo and local hot bubble, and events due to particles (solar wind protons and cosmic rays) interacting with the CCD.
- In the data used for the public solutions, we can also see a bright streak connecting the brightest part of the cluster to the upper edge of the CCD. This is due to charge transfer inefficiency, as opposed to a physical structure in the Universe. Fortunately, the surface brightness needs to be extremely large for this effect to show up above the background, so you're unlikely to see it in your own data.
The exposure map shows:
- An overall gradient with distance from the optical axis - this is the vignetting function of the telescope.
- Fuzzy boundaries between the CCDs (fuzzy because of dithering), and a number of "bad columns" where the exposure has been set to zero (usually this is due to issues with the readout electronics rather than damaged detector pixels). The latter may not correspond to zeros in our exposure map, again because of dithering, and because we have binned up the original, detector-resolution map.
The effects of (2) are also visible in the counts image. The vignetting is less obvious, since we mostly see background in regions where the vignetting is significant, and most of the background is due to particles that are not vignetted (they aren't focused by the optics, and hit the detector from all directions approximately equally).
The exact details will of course vary depending on which data set you were assigned, but in general the comments above should apply.
Working with the data¶
As we've seen above, the image is encoded in a standard numpy
array. But, recalling the aside, we need to be careful about indexing the array. Specifically, we need to remember that the first array index corresponds to $y$ (the vertical direction in the image), and the second index corresponds to $x$ (horizontal). Alternatively, we could create arrays that hold the $x$ and $y$ indices corresponding to each pixel. This is a little wasteful in terms of computer memory, but allows us to do calculations involving the positions of and distances between points in the image without constantly relying on our human memories to recall something counterintuitive.
The following cell adds such index arrays (imx
and imy
) to a data dictionary, along with the image and exposure map.
data = {'im': im, 'ex':ex}
data['imx'], data['imy'] = np.meshgrid(np.arange(im.shape[1]), np.arange(im.shape[0]))
In case it wasn't clear, a quick look at imx
and imy
probably explains what they're good for:
plt.rcParams['figure.figsize'] = (6.0, 6.0)
fig, ax = plt.subplots(1,2);
ax[0].imshow(data['imx'], cmap='gray', origin='lower');
ax[0].set_title('imx');
ax[1].imshow(data['imy'], cmap='gray', origin='lower');
ax[1].set_title('imy');
The range of values in each is what you'd expect for indices into arrays of this size:
print(data['imx'].min(), data['imx'].max())
print(data['imy'].min(), data['imy'].max())
0 882
0 882
With these defined, we can easily compute, e.g., the distance of each pixel from a given location $(x_0,y_0)$, without ever having to think about the indexing conventions again.
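For instance, a minimal sketch (the reference point here is an arbitrary placeholder, not something you need):

x0, y0 = 441.0, 441.0  # hypothetical reference position
dist = np.sqrt((data['imx'] - x0)**2 + (data['imy'] - y0)**2)  # distance of every pixel from (x0, y0)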
Before jumping into the analysis, there is one more practical issue to take care of, namely the various sources in the image that are not the galaxy cluster of interest. In principle, we could fit a very complex model that includes all of these sources. But we don't actually care about them, and doing so would require modeling the point spread function of the telescope, which varies in a complicated way over the field of view (it can, however, be ignored for the cluster itself, given its inherent fuzziness). A better option is to simply mask (i.e. ignore) parts of the image where non-cluster sources are visible.
There are clever ways to algorithmically detect sources (and specifically point-like sources) in images like this, given knowledge of how the PSF varies across the field of view, but they're not foolproof, and in any case are beyond the scope for us. Instead, we will just manually identify the regions to be masked, using a tool called JS9. (This is a Javascript approximation of DS9; if you're already familiar with that, have it installed and prefer to use it, then go ahead.) It should magically appear when running the following cell.
%%html
<div class="JS9Menubar"></div>
<div class="JS9"></div>
<link type="text/css" rel="stylesheet" href="//js9.si.edu/jupyter/js9-allinone.css">
<script type="text/javascript" src="//js9.si.edu/jupyter/js9-allinone.js"></script>
As convenient as it is to have a tool like this just pop up in a notebook, it isn't (as far as we know) possible to directly open a file from Google drive, so if you're used to running these notebooks in Colab, you will still need to download the image FITS file to your local hard drive. Then open it using the menu
- File $\rightarrow$ open local...
Like above, we will want to log-scale it
- Scale $\rightarrow$ log
Move the mouse around over the image. At the top, you can see: the number of counts under the mouse cursor, the celestial coordinates corresponding to that position, and the physical coordinates (yet another coordinate system, defined with respect to the detector module).
Left click + drag will change the contrast and bias; right click + drag will pan the view. It's worth taking a minute to play with the contrast and bias to see how you might change these in order to (1) best see the detail of the cluster or (2) best see the point sources showing up above the background (and/or above the cluster).
On to defining the regions to mask. Click Regions $\rightarrow$ circle. A green circle should appear in the middle of the window. Your goal is to add regions like this that enclose
- the point-like sources,
- the fuzzy edges between the CCDs, and
- any CCDs we will not use.
For the latter two, you should use the rectangle shape, which can be elongated and rotated, rather than the circle.
You don't have to go crazy circling anything that might possibly be a point source (it's easy to go too far and mask statistical fluctuations in the background), but do remove anything that is reasonably clear, keeping in mind that they will appear larger the farther they are from the optical axis. The Edit $\rightarrow$ copy/paste shortcuts are your friend here. As for which CCDs not to use:
- If your data include a $2\times2$ grid of CCDs, then any additional CCDs not in the $2\times2$ grid should be removed.
- Otherwise, your data will look like 3 or 4 CCDs in a row, possibly with 1 or 2 off to the side. In this case, 2 of the CCDs in the row will clearly have many more counts than the others. These are the only 2 that should be used.
If in doubt, refer to the solutions as a guide. (Note that the solutions also include a box covering the streak mentioned above, which you probably will not have to deal with.)
When you're done, click Regions $\rightarrow$ list, and save the text from the window that pops up as a string in the cell below. You can also save a region file (this just contains the same text) to disk for safe keeping, in case you want to come back and edit the regions in JS9 again.
# region_string = """
# FK5
# circle(...
# ...
# box(...
# ...
# """
We will now use the regions
package, in conjunction with the coordinate information in the FITS header, to define an array of the same size as the image, that holds the value True
for pixels within the union of the regions above and False
outside of them.
wcs = WCS(imfits[0].header)
regions = Regions.parse(region_string, format='ds9')
# One wonders why the below is not a single function call... perhaps in some future version...
regions_pix = [region.to_pixel(wcs) for region in regions]
region_mask = np.full(im.shape, 0.0)
for region in regions_pix:
    region_mask += region.to_mask().to_image(im.shape)
region_mask = (region_mask != 0.0)
WARNING: FITSFixedWarning: 'datfix' made the change 'Set DATEREF to '1998-01-01' from MJDREF. Set MJD-END to 53973.732083 from DATE-END'. [astropy.wcs.wcs]
In case that explanation was too convoluted, this is what the mask looks like:
plt.rcParams['figure.figsize'] = (12.0, 6.0)
fig, ax = plt.subplots(1,2);
ax[0].imshow(logstretch(im), cmap='gray', origin='lower');
ax[0].set_title('image (log scale)');
ax[1].imshow(region_mask, cmap='gray', origin='lower');
ax[1].set_title('region mask from JS9');
We will similarly want to mask pixels that have very low values in the exposure map. Recall that (other than the places where there isn't an actual CCD), these are largely due to bad columns or damaged detector pixels. Rather than perfectly trust these lowered exposure values, it's safer to entirely mask these. Below, define an exp_mask
that works like the region_mask
(i.e. Boolean type, and True
in the pixels you want to mask) that masks pixels where the exposure map is less than half of its maximum value. Note that you do not need to invoke the regions
package to do this; it's just a function of the exposure map array that we already have.
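If a starting point helps, the description above translates directly into a one-liner along these lines (yours can of course differ):

exp_mask = ex < 0.5 * ex.max()  # True where the exposure is less than half its maximum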
# exp_mask = ...
plt.rcParams['figure.figsize'] = (12.0, 6.0)
fig, ax = plt.subplots(1,2);
ax[0].imshow(ex, cmap='gray', origin='lower');
ax[0].set_title('exposure map');
ax[1].imshow(exp_mask, cmap='gray', origin='lower');
ax[1].set_title('low exposure mask');
Let's visualize what's left of the image if we take away the union of those two masks. You should still see the extended emission from the cluster, but the other sources and regions we identified above should be blank (again, compare with the solutions if in doubt).
combined_mask = np.logical_or(region_mask, exp_mask)
plt.rcParams['figure.figsize'] = (16.0, 6.0)
fig, ax = plt.subplots(1,3);
ax[0].imshow(logstretch(im), cmap='gray', origin='lower');
ax[0].set_title('image (log scale)');
ax[1].imshow(logstretch(np.where(combined_mask, np.nan, im)), cmap='gray', origin='lower');
ax[1].set_title('masked image (log scale)');
ax[2].imshow(np.where(combined_mask, 0.0, ex), cmap='gray', origin='lower');
ax[2].set_title('masked exposure map');
Notionally, we can use combined_mask
to limit all the calculations we'll need to do (e.g. summing the log-likelihood over pixels) to the useful part of the image. In practice, the code will be significantly more efficient if we re-define the data that we want to use as 1D arrays that only include the pixels of interest. This is another reason that having our imx
and imy
arrays is nice - to take advantage of this trick, we need to have the x
and y
positions of each pixel explicitly saved so we will know where they belong. In case some of these numpy
functions are unfamiliar, the following saves an array of indices, corresponding to the unmasked pixels, into the image or exposure map arrays once they have been collapsed to 1D.
goodpix = np.flatnonzero(~combined_mask)
We can then use the flatten
function to change the shape of each array to 1D, and subscript them with goodpix
to extract just the pixels we care about. We also change the data types of the image and exposure map here, because the final computational speed-up we will recommend (later on) requires them to be 64-bit for whatever reason.
data['flatim'] = data['im'].flatten()[goodpix].astype('int64') # numba refuses to work with short int
data['flatex'] = data['ex'].flatten()[goodpix].astype('float64') # numba refuses to work with single precision float
data['flatx'] = data['imx'].flatten()[goodpix]
data['flaty'] = data['imy'].flatten()[goodpix]
data['goodpix'] = goodpix
Just to be absolutely sure that we haven't lost something vital, and to test your array juggling skills, let's use these flattened/shortened arrays to reconstruct the part of the image that we care about. Define a new_im
array that should be identical to data['im']
in the pixels we care about and nan
in those we don't care about, using only the flattened data above. (You can also use the shape
of data['im']
, just not its contents.)
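In case you want a hint, here is one possible sketch (there are several equally good approaches, e.g. using goodpix instead):

# start from an all-NaN image and scatter the flattened counts back into the
# unmasked pixels using their saved (x, y) positions -- note the y-first indexing
new_im = np.full(data['im'].shape, np.nan)
new_im[data['flaty'], data['flatx']] = data['flatim']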
# new_im = ...
plt.rcParams['figure.figsize'] = (12.0, 6.0)
fig, ax = plt.subplots(1,2);
ax[0].imshow(logstretch(data['im']), cmap='gray', origin='lower');
ax[0].set_title('original image (log scale)');
ax[1].imshow(logstretch(new_im), cmap='gray', origin='lower');
ax[1].set_title('rebuilt image (log scale)');
Let's make sure they're exactly the same:
assert np.all(np.logical_or(data['im']==new_im, np.isnan(new_im)))
Defining the model¶
This is an unusual problem for us in that it's entirely possible that no simple model we can write down will be a genuinely good fit to the data. After all, the object we're looking at is a complex thing, well resolved by the telescope, and possibly hosting many kinds of non-trivial yet detectable features. So, instead, we will keep things simple and use a model that will not perfectly explain the data, but will be good enough for some purposes.
More specifically, we'll use the azimuthally symmetric "beta model" (no relation to the beta distribution), a common parametric model for the surface brightness of galaxy clusters:
$S_\mathrm{CL}(x,y) = S_\mathrm{CL}(r) = S_0 \left[1.0 + \left(\frac{r}{r_c}\right)^2\right]^{-3\beta + 1/2}$,
where $r$ is projected distance from the cluster center. Note that this model describes a 2D surface brightness distribution, since $r^2 = (\Delta x)^2 + (\Delta y)^2$. Also note that we can get away with using the Pythagorean theorem like this to compute angular distance over sufficiently small areas (like our field of view), even though the sky is a sphere rather than a plane.$^1$
We are basically free to choose what units we will define $S_0$ and $r_c$ to have, as long as the model can eventually make a prediction for the counts in each pixel. The most convenient choice for our limited purposes is for $S_0$ to have units of $\mathrm{counts}\,\mathrm{s}^{-1}\,\mathrm{cm}^{-2}\,\mathrm{pixel}^{-1}$ and $r_c$ to have units of pixels - this bakes in specifics about our telescope and binning (remember, these are image pixels), but that's fine for us.
The beta model isn't the entirety of the model we'll need, but let's take a second to code up the function above first.
@njit
def betaModel(r, S0, rc, beta):
    '''
    Evaluate the beta model given above as a function of radius
    '''
    # direct transcription of the expression for S_CL(r) above
    return S0 * (1.0 + (r/rc)**2)**(-3.0*beta + 0.5)
Long aside: the @njit
decorator here tells numba
(a package we imported above) that this function is one that it should replace with a compiled version. The benefit is that executing the function can become significantly faster than if Python were interpreting it each time. There is a necessary downside, which is that numba
must be able to identify the data type of every variable that's used in the function the first time it's executed (this is when the compilation happens, "Just In Time"), and those variables must have the same data type in all future calls to the function.$^2$ The upshot is that we end up writing code that is a little more barebones and less easily generalizable, e.g. avoiding the use of object oriented methods that numba
isn't sophisticated enough to decipher, at least in njit
functions.
In this particular case, we found speedups of ~20% using numba
throughout the model evaluation, which seemed worth the extra effort. So, if you for some reason cannot get the notebook to work using numba
, you can just remove the @njit
line(s) and do the problem without it; you'll just end up waiting longer. But this functionality is useful enough in real life, where calculations can take significant time, that it's worth learning about and giving it a try.
It's always a good idea to test any function we write, and this is even more true if the first execution can potentially throw a compilation error. So here we go:
betaModel(1.0, 1.0, 1.0, 0.67) # get it compiled and check for errors of whatever kind
If you have the patience, you can see the difference that compilation makes by running the timing cell below, then going back and redefining the function with @njit
commented out and re-running it. (This isn't perfect, because both are pretty fast and the for loop itself will eat up some time, but you will probably still see a factor of a few difference.)
%%time
for i in range(1000000):
    betaModel(1.0, 0.0, 1.0, 0.67);
CPU times: user 317 ms, sys: 1.55 ms, total: 318 ms Wall time: 318 ms
Moving on, the plot below shows the impact of the $\beta$ parameter on this function. Broadly,
- $S_0$ normalizes the profile,
- $r_c$ is a "core radius" within which the profile is approximately flat, and
- $\beta$ determines the slope of the profile at large radii.
In addition, we will have the position of the cluster center in $x$ and $y$ as free parameters: $(x_0,y_0)$.
Incidentally, $\beta=2/3$ is a "canonical" value, in that the beta model with this value describes an isothermal sphere of gas in hydrostatic equilibrium (i.e. an oversimplified model). That doesn't mean that $2/3$ is the value that you should or will find, but it at least provides a broad idea of what might be reasonable.
plt.rcParams['figure.figsize'] = (6., 4.)
rgrid = 10.**np.linspace(-1., 1.)
plt.loglog(rgrid, betaModel(rgrid, 1.0, 1.0, 0.5), label=r'$\beta=0.5$')
plt.loglog(rgrid, betaModel(rgrid, 1.0, 1.0, 0.67), label=r'$\beta=0.67$')
plt.loglog(rgrid, betaModel(rgrid, 1.0, 1.0, 1.0), label=r'$\beta=1.0$')
plt.legend();
plt.xlabel(r'$r/r_\mathrm{c}$');
plt.ylabel(r'$S(r)/S_0$');
While we cleverly masked out the visible non-cluster sources above, the relatively uniform background still needs to be included in our model. In practice, this background consists of both real X-rays that are focused by the optics and therefore vignetted, and events from particle showers due to cosmic rays interacting with mass in the spacecraft; the latter hit the detector from all directions and are not vignetted by the optics. To keep things simple, we will model only the particle-induced component, since it's much larger than the real X-ray background once all of the point-like sources bright enough to see have been removed. Since this background is not vignetted, the simplest approach is to define it such that we will not need to multiply it by the exposure map to predict how many counts in each pixel it produces. That is, we will parametrize the background as a uniform expected number of background counts per pixel, $B$, with details like the length of the observation implicitly built in. The complete model prediction for the counts in a pixel is then
$N(x,y) = S_\mathrm{CL}(x,y) \, E(x,y) + B$
where $E(x,y)$ is the exposure map.
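As a concrete (and optional) illustration, this prediction can be evaluated over the flattened arrays defined earlier; the parameter values below are arbitrary placeholders, not suggestions:

x0, y0, S0, rc, beta, B = 441.0, 441.0, 1e-5, 5.0, 0.67, 0.05  # hypothetical values
r = np.sqrt((data['flatx'] - x0)**2 + (data['flaty'] - y0)**2)
N_expected = betaModel(r, S0, rc, beta) * data['flatex'] + B  # expected counts in each unmasked pixel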
To recap, our model parameters are
- $x_0$: x pixel coordinate of the cluster center,
- $y_0$: y pixel coordinate of the cluster center,
- $S_0$: cluster surface brightness normalization,
- $r_c$: cluster core radius,
- $\beta$: cluster slope parameter,
- $B$: background count density.
We'll be comparing this model with one where the cluster is described by the sum of 2 concentric beta models,
$S_\mathrm{CL}(r) = S_0 \left[1.0 + \left(\frac{r}{r_c}\right)^2\right]^{-3\beta + 1/2} + S_0' \left[1.0 + \left(\frac{r}{r_c'}\right)^2\right]^{-3\beta' + 1/2}$
where the second beta model shares the same center, $(x_0,y_0)$, and is otherwise parametrized by
- $S_0'$,
- $r_c'$,
- $\beta'$.
Think about what priors might make sense for these different parameters in general; as usual, we will arrive at consensus in class.
paramnames = ['x0', 'y0', 'S0', 'rc', 'beta', 'B']
paramnames2 = paramnames + ['S02', 'rc2', 'beta2']
Below, as we always do, specify the full generative model in expressions and a PGM. We may as well include both beta models here, since we can always get back to the single beta model by setting $S_0'=0$.
Space for your generative model
Visualizing the model¶
Comparing the data and model visually is a little tricky in this case. Once we get away from the brightest part of the cluster, the most common values in the image are likely 0 and 1, which is to say that Poisson noise dominates the value in any given pixel. So, for example, if we made a residual image of a given model prediction minus the data, we would still see a great deal of noise at those radii, and it wouldn't simply tell us whether our background parameter had a reasonable value.
Given that we're fitting an azimuthally symmetric model to the cluster to begin with, it seems reasonable to instead compare the data and model in one dimension, as a function of radius from the (model) cluster center. We lose some information by doing this, but on the other hand it does solve the issue above neatly by combining lots of pixels at large radii together before doing a comparison.
Because we are the greatest, here is a complete class that computes and stores such profiles. In detail, it stores the sum of the image, of the exposure map, and the number of pixels in a series of quasi-sensibly defined annuli about the given center. From these we can simply compute the average counts per pixel or the average surface brightness in each annulus, or just look at the number of counts in each.
class Profile:
    def __init__(self, img, x0, y0, rmax, nbins=32):
        r2 = np.exp(np.linspace(0.0, np.log(rmax), nbins))
        r1 = np.concatenate(([0.0], r2[:-1]))
        N = np.zeros(r1.shape)
        E = np.zeros(r1.shape)
        npix = np.zeros(r1.shape)
        d = np.sqrt((img['flatx'] - x0)**2 + (img['flaty'] - y0)**2)
        for i in range(len(N)):
            j = np.logical_and(d >= r1[i], d < r2[i])
            N[i] += img['flatim'][j].sum()
            E[i] += img['flatex'][j].sum()
            npix[i] += j.sum()
        r = np.sqrt(r1 * r2)
        r[0] = np.sqrt(0.3 * r2[0]) # fiat
        j = np.flatnonzero(npix > 0) # divide by zero warnings are annoying
        self.r1 = r1[j]
        self.r2 = r2[j]
        self.r = r[j]
        self.N = N[j]
        self.E = E[j]
        self.npix = npix[j]
This gives us 3 potentially useful ways of looking at the data with respect to some reference point: the number of counts, the average counts per pixel, or the average surface brightness as a function of radius. Below, we see these 3 profiles, arbitrarily centered on the mean pixel position.
stupid_profile = Profile(data, data['flatx'].mean(), data['flaty'].mean(), 600.); # hopefully 600 is large enough for a maximum radius?
fig, ax = plt.subplots(1,3, figsize=(20.0, 4.0))
ax[0].loglog(stupid_profile.r, stupid_profile.N, '.');
ax[1].loglog(stupid_profile.r, stupid_profile.N/stupid_profile.npix, '.');
ax[2].loglog(stupid_profile.r, stupid_profile.N/stupid_profile.E, '.');
ax[0].set_ylabel('Total counts'); ax[1].set_ylabel('Average counts/pixel'); ax[2].set_ylabel('Average surface brightness');
for i in range(3): ax[i].set_xlabel('Radius (pixels)');
These plots might look very silly if the center of the profile is not actually near the center of the cluster. Normally, we'd expect to see the surface brightness decreasing monotonically with radius before flattening as the background becomes dominant. The important thing is that, finally, we have a way to compare the data and model straightforwardly. Which means that you can try out some different values, and narrow down on a set of parameters that are at least plausible. Use the cells below to do so for the single-beta-model case; each plot will include the beta model, the background, and their sum. You can use the image and the profiles above to inform initial guesses at some of them, before refining them.
# guess = {'x0':..., 'y0':..., 'S0':..., 'rc':..., 'beta':..., 'B':...}
guess_profile = Profile(data, guess['x0'], guess['y0'], 600.); # hopefully 600 is large enough for a maximum radius?
fig, ax = plt.subplots(1,3, figsize=(20.0, 4.0))
ax[0].loglog(guess_profile.r, guess_profile.N, '.');
ax[0].plot(guess_profile.r, betaModel(guess_profile.r, guess['S0'], guess['rc'], guess['beta'])*guess_profile.E + guess['B']*guess_profile.npix, '-', label='Total');
ax[0].plot(guess_profile.r, betaModel(guess_profile.r, guess['S0'], guess['rc'], guess['beta'])*guess_profile.E, '--', label='beta');
ax[0].plot(guess_profile.r, guess['B']*guess_profile.npix, '--', label='background');
ax[0].legend()
ax[1].loglog(guess_profile.r, guess_profile.N/guess_profile.npix, '.');
ax[1].plot(guess_profile.r, betaModel(guess_profile.r, guess['S0'], guess['rc'], guess['beta'])*guess_profile.E/guess_profile.npix + guess['B'], '-');
ax[1].plot(guess_profile.r, betaModel(guess_profile.r, guess['S0'], guess['rc'], guess['beta'])*guess_profile.E/guess_profile.npix, '--');
ax[1].plot(guess_profile.r, guess['B']+0*guess_profile.npix, '--');
ax[2].loglog(guess_profile.r, guess_profile.N/guess_profile.E, '.');
ax[2].plot(guess_profile.r, betaModel(guess_profile.r, guess['S0'], guess['rc'], guess['beta']) + guess['B']/guess_profile.E*guess_profile.npix, '-');
ax[2].plot(guess_profile.r, betaModel(guess_profile.r, guess['S0'], guess['rc'], guess['beta']), '--');
ax[2].plot(guess_profile.r, guess['B']/guess_profile.E*guess_profile.npix, '--');
ax[0].set_ylabel('Total counts'); ax[1].set_ylabel('Average counts/pixel'); ax[2].set_ylabel('Average surface brightness');
for i in range(3): ax[i].set_xlabel('Radius (pixels)');
Do inference for a single beta model + background¶
You are now on your own to sample the posterior of the above model (with one beta component) given your data.
Requirements:
- Produce equally weighted samples from the posterior and store them (after removing any burn-in and doing any thinning you feel necessary) in chains, in the form of multiple (at least 4) chains, as either a list of $N_\mathrm{samples} \times N_\mathrm{params}$ arrays, or a single $N_\mathrm{chains} \times N_\mathrm{samples} \times N_\mathrm{params}$ array (i.e., in one of the formats that incredible understands). This doesn't mean you necessarily have to use an MCMC method, but if you use some other method you must be able to extract results in the above format (even if it means artificially breaking samples into multiple "chains"). There will be cells below for plotting traces, and tests for convergence and a minimum number of effectively independent samples, that will assume this format, and that must be passed. Parameters should be ordered as in paramnames.
- "Approximate Methods" methods are not allowed.
- If your solution includes finding the posterior maximum, show profile plots for it like those above for the guess.
- Include
%%time
at the start of any cell that takes a while to run.
Suggestions:
- If/when writing a function to evaluate the log-posterior (and/or log-prior, log-likelihood), use the @njit decorator to squeeze some extra efficiency out of it. It's probably worth it here, and it's definitely worth learning how to use numba.
- njit aside, using a scipy distribution's logpdf method is (in this case) noticeably slower than directly coding the log PDF, especially if you leave out normalizing terms that don't depend on the model parameters. (See the sketch after this list for what that can look like.)
- The normalization and core radius parameters of the cluster model are strongly degenerate (this is well known among the clusteratti, and is related to preserving the total flux of the model; you might even have noticed it when refining your guess above). It's extremely common for the normalization to be parametrized by the log of $S_0$ rather than $S_0$ directly to reduce the degeneracy. (Don't forget that priors are not generally invariant under reparametrization.)
- Depending on what method you employ, it may be a good idea to find the posterior maximum before launching chains.
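To make the log PDF suggestion concrete, here is a minimal, entirely optional sketch of an njit-compiled Poisson log-likelihood with the parameter-independent $\log(N!)$ term dropped and the normalization handled as $\ln S_0$, as suggested above. It is not the solution (there are no priors here, and the parametrization and sampler are up to you); the function name and argument order are our own invention.

@njit
def lnlike_sketch(x0, y0, lnS0, rc, beta, B, flatim, flatex, flatx, flaty):
    # expected counts in each unmasked pixel: cluster surface brightness * exposure map + background
    r = np.sqrt((flatx - x0)**2 + (flaty - y0)**2)
    mu = betaModel(r, np.exp(lnS0), rc, beta) * flatex + B
    # Poisson log-likelihood summed over pixels, without the -log(N!) term
    return np.sum(flatim * np.log(mu) - mu)

You would call it with the flattened data arrays, e.g. lnlike_sketch(x0, y0, lnS0, rc, beta, B, data['flatim'], data['flatex'], data['flatx'], data['flaty']).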
Also note: the solutions are intentionally minimal and vague, since it's no fun if you all decide to just solve things exactly the way we did. This doesn't mean that you shouldn't add various checks of your work, even if you don't see them there. Anyway, here are a bunch of cells for your solution (you don't have to use all of them).
%%time
print("Here we are benchmarking a function that will be called many times.")
Here we are benchmarking a function that will be called many times.
CPU times: user 793 ms, sys: 6.18 ms, total: 799 ms Wall time: 804 ms
%%time
print("Here we are doing some kind of calculation.")
Here we are doing some kind of calculation.
CPU times: user 2.87 s, sys: 14 ms, total: 2.88 s Wall time: 2.89 s
%%time
print("Now we finally get samples from the posterior.")
Now we finally get samples from the posterior.
CPU times: user 8min 31s, sys: 4.17 s, total: 8min 35s Wall time: 8min 54s
Don't forget to check whatever diagnostics apply to your analysis.
Also, don't forget to coerce the results into the format described above.
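For example, if your sampler hands you a single $(N_\mathrm{total}, N_\mathrm{params})$ array after burn-in removal and thinning (here called samples, a hypothetical name), one way to artificially split it into 4 "chains" is:

nchains = 4
n = (samples.shape[0] // nchains) * nchains     # drop any leftover samples
chains = samples[:n].reshape(nchains, -1, samples.shape[1])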
Testing the single-beta fit¶
Welcome back! We will now look at standard diagnostics of the chains you stored in chains
.
fig, ax = plt.subplots(len(paramnames), 1, figsize=(20, len(paramnames)*3));
if chains.__class__ == list:
    cr.plot_traces(chains[:min(8,len(chains))], ax, labels=paramnames);
else:
    cr.plot_traces(chains[:min(8,chains.shape[0]),:,:], ax, labels=paramnames);
R = cr.GelmanRubinR(chains)
print("R =", R)
assert np.all(R < 1.1) # this is permissive, but fine for practice, I guess
R = [1.00906184 1.00228357 1.00263847 1.00343508 1.0057456 1.01370015]
maxlag = 750 # you might need to change this
neff = cr.effective_samples(chains, maxlag=maxlag, throw=True)
print("neff =", neff)
assert np.all(neff > 200) # this is not a lot, but fine for practice, I guess
neff = [695.34157466 659.57945742 613.12109672 604.57153732 618.27613321 723.61318041]
Assuming these tests were passed, we'll combine the chains and look at a triangle.
chain1 = np.concatenate(chains, axis=0)
plotGTC(chain1, paramNames=paramnames, figureSize=8, customLabelFont={'size':12}, customTickFont={'size':12});
Finally, let's compare a model representative of the peak of the posterior (hopefully the median will do) to the data in the form of a profile:
fitvec = np.median(chain1, axis=0)
fit = {p:v for p,v in zip(paramnames, fitvec)}
fit_profile = Profile(data, fit['x0'], fit['y0'], 600.); # hopefully 600 is large enough for a maximum radius?
plt.rcParams['figure.figsize'] = (6., 4.)
plt.loglog(fit_profile.r, fit_profile.N/fit_profile.E, '.');
plt.plot(fit_profile.r, betaModel(fit_profile.r, fit['S0'], fit['rc'], fit['beta']) + fit['B']/fit_profile.E*fit_profile.npix, '-', label='Total');
plt.plot(fit_profile.r, betaModel(fit_profile.r, fit['S0'], fit['rc'], fit['beta']), '--', label='beta');
plt.plot(fit_profile.r, fit['B']/fit_profile.E*fit_profile.npix, '--', label='background');
plt.ylabel('Average surface brightness');
plt.xlabel('Radius (pixels)');
plt.legend();
Is this model obviously deficient in some way, or does it look like a decent fit?
I_have_contemplated_this_deeply = False # change to True when true
assert I_have_contemplated_this_deeply
Do inference for a double beta model + background¶
Same as above, for a model with 2 beta components sharing the same center describing the cluster. Store the resulting samples in chains2
, with parameters ordered as in paramnames2
.
%%time
print("Doing something")
Doing something
CPU times: user 25.6 s, sys: 118 ms, total: 25.7 s Wall time: 25.8 s
%%time
print("Getting samples from the posterior")
Getting samples from the posterior
CPU times: user 37min 16s, sys: 15.4 s, total: 37min 32s Wall time: 38min 52s
Testing the double-beta fit¶
Welcome back! We will now look at the same diagnostics as before, for chains2
.
fig, ax = plt.subplots(len(paramnames2), 1, figsize=(20, len(paramnames2)*3));
if chains2.__class__ == list:
    cr.plot_traces(chains2[:min(8,len(chains2))], ax, labels=paramnames2);
else:
    cr.plot_traces(chains2[:min(8,chains2.shape[0]),:,:], ax, labels=paramnames2);
R = cr.GelmanRubinR(chains2)
print("R =", R)
assert np.all(R < 1.1) # see previous comment
R = [1.01007049 1.00990772 1.03011342 1.03870945 1.03788039 1.02453344 1.03833828 1.03903007 1.02631541]
maxlag = 750 # might need to change this
neff = cr.effective_samples(chains2, maxlag=maxlag, throw=True)
print("neff =", neff)
assert np.all(neff > 150) # see previous comment, but even more so
neff = [911.56116356 598.72063906 265.32221939 203.2590344 198.55110551 397.47457603 199.03412226 206.23140254 317.81870231]
Assuming these tests were passed, we'll combine the chains and look at a triangle.
chain2 = np.concatenate(chains2, axis=0)
plotGTC(chain2, paramNames=paramnames2, figureSize=12, customLabelFont={'size':12}, customTickFont={'size':12});
Finally, let's compare a model representative of the peak of the posterior (hopefully the median will do) to the data in the form of a profile, as well as to the single-beta model.
fitvec2 = np.median(chain2, axis=0)
fit2 = {p:v for p,v in zip(paramnames2, fitvec2)}
fit2_profile = Profile(data, fit2['x0'], fit2['y0'], 600.); # hopefully 600 is large enough for a maximum radius?
fig, ax = plt.subplots(1, 2, figsize=(12, 4));
ax[0].loglog(fit2_profile.r, fit2_profile.N/fit2_profile.E, '.');
ax[0].plot(fit2_profile.r, betaModel(fit2_profile.r, fit2['S0'], fit2['rc'], fit2['beta']) + betaModel(fit2_profile.r, fit2['S02'], fit2['rc2'], fit2['beta2']) + fit2['B']/fit2_profile.E*fit2_profile.npix, '-', label='Total');
ax[0].plot(fit2_profile.r, betaModel(fit2_profile.r, fit2['S0'], fit2['rc'], fit2['beta']), '--', label='beta1');
ax[0].plot(fit2_profile.r, betaModel(fit2_profile.r, fit2['S02'], fit2['rc2'], fit2['beta2']), '--', label='beta2');
ax[0].plot(fit2_profile.r, fit2['B']/fit2_profile.E*fit2_profile.npix, '--', label='background');
ax[0].set_ylabel('Average surface brightness');
ax[0].set_xlabel('Radius (pixels)');
ax[0].legend(); ax[0].set_title('Double-beta model');
ax[0].set_ylim(np.min(fit2_profile.N/fit2_profile.E)*0.1, None);
ax[1].loglog(fit_profile.r, fit_profile.N/fit_profile.E, '.');
ax[1].plot(fit_profile.r, betaModel(fit_profile.r, fit['S0'], fit['rc'], fit['beta']) + fit['B']/fit_profile.E*fit_profile.npix, '-', label='Total');
ax[1].plot(fit_profile.r, betaModel(fit_profile.r, fit['S0'], fit['rc'], fit['beta']), '--', label='beta1');
ax[1].plot(fit_profile.r, fit['B']/fit_profile.E*fit_profile.npix, '--', label='background');
ax[1].set_ylabel('Average surface brightness');
ax[1].set_xlabel('Radius (pixels)');
ax[1].legend(); ax[1].set_title('Single-beta model');
ax[1].set_ylim(np.min(fit_profile.N/fit_profile.E)*0.1, None);
Would you say the double-beta model is an improvement over the single-beta?
I_have_contemplated_this_also = False # change to True when true
assert I_have_contemplated_this_also
Quick and dirty model comparison¶
We'll finish by doing a quick comparison of the two models with the DIC, which you've computed in a previous tutorial. You will need a function to compute the log-likelihood, if you somehow managed to get this far without one (remember, the deviance is in terms of the log-likelihood, not the log-posterior). You can thin each chain to a length of 1000 for this part, to make things go faster.
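As a refresher (and only as a sketch), the DIC calculation can go along these lines, assuming a hypothetical loglike(theta) function that returns the log-likelihood for a parameter vector, and a thinned $(N_\mathrm{samples}, N_\mathrm{params})$ array samples for the model in question:

D = np.array([-2.0 * loglike(theta) for theta in samples])  # deviance of each sample
D_at_mean = -2.0 * loglike(samples.mean(axis=0))            # deviance at the posterior mean
pD = D.mean() - D_at_mean                                   # effective number of parameters
DIC = D_at_mean + 2.0 * pD                                  # equivalently, 2*D.mean() - D_at_mean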
# DIC1 = ...
# DIC2 = ...
print("DIC for single-beta:", DIC1)
print("DIC for double-beta:", DIC2)
DIC for single-beta: -379347.2511380915
DIC for double-beta: -381236.94055270386
Does the difference between DIC1
and DIC2
match your intuition above?
Parting thoughts¶
As advertised, this notebook hasn't really tested any statistical concepts that you haven't used before, but instead practiced them in a more complete (and more specifically astrophysical) context than we have mostly done up to now. If you're wondering, the analysis you did above is a slight improvement over what you'd find in most of the literature (where typically the cluster center is asserted and fixed, and the fit done to a 1D profile about it), while simultaneously not doing justice to the modeling of the X-ray background.
Because we're curious how they'll compare among the various data sets used by the class, below are the posterior means of the two models again, and the difference in DIC between them. Since we don't have any particular astrophysical question in mind, we will forgo calculating credible intervals and so on, this one time. You're welcome.
print(safe_dump({p:float(fit[p]) for p in fit.keys()}))
B: 0.05760377559837962
S0: 1.0913064031979797e-05
beta: 0.5523713419075944
rc: 4.297661488980443
x0: 481.2308121007575
y0: 552.9641413615096
print(safe_dump({p:float(fit2[p]) for p in fit2.keys()}))
B: 0.08224146654627448
S0: 1.060412887584387e-05
S02: 1.087409233494593e-06
beta: 1.051480053347683
beta2: 0.6754178792032468
rc: 6.3288677042804835
rc2: 17.851522070789038
x0: 481.24341164621484
y0: 553.016665909281
print("DIC1-DIC2:", DIC1-DIC2)
DIC1-DIC2: 1889.6894146123668
Total wall time for solutions: 49.0 min 4.447072744369507 sec!!!
Endnotes¶
Note 1¶
Using $\Delta$RA and $\Delta$Dec (or any global angular coordinates) in the Pythagorean Theorem is generally not correct, however, even for small distances. This is a whole thing that we will not delve further into, because geometry. Meditate upon the appearance of Antarctica in a Mercator projection if you doubt us.
Note 2¶
You know, like in a real programming language. Also, get off my lawn. Ok, I'm done.