Commit 2f8666e

Added script to compute apparent mags from ILAPHv3 instrumental photometry, accounting for phot dispersion, c20-c22 offset.
gnarayan committed Nov 16, 2017
1 parent 9ef4cd3 commit 2f8666e
Showing 1 changed file with 285 additions and 0 deletions.
@@ -0,0 +1,285 @@
#!/usr/bin/env python
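# Compute apparent magnitudes from ILAPHv3 instrumental photometry, accounting
# for photometric dispersion and the Cycle 20 - Cycle 22 offset. Each passband
# is fit with a hierarchical model (zeropoint, Cycle 20 offset, intrinsic
# dispersion, and Student-T dof) tied to the CALSPEC standards.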
import sys
import os
import glob
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.backends.backend_pdf import PdfPages
import seaborn as sns
import astropy.table as at
from numpy.lib.recfunctions import append_fields
from scipy.stats import linregress
import pymc3 as pm
import pandas as pd
from collections import OrderedDict

def main():
    ref = 'FMAG'   # which photometry package should be used to compute zeropoints
    mintime = 0.7  # minimum exposure length to consider for computing zeropoints

    stars = ['GD-153', 'GD-71', 'G191B2B']      # what stars are standards
    marker = ['o', 'd', '*']                    # markers to use for each standard in plots
    use_stars = ['GD-153', 'G191B2B', 'GD-71']  # what stars are to be used to get zeropoints

    standard_mags_file = '../calspec_standards_WFC3_UVIS2_IR_vegamag.txt'  # standards' apparent magnitudes in each band
    smags = at.Table.read(standard_mags_file, format='ascii')
    smags = smags.to_pandas()
    smags.set_index('objID', inplace=True)


    # cut out some fields we do not need to make indexing the data frame a little easier
    dref = 'ERRMAG'
    drop_fields = ['X', 'Y', 'BCKGRMS', 'SKY', 'FITS-FILE']

    mag_table = OrderedDict()  # stores combined magnitudes and zeropoints in each passband
    all_mags = at.Table.read('../src/all+standardmeasures_C20_C22_ILAPHv3_AS.txt', format='ascii')
    mask = (all_mags[dref] < 0.5) & (np.abs(all_mags[ref]) < 50) & (all_mags['EXPTIME'] >= mintime)
    nbad = len(all_mags[~mask])
    print(all_mags[~mask])
    print("Trimming {:n} bad observations".format(nbad))
    all_mags = all_mags[mask]
    all_mags.rename_column('OBJECT-NAME', 'objID')
    all_mags.rename_column('FILTER', 'pb')
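    # flag observations taken at or before MJD 56700 - these get the Cycle 20
    # offset (c20off) applied in the model below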
    cycle_flag = [1 if x <= 56700 else 0 for x in all_mags['MJD']]
    cycle_flag = np.array(cycle_flag)
    all_mags['cycle'] = cycle_flag

    for pb in np.unique(all_mags['pb']):
        mask = (all_mags['pb'] == pb)
        mag_table[pb] = all_mags[mask].to_pandas()

    # init some structure to store the results for each passband
    result_table = OrderedDict()
    # drop some fields we do not need from the results
    drop_fields = ['mc_error', 'hpd_2.5', 'hpd_97.5']
    # keep track of all objects
    all_objects = set()
    # and variable names
    var_names = ['zeropoint', 'c20_offset', 'sig_intrinsic', 'nu']
    nvar = len(var_names)

    # work on each passband in the table
    for i, pb in enumerate(mag_table):
        all_mags = mag_table[pb]
        mask = all_mags['objID'].isin(use_stars)

        # you could also exclude the standards from here
        # sample_mags = all_mags[~mask]
        sample_mags = all_mags

        # the standards are "special" - they have apparent magnitudes from a
        # model and are used to set the zeropoint for everything else
        standard_mags = all_mags[mask].copy()

        # what are the unique stars
        standards = standard_mags['objID'].unique()
        nstandards = len(standards)
        # map each star to an integer
        standard_ind = range(nstandards)
        standard_map = dict(zip(standards, standard_ind))
        # construct an index with the integer mapping for each star in the table
        standard_idx = [standard_map[x] for x in standard_mags['objID']]
        standard_mags['idx'] = standard_idx
        standard_idx = standard_mags['idx'].values
        standard_cycle_idx = standard_mags['cycle'].values

        # get the apparent magnitude corresponding to each standard measurement
        mag_app_i = np.array([smags.loc[x.replace('-', '').lower(), pb] for x in standards])
        # the zeropoint guess is just the average difference of the apparent mags and the instrumental mags
        zpt_est = np.average(mag_app_i[standard_idx] - standard_mags[ref])

        samples = sample_mags['objID'].unique()
        all_objects.update(samples)
        nsamples = len(samples)
        sample_ind = range(nsamples)
        sample_map = dict(zip(samples, sample_ind))
        sample_idx = [sample_map[x] for x in sample_mags['objID']]
        sample_mags['idx'] = sample_idx
        sample_idx = sample_mags['idx'].values
        sample_cycle_idx = sample_mags['cycle'].values
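        # Hierarchical model for this passband: each measured instrumental mag
        # is a Student-T draw centered on (apparent mag - zeropoint), with the
        # Cycle 20 offset subtracted for cycle-flagged measurements, and a
        # precision built from the reported error and an intrinsic dispersion
        # added in quadrature. The standards' apparent mags are fixed to the
        # CALSPEC values; the sample stars' apparent mags are free parameters.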

        with pm.Model() as hierarchical:
            # parameters for the intrinsic dispersion, zeropoint and Cycle 20 offset in each passband
            sig_int = pm.HalfCauchy('sig_{}'.format(pb), beta=1)
            zpt = pm.Normal('zpt_{}'.format(pb), mu=zpt_est, sd=1)

            if 1 in np.unique(sample_cycle_idx):
                c20off = pm.Normal('c20off_{}'.format(pb), mu=0, sd=1)
                c20flag = True
                n_plot_vars = nvar + 1
                out_vars = var_names.copy()
            else:
                c20flag = False
                n_plot_vars = nvar
                out_vars = var_names.copy()
                out_vars.remove('c20_offset')

            # a nuisance parameter for the DOF of the Student-T distribution in each passband
            nu = pm.HalfCauchy("nu", beta=5)

            # the actual uncertainty is the observed uncertainty and the intrinsic dispersion in quadrature
            full_var_i = (sig_int**2. + standard_mags[dref]**2.)
            full_var_j = (sig_int**2. + sample_mags[dref]**2.)

            # the instrumental magnitudes of the standards (i) are the apparent magnitudes minus the zeropoint
            mag_inst_i = mag_app_i[standard_idx] - zpt

            # create parameters for the apparent magnitudes of the sample stars - we want to infer these numbers
            mag_app_j = pm.Uniform('mag_app_{}_j'.format(pb), lower=8, upper=23, shape=nsamples)

            # the instrumental mags of the sample stars are the apparent magnitudes - the zeropoint
            if c20flag:
                mag_inst_j = mag_app_j[sample_idx] - sample_cycle_idx*c20off - zpt
            else:
                mag_inst_j = mag_app_j[sample_idx] - zpt

            # the likelihood of the zeropoint and dispersion given the standards' instrumental mags
            likelihood_sig_zpt = pm.StudentT('likelihood_sig_zpt', nu=nu, mu=mag_inst_i, lam=1./full_var_i, observed=standard_mags[ref])
            # the likelihood of the apparent mags and dispersion given the sample instrumental mags and applying the zeropoint
            likelihood_mag_sig = pm.StudentT('likelihood_mag_sig', nu=nu, mu=mag_inst_j, lam=1./full_var_j, observed=sample_mags[ref])
            likelihood = pm.math.concatenate([likelihood_mag_sig, likelihood_sig_zpt])

            # run the MCMC
            print("\n\nRunning {}".format(pb))
            trace = pm.sample(njobs=4, draws=15000, tune=5000, init='advi+adapt_diag')
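            # trace holds the posterior samples for the zeropoint, offset,
            # dispersion, nu, and the apparent mag of every sample star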

        # make a plot for sanity checking
        fig2, axs = plt.subplots(nrows=n_plot_vars, ncols=2)
        pm.traceplot(trace, ax=axs)
        fig2.savefig('htrace_ILAPHv3_{}.pdf'.format(pb))

        # get the results
        out = pm.df_summary(trace)
        nicenames = out_vars + samples.tolist()
        out['objID'] = nicenames
        out.set_index('objID', inplace=True)
        out.drop(drop_fields, axis=1, inplace=True)
        columns = {'mean': pb, 'sd': 'd'+pb}
        out.rename(columns=columns, inplace=True)
        result_table[pb] = out
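
    # combine the per-passband summary tables into a single results table,
    # ordered blue to red (F275W ... F160W)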
    out_pb_order = ['F275W', 'F336W', 'F475W', 'F625W', 'F775W', 'F160W']
    pbcolor = ['purple', 'blue', 'green', 'red', 'orange', 'black']
    out = None
    for pb in out_pb_order:
        this_pb = result_table.get(pb, None)
        if this_pb is None:
            continue

        if out is None:
            out = this_pb
        else:
            out = pd.concat([out, this_pb], axis=1)
    if out is None:
        message = 'No data was processed in any filter for any objects'
        raise RuntimeError(message)

    # sort the output rows
    sorter = var_names + sorted(list(all_objects))
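    # making objID categorical lets pandas sort the rows in the order given by
    # sorter: the fit parameters first, then objects alphabetically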
    objID = out.index.tolist()
    out['objID'] = objID
    out['objID'] = out['objID'].astype("category")
    out['objID'].cat.set_categories(sorter, inplace=True)
    out.sort_values(['objID'], inplace=True)
    objID = out.index.tolist()

    # just moves object ID to the first column
    cols = out.columns.tolist()
    cols = cols[-1:] + cols[:-1]
    out = out[cols]

    # convert to astropy table to pretty print output
    out = at.Table.from_pandas(out)

    name_map = at.Table.read('name_map.dat', names=['old', 'new'], format='ascii.no_header')
    name_map = dict(zip(name_map['old'], name_map['new']))
    print(name_map)
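    # normalize object IDs (truncate SDSS-J and WD designations, lowercase,
    # strip hyphens) so they match the keys in name_map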

    out2 = out.copy(copy_data=True)
    objID = out2['objID']
    for i, n in enumerate(objID):
        if n.startswith('SDSS-J'):
            n = n.split('.')[0].replace('-', '')
        elif n.startswith('WD'):
            n = n.replace('WD-', 'wd').split('-')[0].split('+')[0]
        else:
            pass
        n = n.lower().replace('-', '')
        n = name_map.get(n, n)
        out2['objID'][i] = n

    cols = out2.colnames
    for c in cols:
        if out2[c].dtype == np.float64:
            out2[c].format = '%.6f'
    print(out2)
    out2.write('ILAPHv3_phot.txt', format='ascii.fixed_width', delimiter=' ', overwrite=True, fill_values=['NaN',])

    objID = out['objID']
    nobj = len(objID[nvar:])
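    # make one page of light curves per object (ILAPHv3.pdf) and a combined
    # residual figure across all objects (ILAPHv3_combined.pdf)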

    fig_big = plt.figure(figsize=(12, 12))
    with PdfPages('ILAPHv3.pdf') as pdf:
        for j, obj in enumerate(objID[nvar:]):
            fig = plt.figure(figsize=(12, 12))
            for i, pb in enumerate(out_pb_order):
                thispb = mag_table[pb]

                mask = (thispb['objID'] == obj)
                if len(thispb[mask]) == 0:
                    message = 'No data for {}'.format(obj)
                    print(message)
                    continue

                ax = fig.add_subplot(3, 2, i+1)
                ax_big = fig_big.add_subplot(3, 2, i+1)

                time = thispb[mask]['MJD']
                mag = thispb[mask][ref]
                err = thispb[mask][dref]
                cycle = thispb[mask]['cycle']
                # rows 0-2 of out are the zeropoint, c20 offset and intrinsic dispersion (set by the sort above)
                zpt = out[0][pb]
                c20off = out[1][pb]
                if np.isnan(c20off) or pb == 'F275W':
                    c20off = 0.
                ax.errorbar(time, mag+zpt+c20off*cycle, yerr=err, color=pbcolor[i], linestyle='None', marker='o', ms=3)

                mask2 = (out['objID'] == obj)
                wmag = out[mask2][pb].data[0]
                werr = out[mask2]['d'+pb].data[0]
                sig_int = out[2][pb]

                xmin, xmax = ax.get_xlim()
                ax_big.errorbar(time, mag-wmag+zpt+c20off*cycle, yerr=err, color=pbcolor[i], linestyle='None', marker='o', ms=3, label='')

                ax.fill_between([xmin, xmax], wmag + sig_int, wmag - sig_int, color='lightgray', label='int disp')
                ax.fill_between([xmin, xmax], wmag+werr, wmag-werr, color='gray', label='uncert')
                ax.axhline(wmag, color=pbcolor[i], linestyle='--', lw=3, label='{:.3f}+/-{:.3f}, {:.3f}'.format(wmag, werr, sig_int))
                ax.legend(frameon=True, fontsize='x-small')
                ax.set_xlabel('MJD')
                ax.set_ylabel(pb)
                ax.invert_yaxis()
                if j == nobj-1:
                    xmin, xmax = ax_big.get_xlim()
                    ax_big.fill_between([xmin, xmax], sig_int, -sig_int, color='lightgray')
                    ax_big.axhline(0., color=pbcolor[i], linestyle='--', lw=3, label='N(0, {:.3f})'.format(sig_int))
                    ax_big.legend(frameon=False, fontsize='small')
                    ax_big.set_xlabel('MJD')
                    ax_big.set_ylabel(pb)
                    ax_big.invert_yaxis()
            fig.suptitle(obj)
            fig.tight_layout()
            pdf.savefig(fig)
            plt.close(fig)
    fig_big.tight_layout()
    fig_big.savefig('ILAPHv3_combined.pdf')
    plt.close(fig_big)









if __name__ == '__main__':
    sys.exit(main())
