In [None]:
# Reads in photometry from different sources, normalizes them, and puts them
# onto a BJD time scale

# Created 2021 Dec. 28 by E.S.

In [1]:
import numpy as np
import pandas as pd
from astropy.time import Time
import matplotlib.pyplot as plt
from sklearn.preprocessing import MinMaxScaler

%matplotlib qt

In [11]:
## USER INPUTS

# Photometry table to be read in
photometry_source_file = "rw_ari_asas3_vband_prepolished.txt"

# Scratch file that receives the bare epochs for the time conversion
# (generated as-we-go)
epoch_writeout_file = "junk_hjds_rw_ari.csv"

# Converted BJDs, to be read in after the manual correction
bjd_file = "rw_ari_asas3_bjd.csv"

# Destination filename for the polished photometry
writeout_polished_file = "rw_ari_asas3_vband_polished.txt"

In [3]:
# Root directory of the development notebooks; every other location below
# is built by appending a sub-directory (with trailing slash) to this stem.
stem_super = "/Users/bandari/Documents/git.repos/rrlyrae_metallicity/notebooks_for_development/"

# Sub-directories derived from the root
stem_moore_macadam = f"{stem_super}polished_macadam_moore_photometry/"
stem_public_sources = f"{stem_super}all_photometry_program_stars/polished/"
bjd_sources = f"{stem_super}all_photometry_program_stars/bjds/"

In [5]:
# read in photometry

# The source table is whitespace-delimited. `sep=r"\s+"` is the documented
# replacement for the deprecated `delim_whitespace=True` keyword and parses
# the file the same way.
df = pd.read_csv(stem_public_sources + photometry_source_file, sep=r"\s+")

In [6]:
# if there's a bunch of too-old stuff, remove it
#df = df.where(np.logical_and(df["JD"]>2456474-400,df["JD"]<2456474+400)).dropna(how="all").reset_index()
#df = df.where(df["JD"]<=2459238.567486600).dropna(how="all").reset_index()

In [7]:
# List the column labels of the freshly read table
df.columns

Index(['HJD', 'MAG_1', 'MAG_0', 'MAG_2', 'MAG_3', 'MAG_4', 'MER_1', 'MER_0',
       'MER_2', 'MER_3', 'MER_4', 'GRADE', 'FRAME'],
      dtype='object')

In [8]:
# Restore the full HJD by adding the 2450000 offset to the tabulated epochs
# (presumably the input stores HJD - 2450000 -- confirm against the source).
# The guard makes the cell safe to re-run: once the offset has been applied
# the values are no longer below it, so it is not added a second time.
HJD_OFFSET = 2450000
if (df["HJD"] < HJD_OFFSET).all():
    df["HJD"] = df["HJD"] + HJD_OFFSET

In [10]:
# write out only the epochs, for conversion
#
# The HJD column alone is written, one value per line, with neither a header
# row nor the index.
# (Disabled variant for tables with an "obsmjd" column: build
#  df["JD"] = obsmjd + 2400000.5 and write df["JD"] in the same way.)
df.loc[:, "HJD"].to_csv(
    epoch_writeout_file,
    header=False,
    index=False,
)

# at this point, do conversion step manually online

In [9]:
# FYI: location of Wichita (approx. center of U.S.)
# The values are kept inside a bare string literal, so nothing is assigned;
# the cell only echoes the string.

'''
lat_wichita = 37.688889
lon_wichita = -97.336111
'''

'\nlat_wichita = 37.688889\nlon_wichita = -97.336111\n'

# read bjds back in and tack onto the dataframe

In [12]:
# Read the converted epochs as a single column named "BJD" (the file is read
# without a header row), echo the path that was used, and attach the values
# to the photometry table by position.
bjd_path = bjd_sources + bjd_file
intermed_bjd = pd.read_csv(bjd_path, names=["BJD"])
print(bjd_path)

df["BJD"] = intermed_bjd.to_numpy()

# (index-based alternative, not used: df = df.join(intermed_bjd["BJD"]))

/Users/bandari/Documents/git.repos/rrlyrae_metallicity/notebooks_for_development/all_photometry_program_stars/bjds/rw_ari_asas3_bjd.csv


In [13]:
# Number of rows in the table after attaching the BJDs
df.shape[0]

399

In [14]:
# Display the table (now including the BJD column) for a visual check
df

Unnamed: 0,HJD,MAG_1,MAG_0,MAG_2,MAG_3,MAG_4,MER_1,MER_0,MER_2,MER_3,MER_4,GRADE,FRAME,BJD
0,2.452636e+06,11.880,11.989,99.999,99.999,99.999,0.029,0.047,0.022,0.023,0.024,C,32205,2.452636e+06
1,2.452645e+06,11.875,11.936,11.690,11.600,11.526,0.039,0.041,0.027,0.025,0.026,A,33529,2.452645e+06
2,2.452647e+06,11.894,12.018,11.717,11.605,11.503,0.032,0.038,0.022,0.022,0.023,A,33831,2.452647e+06
3,2.452654e+06,11.963,12.200,11.757,11.608,11.584,0.024,0.041,0.021,0.022,0.025,A,34704,2.452654e+06
4,2.452658e+06,11.771,11.856,11.639,11.576,11.559,0.032,0.041,0.029,0.030,0.033,A,35381,2.452658e+06
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
394,2.453669e+06,29.999,29.999,29.999,29.999,29.999,0.042,0.047,0.037,0.040,0.045,C,163830,2.453669e+06
395,2.454695e+06,29.999,29.999,29.999,29.999,29.999,0.035,0.039,0.028,0.030,0.035,C,282268,2.454695e+06
396,2.455024e+06,29.999,29.999,29.999,29.999,29.999,0.044,0.047,0.039,0.046,0.054,C,320730,2.455024e+06
397,2.453342e+06,12.180,12.274,11.873,11.664,11.593,0.047,0.078,0.040,0.041,0.045,B,122810,2.453342e+06


In [15]:
# in case of weird naming conventions
#
# The plotting and write-out cells further down read "Magnitude" and
# "Uncertainty" columns. When the table does not already provide them,
# alias the MAG_0 / MER_0 columns under those names. Each alias is created
# only if it is missing and its source column exists, so tables that already
# use the expected names pass through untouched and the cell can be re-run.
if "Magnitude" not in df.columns and "MAG_0" in df.columns:
    df["Magnitude"] = df["MAG_0"]
if "Uncertainty" not in df.columns and "MER_0" in df.columns:
    df["Uncertainty"] = df["MER_0"]

# look at the data, choose what we want

In [16]:
# Quick look: magnitude against BJD, drawn on the cleared current figure
plt.clf()
plt.scatter(x=df["BJD"], y=df["Magnitude"])
plt.show()

In [11]:
# Overplot the five MAG_* columns against BJD, one scatter series per column,
# in the order MAG_0 ... MAG_4
plt.clf()
for mag_column in ("MAG_0", "MAG_1", "MAG_2", "MAG_3", "MAG_4"):
    plt.scatter(df["BJD"], df[mag_column])
plt.show()

In [14]:
# Quick look at the "mag_autocorr" column against BJD
# (only valid for tables that carry that column)
plt.clf()
plt.scatter(x=df["BJD"], y=df["mag_autocorr"])
plt.show()

In [13]:
# Compare the JD (black) and BJD (blue) time axes for the V-band points;
# rows in other bands are masked to NaN by .where and so are not drawn.
plt.clf()
is_v_band = df["Band"] == "V"
v_band_mags = df["Magnitude"].where(is_v_band)
plt.scatter(df["JD"].where(is_v_band), v_band_mags, color="k")
plt.scatter(df["BJD"].where(is_v_band), v_band_mags, color="b")
plt.show()

In [18]:
# Show only the points whose "Observer Code" is "SAH"; all other rows are
# masked to NaN by .where and so are not drawn.
plt.clf()
from_sah = df["Observer Code"] == "SAH"
plt.scatter(
    df["BJD"].where(from_sah),
    df["Magnitude"].where(from_sah),
    color="k",
)
plt.show()

In [13]:
# List the column labels currently present in the table
df.columns

Index(['JD', 'Magnitude', 'Uncertainty', 'HQuncertainty', 'Band',
       'Observer Code', 'Comment Code(s)', 'Comp Star 1', 'Comp Star 2',
       'Charts', 'Comments', 'Transfomed', 'Airmass', 'Validation Flag',
       'Cmag', 'Kmag', 'HJD', 'Star Name', 'Observer Affiliation',
       'Measurement Method', 'Grouping Method', 'ADS Reference', 'Digitizer',
       'Credit', 'BJD'],
      dtype='object')

In [12]:
# Print the earliest and latest JD in the table
jd_epochs = df["JD"]
print(np.min(jd_epochs))
print(np.max(jd_epochs))

2439144.571
2459546.39706


In [11]:
# Number of rows in the table
df.shape[0]

30529

In [15]:
# Tally the number of rows per photometric band
# (raises KeyError for tables without a "Band" column)
band_labels = df["Band"]
band_labels.value_counts()

KeyError: 'Band'

In [16]:
# Tally the number of rows per observer code
# (raises KeyError for tables without an "Observer Code" column)
observer_codes = df["Observer Code"]
observer_codes.value_counts()

KeyError: 'Observer Code'

In [17]:
# choose photometric subset
#
# Alternative selections left in place for reference (not active):
#   df_subset_photo = df
#   df_subset_photo = df.where(np.logical_and(df["BJD"] > 2452456,df["Band"] == "V"))
#   df_subset_photo = df.where(np.logical_or(df["BJD"] < 2455109,df["BJD"] > 2455535))
#   df_subset_photo = df.where(df["Band"] == "V")

# Active selection: keep rows with MAG_0 below 20. DataFrame.where keeps every
# other row in place but fills it with NaN; those all-NaN rows are removed
# later, before the write-out.
is_usable_mag = df["MAG_0"] < 20
df_subset_photo = df.where(is_usable_mag)

In [18]:
# check to confirm: plot the selected subset (masked rows are NaN and so
# are not drawn)
plt.clf()
plt.scatter(x=df_subset_photo["BJD"], y=df_subset_photo["Magnitude"])
# alternative y-axis, not active: df_subset_photo["MAG_0"]
plt.show()

In [13]:
# Latest BJD remaining in the selected subset
subset_bjd = df_subset_photo["BJD"]
np.max(subset_bjd)

2456809.3022545683

In [14]:
# List the column labels of the selected subset
df_subset_photo.columns

Index(['index', 'JD', 'Magnitude', 'Uncertainty', 'HQuncertainty', 'Band',
       'Observer Code', 'Comment Code(s)', 'Comp Star 1', 'Comp Star 2',
       'Charts', 'Comments', 'Transfomed', 'Airmass', 'Validation Flag',
       'Cmag', 'Kmag', 'HJD', 'Star Name', 'Observer Affiliation',
       'Measurement Method', 'Grouping Method', 'ADS Reference', 'Digitizer',
       'Credit', 'BJD'],
      dtype='object')

# feature scale the photometry

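### Caution: the error bars cannot be scaled with the same transform as the magnitudes, since min-max scaling subtracts an offset in addition to rescaling (the errors should only be multiplied by the scale factor)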

In [29]:
# Disabled experiment, kept as an inert string literal (nothing in it runs):
# min-max scale the "Magnitude" column of the subset to the 0-to-1 range and
# store it as "mag_scaled".
'''
scaler = MinMaxScaler() # min-max mapped to 0-to-1
df_subset_photo[['mag_scaled']] = scaler.fit_transform(df_subset_photo[['Magnitude']])
# df_subset_photo[['error_scaled']] = scaler.transform(df_subset_photo[['Uncertainty']])
'''

In [21]:
# Disabled plot of the "mag_scaled" column against BJD, kept as an inert
# string literal (nothing in it runs).
'''
plt.scatter(df_subset_photo["BJD"],df_subset_photo["mag_scaled"])
plt.show()
'''

# write out as 'polished' photometry

In [None]:
# cols BJD, mag, error

In [19]:
# remove rows of all NaNs
# (only rows in which every column is NaN are dropped; partially filled
# rows are kept)

df_subset_photo_dropna = df_subset_photo.dropna(axis="index", how="all")

In [20]:
# write out only the relevant cols
# (BJD, magnitude and its uncertainty, without the index), then echo the
# destination path

polished_path = stem_public_sources + writeout_polished_file
polished_columns = ["BJD", "Magnitude", "Uncertainty"]
df_subset_photo_dropna.to_csv(polished_path, columns=polished_columns, index=False)
print(polished_path)

/Users/bandari/Documents/git.repos/rrlyrae_metallicity/notebooks_for_development/all_photometry_program_stars/polished/rw_ari_asas3_vband_polished.txt


In [16]:
# Echo the output filename currently held in the kernel.
# NOTE(review): the saved output of this cell shows a different filename than
# the one assigned under USER INPUTS, so the stored output looks stale --
# re-run to confirm.
writeout_polished_file

't_sex_asas3_vband_polished.txt'