In [94]:
import numpy as np
import pandas as pd 
import astropy as ap
import matplotlib.pyplot as plt
from astropy.io import ascii

In [95]:
from scipy.stats import binned_statistic_dd
from scipy.stats import linregress
#from astroquery.mast import Catalogs
import mr_forecast as mr
pd.options.display.max_columns = 100
'''
note on mr_forecast: I replaced the Kipping & Chen function with the strictly analytical relationship implemented in Louie
et. al. 2018, which runs more quickly and for our purposes is sufficient. 

EXCEPT for planets with R > Rj 
''';

The goal of this notebook is to re-implement the matlab code written by Natalie in Python. The purpose is to select Tess planets for radial velocity follow-up with the Keck telescope in order to constrain their masses in preparation for further characterization with JWST. 

In [96]:
#Just getting the data - can use TESS or Barclay catalog 
#barclay catalog: https://arxiv.org/pdf/1804.05050.pdf
data_source = 'tess' #make this tess or barclay or exoplanet_archive
if data_source == 'tess':
    tess = pd.read_csv('toi_plus_list-2019-10-31.csv',delimiter=',',header=4)
    c = tess
if data_source == 'barclay':
    bc = ascii.read('barclay_2018_tess_catalog.txt')
    c = bc.to_pandas() #to generalize the use

In [97]:
#catalog_2 = star_df.dropna().merge(catalog,left_on='TICID',right_on='TIC ID').reset_index(drop=True)
#commented line above is when you need to do the MAST query
#star_info = pd.read_csv('TIC_wider_crossmatch.csv',delimiter=',',header=4)

#trying it now with a query to https://exofop.ipac.caltech.edu/tess/search.php for
#my TICID list, which returned fewer parameters but might be what I need 
if data_source == 'tess':
    star_info = pd.read_csv('TIC_star_info_oct_31_all.csv',delimiter=',',header=10)
    c['Stellar Mass'] = ((10**c['Surface Gravity Value']) * ((c['Star Radius Value']*6.9551e10)**2) 
                         / 6.67e-8 ) / 1.99e33 
    catalog_2 = pd.merge(c,star_info, left_on = 'TIC', right_on = 'Target')
    c2 = catalog_2.drop(columns=['TFOP SG1a','TFOP SG1b','TFOP SG2',\
                                'TFOP SG3','TFOP SG4','TFOP SG5','TFOP Master',\
                                'TOI Disposition'])
    c = c2.sort_values('Full TOI ID')

In [98]:
#naming all the variables, so it's easier to switch from bc to tess
#future note to self: better to just do all the below as functions, rather than hard-coding all the variables
#at the top; make this change when you've got some spare time

#note: might be easier to have a dictionary of keys, which I could then make calls to 
#by having functions accept the dictionary as input, rather than each key individually...
#not that it makes that much of a difference but it might clean things up a bit

if data_source == 'barclay':
    #rp = catalog['Planet-radius']
    #ms = catalog['Star-mass']
    #pp = catalog['Planet-period']
    #Ts = catalog['Star-teff']
    #ars = catalog['Ars'] #this is the semimajor axis of the orbit over the stellar radius
    #Jmag = catalog['Jmag']
    #Vmag = catalog['Vmag']
    #rs = catalog['Star-radius']
    #dec = catalog['DEdeg'] #declination
    #Fp = catalog['Insol']

    rp_key = 'Planet-radius'
    ms_key = 'Star-mass'
    pp_key = 'Planet-period'
    Ts_key = 'Star-teff'
    ars_key = 'Ars'
    Jmag_key = 'Jmag'
    Vmag_key = 'Vmag'
    rs_key = 'Star-radius'
    dec_key = 'DEdeg'
    Fp_key = 'Insol'
    
if data_source == 'tess':
    #rp = catalog['Planet Radius (R_Earth)']
    #ms = catalog['st_mass']  
    #pp = catalog['Period (days)']
    #Ts = catalog['Stellar Teff (K)']
    #ars = catalog['Ars'] #this is the semimajor axis of the orbit over the stellar radius
    #Jmag = catalog['Jmag']
    #Vmag = catalog['Vmag']
    #rs = catalog['Stellar Radius (R_Sun)']
    #dec = catalog['Dec (degrees)'] #declination
    #Fp = catalog['Planet Insolation (Earth flux)']
    
    rp_key = 'Planet Radius Value'
    ms_key = 'Stellar Mass' 
    pp_key = 'Orbital Period Value'
    Ts_key = 'Effective Temperature Value'
    ars_key = 'Ars'
    Jmag_key = 'J mag' #spaces in mags comes from the exofop catalog; remove space if getting info from MAST
    Vmag_key = 'V mag'
    rs_key = 'Star Radius Value' 
    dec_key = 'TIC Declination'
    Fp_key = 'Effective Stellar Flux Value'
    mp_key = 'pl_masses'
    mp_units = 'Earth'
    
    #below are the keys for exofop; above are from https://tev.mit.edu:8010/data/collection/193/ 
        #which I think is standard from here on out
    #rp_key = 'Planet Radius (R_Earth)'
    #ms_key = 'Stellar Mass' #the from MAST and a god awful name is 'mass'; change this! 
    #                                #it's "Stellar Mass (M_Sun)" from exofop which is much better
    #pp_key = 'Period (days)'
    #Ts_key = 'Stellar Eff Temp (K)'
    #ars_key = 'Ars'
    #Jmag_key = 'J mag' #spaces in mags comes from the exofop catalog; remove space if getting info from MAST
    #Vmag_key = 'V mag'
    #rs_key = 'Stellar Radius (R_Sun)' 
    #dec_key = 'Dec_y'
    #Fp_key = 'Planet Insolation (Earth Flux)'
    #mp_key = 'pl_masses'
    #mp_units = 'Earth'
    
if data_source == 'exoplanet_archive':
    
    rp_key = 'pl_radj' #FINISH FILLING THIS IN BELOW HERE 
    ms_key = 'st_mass'
    pp_key = 'pl_orbper'
    Ts_key = 'st_teff'
    ars_key = 'Ars'
    Jmag_key = 'st_j'
    Vmag_key = 'st_vj'
    rs_key = 'st_rad'
    dec_key = 'dec'
    Fp_key = 'pl_insol'

In [106]:
exoarch_keys = ['pl_rade','st_mass','pl_orbper','st_teff','Ars','st_j',
                'st_vj','st_rad','dec','pl_insol', 'pl_masse']
all_planets = pd.read_csv('transits_above_v14.csv',header=50)
ap = all_planets
known_planets = pd.DataFrame({
    rp_key : ap[exoarch_keys[0]],
    ms_key : ap[exoarch_keys[1]],
    pp_key : ap[exoarch_keys[2]],
    rs_key : ap[exoarch_keys[7]],
    Ts_key : ap[exoarch_keys[3]],
    Jmag_key : ap[exoarch_keys[5]],
    Vmag_key : ap[exoarch_keys[6]], 
    dec_key : ap[exoarch_keys[8]],
    Fp_key : ap[exoarch_keys[9]]
})

In [170]:
c

Unnamed: 0,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM
0,spoc,231663901,101.01,318.736981,-55.871780,12.35200,0.034000,1326.008874,0.000339,1.430401,0.000032,1.638765,0.026081,20452.531680,242.952330,1,WASP-46 b,4.48851,0.000000,1,0.860000,0.000000,13.145008,0.144216,1499.044062,5600.00,0.000,1193.379561,0.887868,False,2018-09-05T18:49:20+00:00,2019-10-18 15:52:34.879215+00:00,0.830108,231663901,318.737012,-55.871863,13.0430,11.753000,11.465000,11.401,5.840018,114.563927,73.743313,73.508642,225.320941,225.238184
1,spoc,149603524,102.01,87.139956,-63.988427,9.71600,0.018000,1326.078645,0.000099,4.411943,0.000005,3.776425,0.008533,13979.926188,30.580667,"6, 4, 3, 2, 1",WASP 62b,4.32092,0.000000,1,1.280000,0.000000,15.397243,0.032379,1370.000000,6280.00,0.000,586.130000,474.380950,,2019-05-07T17:42:37+00:00,2019-10-18 21:38:51.362543+00:00,1.250166,149603524,87.139821,-63.988329,10.2130,9.272000,9.008000,8.944,9.530047,-1.000000,-0.336560,-0.335582,-51535.193810,-49126.637384
2,spoc,336732616,103.01,312.457438,-24.428796,11.46400,0.018000,1327.252560,0.000586,3.547854,0.000149,3.494333,0.049205,10424.371800,123.359314,1,HATS-3,4.22896,0.000000,1,1.400000,0.000000,14.581841,0.196435,1504.858953,6351.00,0.000,1212.004376,0.800299,False,2018-09-05T18:49:20+00:00,2019-10-17 00:41:47.999819+00:00,1.210163,336732616,312.457488,-24.428694,12.4330,10.980000,10.719000,10.694,7.453489,-1.000000,-0.369856,-0.368782,-19055.755108,-19048.757339
3,spoc,231670397,104.01,319.949611,-58.148876,9.84800,0.018000,1327.673462,0.000842,4.087445,0.000239,5.590140,0.066407,3586.196984,48.804030,1,WASP-73,3.93359,0.000000,1,2.070000,0.000000,12.652102,0.221452,1630.958624,6036.00,0.000,1672.217546,0.808662,False,2018-09-05T18:49:20+00:00,2019-10-17 00:41:44.380089+00:00,1.340166,231670397,319.949697,-58.148933,10.4680,9.352000,9.073000,9.028,5.731649,107.357157,35.385488,35.276972,121.649024,121.604361
4,spoc,144065872,105.01,337.457199,-48.003087,9.48000,0.020000,1326.505990,0.000156,2.184659,0.000023,2.869426,0.012752,11836.691220,46.940147,1,WASP-95,4.37759,0.000000,1,1.130000,0.000000,12.514586,0.056125,1429.144596,5630.00,0.000,985.883704,0.886027,False,2018-09-05T18:49:20+00:00,2019-10-17 00:41:47.471372+00:00,1.110132,144065872,337.457824,-48.003099,10.0920,8.936000,8.628000,8.564,6.494286,105.381037,48.525343,48.375095,427.125640,426.968786
5,spoc,38846515,106.01,68.959732,-64.027040,10.30700,0.019000,1326.745077,0.000179,2.849380,0.000006,3.776111,0.013790,7452.432687,25.309372,"5, 6, 4, 3, 2, 1",WASP-100b,4.43800,0.000000,1,1.000000,0.000000,9.061380,0.027050,1534.801917,6900.00,0.000,1311.385368,278.009500,False,2019-05-07T17:42:35+00:00,2019-10-18 21:38:49.609601+00:00,0.999143,38846515,68.959816,-64.027039,10.7980,9.928001,9.715000,9.669,8.458085,60.867410,27.519043,27.435704,243.777673,243.691392
6,spoc,92352620,107.01,313.783108,-34.135572,9.63900,0.019000,1328.299340,0.000307,3.950054,0.000088,4.557506,0.023461,12999.897180,75.694890,1,WASP-94A (planet host),4.18077,0.000000,1,1.620000,0.000000,18.775574,0.097373,1468.219722,6153.00,0.000,1098.209548,0.860200,False,2018-09-05T18:49:20+00:00,2019-10-17 00:41:41.077982+00:00,1.450200,92352620,313.783239,-34.135751,10.0510,9.159000,8.916000,8.874,7.349517,-1.000000,-0.316299,-0.315380,-68563.029674,-68537.860345
7,spoc,281459670,110.01,5.618692,-59.942551,11.63200,0.018000,1328.040464,0.000446,3.174305,0.000044,2.723339,0.030983,15603.693104,151.402710,"2, 1",HATS-30,4.42524,0.000000,1,1.060000,0.000000,13.668801,0.126250,1293.941810,5943.00,0.000,662.491006,100.352080,False,2018-11-14T15:06:55+00:00,2019-10-17 00:41:48.801418+00:00,1.090133,281459670,5.618525,-59.942589,12.2830,11.129000,10.826000,10.793,8.827728,122.432341,50.382232,50.224487,179.534322,179.468392
8,spoc,388104525,112.01,55.933440,-65.193856,11.54700,0.018000,1327.409380,0.000189,2.499814,0.000008,2.878017,0.016900,15044.681156,64.478970,"4, 3, 2, 1",,4.28867,0.000000,1,1.200000,0.000000,14.839843,0.082961,1433.107203,5650.00,0.000,996.863551,235.476910,,2019-05-07T17:42:43+00:00,2019-10-18 21:38:41.021876+00:00,1.020141,388104525,55.933639,-65.193780,12.3140,10.924000,10.612000,10.545,6.504389,-1.000000,-0.465773,-0.464420,-26714.894937,-26705.084385
9,spoc,97409519,113.01,332.714323,-30.749674,12.14300,0.018000,1327.053085,0.000623,3.372877,0.000147,2.634260,0.043644,17163.604190,212.405870,1,WASP-124,4.45061,0.000000,1,1.020000,0.000000,14.201803,0.154789,1270.187448,6050.00,0.000,615.165921,0.829214,False,2018-09-05T18:49:20+00:00,2019-10-17 00:41:47.624418+00:00,1.070134,97409519,332.714337,-30.749719,12.7240,11.650000,11.419000,11.310,9.493843,130.658709,53.345352,53.177288,157.365286,157.307494


In [107]:
def mass_getter(planet_data, rad_key, mass_key):
    planet_mass = np.zeros(len(planet_data[rad_key]))
    big_ones = planet_data[rad_key]>14.26 #i.e. too big for the empirical relation
    masked_ones = pd.isna(planet_data[mass_key])
    
    i = 0
    while i < len(planet_mass):
        if masked_ones[i] and not big_ones[i]:
            #if the entry is masked (i.e. zero) AND it's small, use the empirical relationship
            planet_mass[i] = (0.9718 * ((planet_data[rad_key][i])**3.58)) if planet_data[rad_key][i] < 1.23 \
            else (1.436 * ((planet_data[rad_key][i])**1.7)) #Earth Masses
        i+=1
        
    #planet_mass[np.logical_and(big_ones, masked_ones)] = \
    #    mr.Rpost2M(planet_data[rad_key][np.logical_and(big_ones, masked_ones)],unit='Earth')
    #for the entries which are masked and big, apply the statistical relationship
    
    planet_mass[np.logical_and(big_ones, masked_ones)] = 317.8 #anything really big is just Jupiter fck it lol
                                                                #it's outside our bin regime anyway
    
    planet_mass[~masked_ones] = planet_data[mass_key][~masked_ones]
    #for unmasked entries, take the existing values
    
    return np.round(planet_mass,4)

known_planets[mp_key] = mass_getter(ap,exoarch_keys[0],exoarch_keys[10])

In [108]:
def ars_from_t(period,star_mass,star_radius):
    '''
    period should be given in days; star mass and radius in
    terms of their value in solar units. These units seem
    to be pretty much standard across exoplanet databases
    so I have not implemented any sort of unit options
    in this function.
    '''
    G = 6.6726e-11
    Msun = 1.989e30
    Mstar = star_mass * Msun
    period_s = period * 86400
    a_m = (G*Mstar*(period_s**2) / (4 * (np.pi**2))) ** (1/3)
    star_radius_m = star_radius * 6.9551e8 #sun radius in m
    ars = a_m / star_radius_m
    #this value is correct for earth 
    return ars

known_planets[ars_key] = ars_from_t(known_planets[pp_key],known_planets[ms_key],known_planets[rs_key])

In [109]:
if data_source == 'tess':
    c = c[np.logical_and.reduce((c[rp_key]>0, c[pp_key]>0, c['Source Pipeline']=='spoc'))]
    c[ars_key] = ars_from_t(c[pp_key], c[ms_key], c[rs_key]) #because there is no ars data in the tess datafile
    c = c.reset_index(drop=True)

In [110]:
#Calculating Optimistic mass based on relation in Chen & Kipping 2016 (https://arxiv.org/pdf/1603.08614.pdf) and direct 
#empircal implementation by Louie et. al. 2018 (https://iopscience.iop.org/article/10.1088/1538-3873/aaa87b)
def m_from_r(radii):
    masses = np.zeros(len(radii))
    i = 0
    while i < len(radii):
        masses[i] = (0.9718 * (radii[i]**3.58)) if radii[i] < 1.23\
        else (1.436 * (radii[i]**1.7)) if radii[i] < 14.26\
        else -1
        #don't use this analysis for planets outside the neptune regime: return -1
        i += 1
    return masses

c[mp_key] = m_from_r(c[rp_key])

In [111]:
def k_amp_finder(star_mass,star_radius,planet_mass,ars,mp_units):
    '''
    finds the amplitude of stellar oscillations due to the planet's orbit 
    star_mass: units of m_sun
    star_radius: units of r_sun
    planet_mass: units of m_earth or m_jup (should be able to set "mp_units = mp_units" as that 
                                            variable is named higher up in the chain. Note "Earth"
                                            is capitalized, if you set this manually. 
    ars: ratio of semimajor axis and stellar radius. This is used as an input instead of a alone 
                        because a is often not directly available from these datasets. 
    '''
    
    G = 6.67e-11 #SI units
    Msun = 1.98e30 #kg
    Rsun = 6.9551e8 #meters
    v_star = np.sqrt(G*star_mass*Msun/(ars*star_radius*Rsun)) 
    #this is actually backwards
    
    mp_factor = 5.972e24 if mp_units == 'Earth' else 1.898e27
    v_pl = v_star * ((planet_mass*mp_factor)/(star_mass*Msun))
    
    return v_pl
    
c['K_amp'] = k_amp_finder(c[ms_key],c[rs_key],c[mp_key],c[ars_key],mp_units)

In [112]:
#mjupiter=1.898e27; #kg
#mearth=5.972e24; #kg
#
#kamp = 203*(T(:,22).^(-1/3)).*(plmass*mearth/mjupiter)./((T(:,16) + 9.548e-4*plmass*mearth/mjupiter).^(2/3));

def k_amp_natalie(period,planet_mass,star_mass):
    '''
    from https://exoplanetarchive.ipac.caltech.edu/docs/poet_calculations.html
    '''
    mjupiter=1.898e27 #kg
    mearth=5.972e24 #kg
    k_amp = 203 * (period**(-1/3)) * (planet_mass*mearth/mjupiter)\
                            / (((star_mass) + (9.548e-4 * planet_mass * mearth/mjupiter) ) ** (2/3))
    return k_amp

c['K_amp_n'] = k_amp_natalie(c[pp_key],c[mp_key],c[ms_key])

In [243]:
#c[['K_amp','K_amp_n']][np.logical_or(np.logical_and(c['K_amp_n'] < 2, c['K_amp'] > 2), \
#                                    np.logical_and(c['K_amp'] < 2, c['K_amp_n'] > 2))]
#with the updated data, our values DO differ for TOI 262.01

In [114]:
#Calculating Webb SNR Proxy
#taken from Kempton et. al. : https://arxiv.org/pdf/1805.03671.pdf
#note: implement "ars" and "mp" being "None" so there's an option for the
#function to calculate them internally, making it more generally applicable

def get_TSM(planet_radius,star_radius,star_teff,Jmag,planet_mass,ars):
    
    scale_factors = np.zeros(len(planet_radius))
    i = 0
    while i < len(planet_radius):
        #from Table 1 in Kempton et. al. 
        scale_factors[i] = 0.19 if planet_radius[i]<1.5\
        else 1.26 if np.logical_and(planet_radius[i]>1.5,planet_radius[i]<2.75)\
        else 1.28 if np.logical_and(planet_radius[i]>2.75, planet_radius[i]<4)\
        else 1.15
        i += 1
    
    Teq = star_teff * (np.sqrt(1/ars)*(0.25**0.25)) #eqn 3 in Kempton et. al <- this is how I calculated TSM
   
    #TSM is transmission spectroscopy metric
    TSM = scale_factors * (planet_radius**3) * Teq * (10**(-Jmag/5)) / (planet_mass * (star_radius**2))
    return TSM

c['TSM'] = get_TSM(c[rp_key],c[rs_key],c[Ts_key],c[Jmag_key],c[mp_key],c[ars_key])
known_planets['TSM'] = get_TSM(known_planets[rp_key],known_planets[rs_key],
                                        known_planets[Ts_key],known_planets[Jmag_key],
                                        known_planets[mp_key],known_planets[ars_key])

In [143]:
def get_Fp(ars,ts):
    teq = ts * (np.sqrt(1/ars) * (0.25**0.25))
    Fp = 4 * (np.sqrt(ars) * (teq/ts))
    return Fp

known_planets[Fp_key] = get_Fp(known_planets[ars_key],known_planets[Ts_key])

In [144]:
#Calculating Webb SNR Proxy
#taken from Kempton et. al. : https://arxiv.org/pdf/1805.03671.pdf
#note: implement "ars" and "mp" being "None" so there's an option for the
#function to calculate them internally, making it more generally applicable

def get_natalie_TSM(planet_radius,star_radius,star_teff,Jmag,planet_mass,insol_flux):
    
    scale_factors = np.zeros(len(planet_radius))
    i = 0
    while i < len(planet_radius):
        #from Table 1 in Kempton et. al. 
        scale_factors[i] = 0.19 if planet_radius[i]<1.5\
        else 1.26 if np.logical_and(planet_radius[i]>1.5,planet_radius[i]<2.75)\
        else 1.28 if np.logical_and(planet_radius[i]>2.75, planet_radius[i]<4)\
        else 1.15
        i += 1
    
    rsun=696265; #km
    au=149598000; #km
    albedo=0; #.3; %3; %0.1; Bond albedo
    rearth=6371; #km
    tsun=5777;
    Teq = (((insol_flux)*(1/4))**0.25)*np.sqrt(rsun/au)*tsun 
    
    #Teq/tsun = (fp/4)** 1/4 * np.sqrt(1/ars)
    #4 * (np.sqrt(ars) * teq/ts )^4

    #TSM is transmission spectroscopy metric
    TSM = scale_factors * (planet_radius**3) * Teq * (10**(-Jmag/5)) / (planet_mass * (star_radius**2))
    return TSM

c['nTSM'] = get_natalie_TSM(c[rp_key],c[rs_key],c[Ts_key],c[Jmag_key],c[mp_key],c[Fp_key])
known_planets['nTSM'] = get_natalie_TSM(known_planets[rp_key],known_planets[rs_key],
                                        known_planets[Ts_key],known_planets[Jmag_key],
                                        known_planets[mp_key],known_planets[Fp_key])

In [145]:
#desirables = np.logical_and.reduce((Jmag<12, Vmag<14, dec<20, catalog['K_amp']>2))
desirables = np.logical_and(c[dec_key]>-20, c['K_amp']>2)

#NOTE: maybe ought to change the dec key back to the normal one - the _x comes, again, from MAST

#jmag is webb limit, Kmag is keck limit, dec is to simulate fraction of catalog visible from keck, vs is k_amp for star

In [146]:
catalog_cleaned = c[desirables]#.drop_duplicates(subset='TOI') #removed for barclay catalog
cc = catalog_cleaned.reset_index(drop=True)

In [147]:
#cc.to_csv(path_or_buf=r'tess_data_with_ticid_info.csv',index=False);
#done so that I can just reload here instead of going through that 
#god awful loading of all the TICID info from MAST again. 

In [148]:
#cc = pd.read_csv('tess_data_with_ticid_info.csv')
id_key = 'Full TOI ID'
kp = known_planets
kp[id_key] = ap['pl_name']
cc2 = cc.append(kp, sort=False)

In [149]:
#defining new bins - as per Natalie
rad_bins = 10**(np.linspace(0,1,6))
fpl_bins = 10**(np.linspace(-1,4,6))
tef_bins = np.array([2500,3900,5200,6500])
all_bins = [rad_bins, fpl_bins, tef_bins]

def binning_function(dataset,bins,id_key,sort_val):
    
    rad_bins = bins[0]
    fpl_bins = bins[1]
    tef_bins = bins[2]

    pre_bin = dataset.assign(
        radius_bin = pd.cut(dataset[rp_key],bins=rad_bins,labels = [1,2,3,4,5]),
        insol_bin = pd.cut(dataset[Fp_key],bins=fpl_bins,labels = [1,2,3,4,5]),
        st_Teff_bin = pd.cut(dataset[Ts_key],bins=tef_bins,labels = [1,2,3])
    )
        #pd.cut returns the bin number (or label - ints chosen here for ease)
        #of each row based on its place within a specified column. 
    
    binned = pre_bin.dropna(subset=['radius_bin','insol_bin','st_Teff_bin']).groupby(['radius_bin',\
                                    'insol_bin','st_Teff_bin']).apply(lambda _pre_bin:\
                                    _pre_bin.sort_values(by=[sort_val],ascending=False)).reset_index(level = 3,drop=True)
                    #this multi-line call: 
                        #1) drops values which are not in any of the desired bins 
                        #2) groups within those bins
                        #3) sorts by TSM (the lambda thing is necessary because "groupby" produces a "groupby object"
                                #which can't be operated on normally)
                        #4) drops all indexes which are not the bin numbers, which were just 1 to N anyway and therefore
                                #were worthless 
    
    all_idx = binned.index.to_list()
    unique_idx = []
    for element in all_idx: 
        if element not in unique_idx:
            unique_idx.append(element)
    
    binned['priority'] = np.zeros(len(binned))
    for idx in unique_idx:
        
        bin_items = len(binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3].sort_values(Vmag_key)[id_key])
            #the number of objects in each bin
            
        if bin_items >= 3:
            binned.loc[binned[id_key] == binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3]\
                       .sort_values(Vmag_key)[id_key].iloc[0],'priority'] = 1
            binned.loc[binned[id_key] == binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3]\
                       .sort_values(Vmag_key)[id_key].iloc[1],'priority'] = 2
            binned.loc[binned[id_key] == binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3]\
                       .sort_values(Vmag_key)[id_key].iloc[2],'priority'] = 3
            continue
            
        elif bin_items == 2:
            binned.loc[binned[id_key] == binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3]\
                       .sort_values(Vmag_key)[id_key].iloc[0],'priority'] = 1
            binned.loc[binned[id_key] == binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3]\
                       .sort_values(Vmag_key)[id_key].iloc[1],'priority'] = 2
            continue
            
        elif bin_items == 1:
            binned.loc[binned[id_key] == binned.loc[idx].sort_values(sort_val,ascending=False).iloc[0:3]\
                       .sort_values(Vmag_key)[id_key].iloc[0],'priority'] = 1
    
        #this is a HIDEOUS call but the idea is: 
            #you are going into each bin sequentially (by index), sorting by TSM, then sorting those top 3 by Vmag. 
            #then, you are taking out the TOI value of the top entry there (i.e., highest priority)
            #THEN, you are indexing that TOI in the list, .loc'ing to that row and the priority column, and setting 
            #THAT entry to 1. Then repeating this for the other priority values 
            
            #all these if statements are a lot but unless I want to predefine 
            #how many are in each bin (?) I think this is the fastest way to go, and as long as 
            #TESS keeps its number of targets < 10^5 or something this shouldn't be unacceptably
            #long in terms of its run time 
    return binned

In [192]:
binned = binning_function(cc,all_bins,'Full TOI ID','TSM')
binned2 = binning_function(cc2,all_bins,'Full TOI ID','TSM')
#binned 2 is the one with the exoplanet archive included

In [227]:
#rewriting this to include ExoArch planets
my_tois_or = binned[binned['priority']==1].reset_index(drop=True)[id_key].values
np.sort(my_tois_or)

array([ 233.01,  238.01,  266.01,  390.01,  421.01,  455.01,  460.01,
        465.01,  507.01,  526.01,  532.01,  538.01,  560.01,  620.01,
        635.01,  638.01,  663.01,  680.01,  732.01,  732.02, 1135.01,
       1136.01, 1136.02, 1235.01, 1242.01, 1246.02, 1258.01, 1264.01,
       1268.01, 1278.01, 1285.01, 1339.01])

In [233]:
my_tois = binned2[binned2['priority']==1].reset_index(drop=True)[id_key].values
my_tois

array([455.01, 'HD 219134 c', 'K2-184 b', 732.01, 635.01, 'TOI 270 c',
       'HD 219134 b', 'pi Men c', 663.01, 1235.01, 1285.01, 238.01,
       266.01, 1242.01, 638.01, 233.01, 'K2-36 c', 'HD 3167 c', 620.01,
       560.01, 1339.01, 1246.02, 1136.02, 'GJ 3470 b', 'K2-39 b',
       'DS Tuc A b', 538.01, 532.01, 1136.01, 465.01, 1258.01, 680.01,
       1278.01, 'K2-141 c', 'HD 149026 b', 507.01, 1268.01, 421.01,
       460.01, 1264.01, 1135.01, 390.01], dtype=object)

In [223]:
binned2[binned2['priority']==1][['']]

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM,radius_bin,insol_bin,st_Teff_bin,priority,highestp
radius_bin,insol_bin,st_Teff_bin,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1
1,2,1,spoc,98796344.0,455.01,45.4642,-16.5934,8.64,0.018,1412.708786,0.00091,5.358807,0.000351,1.364837,0.188153,2498.079231,168.20534,4,two stars on the same pixel; could also be 987...,4.97389,0.060229,1.0,0.271,0.008,1.368307,0.364177,420.370338,3562.0,83.0,7.379879,13.6348,False,2019-02-08T19:54:07+00:00,2019-10-17 00:41:41.598875+00:00,0.252032,98796344.0,45.462478,-16.594496,10.59,7.294,6.774,6.496,30.046283,2.447183,2.245208,2.238639,43.269585,43.2537,1,2,1,1.0,1
1,2,2,,,HD 219134 c,,57.168354,,,,,6.76458,,,,,,,,,,,0.78,,1.511,,,4699.0,,2.828427,,,,,0.81,,,,5.57,3.981,,,17.993824,4.36,,,205.218714,94.686105,1,2,2,1.0,1
1,2,3,,,K2-184 b,,14.461936,,,,,16.995731,,,,,,,,,,,0.78,,1.55,,,5220.0,,2.828427,,,,,0.86,,,,10.345,8.92,,,33.92558,3.025,,,26.567025,15.151271,1,2,3,1.0,1
1,3,1,spoc,36724087.0,732.01,154.6464,-11.7167,10.534,0.058,1543.91148,0.001189,0.768418,6.7e-05,0.816472,0.266768,1252.849899,105.63316,9,,4.94957,0.423263,1.0,0.3,0.054,1.134371,0.573323,770.585234,3329.0,72.0,83.330451,11.443317,False,2019-06-06T16:40:58+00:00,2019-10-17 00:41:48.757745+00:00,0.292039,36724087.0,154.644903,-11.717801,13.14,9.007,8.439,8.204001,7.810036,1.52616,2.424886,2.417812,26.868814,26.858943,1,3,1,1.0,1
1,5,3,spoc,286132427.0,635.01,146.724705,-4.298086,8.07,0.018,1517.43594,0.001801,0.493379,7.7e-05,1.5,0.283602,194.341058,22.715282,8,could be on TIC 286132422,4.46485,0.254775,1.0,1.00635,0.112958,1.503946,0.944963,2338.398008,5914.0,191.0,7066.343282,8.047397,False,2019-04-23T16:40:29+00:00,2019-10-17 00:41:48.599394+00:00,1.076406,286132427.0,146.72453,-4.29824,8.69,7.511,7.217,7.18,2.676656,2.873752,2.21814,2.21168,118.437703,118.394182,1,5,3,1.0,1
2,2,1,,,TOI 270 c,,-51.956233,,,,,5.660172,,,,,,,,,,,0.38,,2.42,,,3386.0,,2.828427,,,,,0.4,,,,12.62,9.099,,,25.923003,6.4512,,,136.501757,104.9076,2,2,1,1.0,1
2,2,2,,,HD 219134 b,,57.168354,,,,,3.092926,,,,,,,,,,,0.78,,1.602,,,4699.0,,2.828427,,,,,0.81,,,,5.57,3.981,,,10.679295,4.74,,,292.018044,103.797894,2,2,2,1.0,1
2,2,3,,,pi Men c,,-80.469124,,,,,6.2679,,,,,,,,,,,1.1,,2.042,,,6037.0,,2.828427,,,,,1.09,,,,5.67,4.869,,,13.388338,4.82,,,227.954509,70.616039,2,2,3,1.0,1
2,3,1,spoc,54962195.0,663.01,160.0665,-8.5107,11.672,0.04,1544.390641,0.002789,2.598654,0.0005,1.618382,0.5309,1911.17085,202.56204,9,,4.76941,0.347691,1.0,0.502,0.075,2.224192,1.594181,669.63775,3719.0,64.0,47.520469,9.389264,False,2019-05-07T15:39:33+00:00,2019-10-17 00:41:50.340011+00:00,0.540064,54962195.0,160.065852,-8.511083,13.667,10.448,9.828,9.607,12.907422,5.58917,3.926915,3.915419,58.617063,58.595541,2,3,1,1.0,1
2,3,2,spoc,103633434.0,1235.01,152.215862,69.276546,9.91924,0.007276,1683.620171,0.003529,3.44374,0.000844,2.17072,0.240967,803.704126,71.32727,14,Potential level one candidate,4.62642,0.011406,1.0,0.629575,0.018704,2.142192,0.189739,703.516471,3912.0,157.0,57.891937,9.588445,,2019-10-17T00:30:12+00:00,2019-10-26 14:27:37.006010+00:00,0.611143,103633434.0,152.218255,69.27662,11.495,8.711,8.074,7.893,12.939461,5.243409,3.08858,3.07955,82.977973,82.947509,2,3,2,1.0,1


In [188]:
counter = 0
cut_tois = []
for old_toi in my_tois_or:
    if old_toi not in my_tois:
        print(old_toi)
        cut_tois.append(old_toi)

732.02
526.01


From the most recent sector:

TOI       Rp          Teq             J

1235.01   ~2.1        703             8.7

1242.01   ~1.8        1670            10.5

1246.02   ~2.8        955             10.3

1258.01   ~5.0        1059            8.6

1264.01   ~7.6        1154            9.6

1268.01   ~8.9        784             9.4

1278.01   ~9.3        408             10.6

1285.01   ~1.9        841             9.5

In [221]:
#binned.loc[2,2,2]

In [161]:
kp[kp[id_key] == 442.01]

Unnamed: 0,Planet Radius Value,Stellar Mass,Orbital Period Value,Star Radius Value,Effective Temperature Value,J mag,V mag,TIC Declination,Effective Stellar Flux Value,pl_masses,Ars,TSM,nTSM,Full TOI ID


In [43]:
c[np.round(c[id_key], 0) == 1339][[id_key,dec_key,pp_key,rp_key,Fp_key,'Planet Equilibrium Temperature (K) Value',
                                   Ts_key,Vmag_key,Jmag_key,'pl_masses','TSM','Public Comment']]
#so my k_amp and Natalie's are BOTH below 2! What the heck?? 
#okay, I suspect the rows error crept into Natalie's code somehow, because both of
#our formulae return K_amp = 1.72 for TOI 455.01. Either that, or there was a 
#typo when she copied the list into an email for me. 

Unnamed: 0,Full TOI ID,TIC Declination,Orbital Period Value,Planet Radius Value,Effective Stellar Flux Value,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,V mag,J mag,pl_masses,TSM,Public Comment
634,1339.01,66.850576,8.87923,3.2711,39.310145,638.0,5555.7,8.97,7.597,10.767972,132.785168,possible multi; some transits fell in gaps
635,1339.02,66.850576,11.062812,3.009164,73.910839,747.819495,5555.7,8.97,7.597,9.34356,110.712623,part of possible multi-planet system


In [57]:
#np.savetxt(fname='nicholas_target_list.txt',X=vecstr(my_tois),fmt='%s')
binned[np.round(binned[id_key], 0) == 1339]

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM,radius_bin,insol_bin,st_Teff_bin,priority
radius_bin,insol_bin,st_Teff_bin,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1
3,3,3,spoc,269701147,1339.02,302.023979,66.850576,8.293,0.006,1743.556395,0.001723,11.062812,0.002426,5.256185,0.250002,1063.67199,45.211372,16,part of possible multi-planet system,4.49,0.08,2,0.920435,0.046312,3.009164,0.496579,747.819495,5555.7,313.7,73.910839,19.837212,,2019-10-30 15:08,2019-10-31 17:16:04.111324+00:00,0.954144,269701147,302.025625,66.850301,8.97,7.597,7.215,7.18,22.353786,9.34356,2.771607,2.763497,110.712623,108.877386,3,3,3,1.0
3,3,3,spoc,269701147,1339.01,302.023979,66.850576,8.293,0.006,1741.996126,0.00253,8.87923,0.00082,3.007854,0.156,1257.358469,0.576369,16,possible multi; some transits fell in gaps,4.49,0.08,1,0.920435,0.1,3.2711,0.355049,638.0,5555.7,313.7,39.310145,18.521164,,2019-10-30 15:08,2019-10-31 17:37:02.538553+00:00,0.954144,269701147,302.025625,66.850301,8.97,7.597,7.215,7.18,19.305939,10.767972,3.43703,3.426962,132.785168,103.635648,3,3,3,2.0


In [55]:
print(binned[binned['priority']!=0].sort_values([id_key])[id_key].values)

[ 233.01  238.01  256.02  266.01  278.01  390.01  421.01  455.01  460.01
  461.01  465.01  469.01  482.01  485.01  506.01  507.01  516.01  519.01
  521.01  526.01  529.01  532.01  538.01  543.01  544.01  560.01  561.02
  564.01  620.01  634.01  635.01  638.01  654.01  663.01  663.02  669.01
  680.01  732.01  732.02  736.01  736.02 1135.01 1136.01 1136.02 1194.01
 1201.01 1235.01 1239.01 1242.01 1244.01 1246.02 1251.01 1254.01 1256.01
 1258.01 1260.01 1264.01 1268.01 1272.01 1274.01 1275.01 1276.01 1278.01
 1284.01 1285.01 1288.01 1289.01 1339.01 1339.02 1340.01]


In [25]:
natalie_tois = np.array([123.01,129.01,134.01,140.01,141.01,177.01,179.01,200.01,216.01,221.01,245.01,270.02,282.01,431.02,455.01,482.01,507.01,509.01,510.01,523.01,526.01,533.01,539.01,554.01,560.01,561.02,576.01,620.01,672.01,682.01,712.02,732.01,783.01,784.01,788.01,793.01,821.01,836.02,865.03])
'''
natalie_data = pd.read_csv('targetList.csv',names=['TICID','RA','DEC','Vmag','Tmag','Jmag',
                                                   'st_teff','st_rad','period','pl_rade',
                                                   'Insol','teq','kamp','TSM'])
'''
#natalie_data
##binned2 = binning_function(cc,all_bins,'TICID')
#natalie_tics = binned2[binned2['priority']==1].reset_index(drop=True).sort_values(id_key)[id_key].values
natalie_tois

array([123.01, 129.01, 134.01, 140.01, 141.01, 177.01, 179.01, 200.01,
       216.01, 221.01, 245.01, 270.02, 282.01, 431.02, 455.01, 482.01,
       507.01, 509.01, 510.01, 523.01, 526.01, 533.01, 539.01, 554.01,
       560.01, 561.02, 576.01, 620.01, 672.01, 682.01, 712.02, 732.01,
       783.01, 784.01, 788.01, 793.01, 821.01, 836.02, 865.03])

In [26]:
binned[np.round(binned[id_key],0) == 732]

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM,radius_bin,insol_bin,st_Teff_bin,priority
radius_bin,insol_bin,st_Teff_bin,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1
1,3,1,spoc,36724087,732.01,154.6464,-11.7167,10.534,0.058,1543.91148,0.001189,0.768418,6.7e-05,0.816472,0.266768,1252.849899,105.63316,9,,4.94957,0.423263,1,0.3,0.054,1.134371,0.573323,770.585234,3329.0,72.0,83.330451,11.443317,False,2019-06-06T16:40:58+00:00,2019-10-17 00:41:48.757745+00:00,0.292039,36724087,154.644903,-11.717801,13.14,9.007,8.439,8.204001,7.810036,1.52616,2.424886,2.417812,26.868814,26.858943,1,3,1,1.0
2,2,1,spoc,36724087,732.02,154.6464,-11.7167,10.534,0.058,1546.848329,0.001409,12.254218,0.002019,1.361689,0.33205,3416.662447,283.4698,9,,4.94957,0.423263,2,0.3,0.054,1.785398,0.730371,306.143276,3329.0,72.0,2.075964,11.924323,False,2019-06-06T16:40:58+00:00,2019-10-17 00:41:48.764789+00:00,0.292039,36724087,154.644903,-11.717801,13.14,9.007,8.439,8.204001,49.481755,3.846839,2.428282,2.42116,109.497802,109.457586,2,2,1,1.0


In [50]:
binned[binned['Planet Equilibrium Temperature (K) Value'] < 373]

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM,radius_bin,insol_bin,st_Teff_bin,priority
radius_bin,insol_bin,st_Teff_bin,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1
2,2,1,spoc,181804752,736.01,165.6915,-16.4062,13.508,0.059,1546.508996,0.001156,4.99007,0.000444,1.150579,0.162682,17848.071663,1087.5365,9,,5.14315,0.410207,1,0.15,0.026,2.019085,0.426467,301.705315,2940.0,67.0,1.958181,17.659561,False,2019-06-06T16:40:58+00:00,2019-10-17 00:41:44.919807+00:00,0.114015,181804752,165.690484,-16.406444,16.91,11.559,10.993,10.644,39.737065,4.741516,7.559481,7.53688,156.375608,156.318197,2,2,1,3.0
2,2,1,spoc,43064903,1276.01,302.667462,40.668998,12.5405,0.007423,1712.548761,0.004739,6.264298,0.002524,2.389982,0.306185,9097.780143,1337.178,15,Potential L1 candidate; could be 3 x period.,5.04431,0.022945,1,0.211257,0.006205,2.337752,0.27781,328.99879,3145.0,157.0,2.768842,8.720192,,2019-10-17T00:30:12+00:00,2019-10-17 00:41:43.950911+00:00,0.180119,43064903,302.669134,40.668628,15.48,10.795,10.216,9.941,38.240158,6.082915,6.62773,6.608018,147.869181,147.814881,2,2,1,2.0
2,2,1,spoc,36724087,732.02,154.6464,-11.7167,10.534,0.058,1546.848329,0.001409,12.254218,0.002019,1.361689,0.33205,3416.662447,283.4698,9,,4.94957,0.423263,2,0.3,0.054,1.785398,0.730371,306.143276,3329.0,72.0,2.075964,11.924323,False,2019-06-06T16:40:58+00:00,2019-10-17 00:41:48.764789+00:00,0.292039,36724087,154.644903,-11.717801,13.14,9.007,8.439,8.204001,49.481755,3.846839,2.428282,2.42116,109.497802,109.457586,2,2,1,1.0
2,2,1,spoc,429358906,782.01,183.9211,-18.9102,12.191,0.04,1577.042852,0.002817,16.047204,0.004003,1.709139,0.538583,4333.162901,548.91736,10,Low SNR,4.94964,0.399131,1,0.301,0.051,2.003358,0.982551,280.141151,3331.0,63.0,1.455555,8.467292,False,2019-06-11T20:03:40+00:00,2019-10-17 00:41:50.481317+00:00,0.294036,429358906,183.920361,-18.910338,14.83,10.675,10.108,9.86,59.164681,4.678903,2.68737,2.679473,53.628743,53.609056,2,2,1,0.0


In [70]:
mismatch_tois = []
counter = 0
for toi in natalie_tois:
    if toi in my_tois:
        counter += 1
    if toi not in my_tois:
        print(toi)
        mismatch_tois.append(toi)
print(counter)
#Many TICIDs of missing TOIs ARE in my star_data list (e.g. 154618248) 
#so I'm not sure how they got excluded from the other list
# - maybe K_amp differences? Investigate tomorrow

#okay, so, 140.01 HAS all the values, but in its bin, it's beaten by 408, 670, and 467, 
#MISSING: 455.01 (k_amp), 523.01 (no stellar mass)

140.01
455.01
523.01
533.01
561.02
620.01
672.01
682.01
31


In [56]:
pd.options.display.max_columns = 100
binned.loc[4,4,2]

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM,radius_bin,insol_bin,st_Teff_bin,priority
radius_bin,insol_bin,st_Teff_bin,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1
4,4,2,spoc,270380593,465.01,32.781778,2.418047,10.661,0.018,1414.135825,0.000701,3.836317,0.000229,2.389717,0.084547,5578.265805,120.81916,4,WASP-156,4.60108,0.0,1,0.76,0.0,5.63586,0.362515,887.523592,4910.0,0.0,146.636007,34.84919,False,2019-02-08T19:54:07+00:00,2019-10-17 00:41:48.053462+00:00,0.840108,270380593,32.782085,2.418194,11.559,9.906,9.473,9.339,12.807673,27.151059,12.478885,12.441807,132.982914,132.934096,4,4,2,1.0
4,4,2,spoc,417948359,1272.01,199.196626,49.861039,11.024,0.006,1713.031745,0.00178,3.315605,0.00048,1.530639,0.34,2598.870257,5.77319,15,,4.54,0.09,1,0.809032,0.02,4.101916,0.240595,979.479471,4972.7,61.9,217.521583,17.029032,,2019-10-17T00:30:12+00:00,2019-10-31 18:10:58.508431+00:00,0.827102,417948359,199.196204,49.861059,11.758,10.218,9.793,9.701,10.859881,15.820927,7.713569,7.690853,73.970664,74.196281,4,4,2,2.0


In [102]:
binned.loc[:,['TOI',rp_key,mp_key,Ts_key,'Comments','TSM','priority']][binned['TSM'] > 600].sort_values('TSM', ascending=False)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,TOI,Planet Radius (R_Earth),pl_masses,Stellar Teff (K),Comments,TSM,priority
radius_bin,insol_bin,st_Teff_bin,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
3,3,1,278.01,2.630575,7.434309,2955.0,possible dipper; not a planet candidate; Rstar...,647.611359,1.0
5,3,1,507.01,9.812343,69.689615,3338.0,V-shaped; large planet,634.688014,1.0


In [30]:
tess[tess[id_key] == 1252]

Unnamed: 0,Source Pipeline,TIC,Full TOI ID,TOI Disposition,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,TFOP Master,TFOP SG1a,TFOP SG1b,TFOP SG2,TFOP SG3,TFOP SG4,TFOP SG5,Alerted,Edited,Stellar Mass


In [25]:
#np.savetxt(fname='ticid_names_test.txt',X=tess[['TIC ID']],fmt='%d',header='TICID', delimiter=',')
tess['TIC'].to_csv('ticid_names_only_oct31.csv',header='False',index=False)

In [None]:
#look for ESM targets as well 
#alison stall wrote code to take candidates and output important diagnostics (from ephemerides)
#make sure data wrangling works so it's adaptable as new TOIs come out

#prioritize NIRSPEC questions bc Emily meeting (find other planets observed)
    
'''
re: NSF - crafting Webb legacy survey might be good. If you say - find TKS sample, that's not so interesting 
more broadly, science question is explore diversity of exoplanet atmospheres. 
Could invision picking off interesting targets w/ found masses and put in observing proposals 
Jonathan: can we identify disequilibrium processes in atmospheres - can learn how to recognize them (even in giant planets)
    and will be better positioned to find them in the future 
    Webb will be sending us data 2022 
    ERS sample (Webb exoplanet sample) might be good
    Study systematics; red noise; etc. in Webb? 
    SHOULD mention Keck observations; SHOULD mention ERS program; SHOULD mention NIRSPEC; SHOULD mention Webb 
        legacy survey
    NEED some kind of science question to answer; we don't necessarily understand what that is yet 
    Search for similar target with Webb
'''

In [398]:
def planck_microns(T,wavelength):
    '''
    note input is in microns! 
    '''
    c = 3e8 #m/s
    h = 6.626e-34
    kb = 1.38e-23
    wav_meters = wavelength / 1e6
    B = 2 * h * c / ((wav_meters**5) * (np.exp(h*c/(wav_meters * kb * T))-1))
    return B

def get_ESM(planet_teq, star_teff, planet_radius, star_radius, Kmag, rp_units = 'jupiter',rs_units='solar'):
    
    dayside_teq = 1.1 * planet_teq
    planet_b = planck_microns(dayside_teq,4)
    star_b = planck_microns(star_teff,4) #note: may want to use 7.5 instead of 4 since the prefactor in Kempton
                                            #is scaled based on the LRS bandpass for a specific planet
                                            #Although I should still get consistent *relative* ESM values. 
    
    if rp_units == 'earth':
        rp_m = 6.371e6 * planet_radius
    elif rp_units == 'jupiter':
        rp_m = 6.9911e7 * planet_radius
    if rs_units == 'solar':
        rs_m = 6.9551e8 * star_radius
    
    ESM = 4.29e6 * (planet_b / star_b) * ((rp_m/rs_m)**2) * (10**(-Kmag/5))
    
    return ESM

NOTE

TKS is using Teff < 6500, NAtalie 10^5, and Rstar < 5.5 
after this, want a file with prioritization 
want to prioritize all P = 1, 2, 3 targets 
       read in confirmed planets from exoplanet archive and compare quality 
       give priority to empty cells 
       give priority to p = 1 (of course) 
       naively, just sort by p; however, how to sort within priority 1? 
       i.e., is there anything better in a "cell" (bin) - how many? 
write out CSV file that could be read into excel. Include a bunch of stuff (P + S properties) 
    for P: R, P, Fp, Mp (if available - create binary value for "was it calculated or measured") 
        name: put name and alternate name (e.g. TOI xxx.xx, WASP-xx) 
        toggles: 0, 1 for "is Kepler, is K2, is TESS") 
    for S: logg, Rs, Vmag, Jmag, Teff, Rs
    also, TSM, ESM, priority, Kamp, numeric value for cell # 
    would be nice if we could look at the # and know immediately where it resides 
    do a three digit integer: want it as Rp, Fp, Teff (low to high) 
    there will be additional historical info and a comments field. Append new comments using | or ; 
        e.g.: "on TKS target list", "previously observed", "vetting status": on confluence, there was a list of criteria that 
           Theo was using related to this 
                could do something fancy, e.g. include links to vetting reports (TESS TOI working group does this when they 
                create spreadsheets; there are cells with links to vetting reports) 
        also want observability: e.g. Mar Apr May it has airmass above 2. (would put "MarAprMay" as "345") - I should think aby 
        this
    something like Theo's visibility plots (airmass as function of UT) - might put this as "mean hours per night as a function 
    of month"
    last thing: what if there are 5 confirmed planets in a cell, and they're all better than the TESS target? Or a new TESS 
    release demotes a formerly P = 1 target? I think a "highest lifetime priority" column might work. Could also do a string 
    which is a concatenation of all previous priorities (e.g. "1111111222222233000000" for something that's steadily getting 
    kicked off)
    Natalie wants to know if a target has been observed with RV measurements. Like, what's the quality of the RV signal (not 
    worry about that yet) 
For Webb: how many planets do we need in a bin? Maybe at least 4 (one for every epoch), maybe 3 (2/3 will be hazy?) maybe 12 (for both of those things)
Also: if we've already observed something for, like, 2 months, why on earth would we get rid of it?? 


In [207]:
vecint = np.vectorize(int)
vecstr = np.vectorize(str)
binned2['highestp'] = vecstr(vecint(binned2['priority']))
binned2.to_csv('test.csv')

In [214]:
test['highestp'] = np.core.defchararray.add(vecstr(test['highestp']), vecstr(vecint(test['priority'])))
test

Unnamed: 0,radius_bin,insol_bin,st_Teff_bin,Source Pipeline,TIC,Full TOI ID,TIC Right Ascension,TIC Declination,TMag Value,TMag Uncertainty,Orbital Epoch Value,Orbital Epoch Uncertainty,Orbital Period Value,Orbital Period Uncertainty,Transit Duration (hours) Value,Transit Duration (hours) Uncertainty,Transit Depth Value,Transit Depth Uncertainty,Sectors,Public Comment,Surface Gravity Value,Surface Gravity Uncertainty,Signal ID,Star Radius Value,Star Radius Uncertainty,Planet Radius Value,Planet Radius Uncertainty,Planet Equilibrium Temperature (K) Value,Effective Temperature Value,Effective Temperature Uncertainty,Effective Stellar Flux Value,Signal-to-noise,Centroid Offset,Alerted,Edited,Stellar Mass,Target,RA,Dec,V mag,J mag,H mag,K mag,Ars,pl_masses,K_amp,K_amp_n,TSM,nTSM,radius_bin.1,insol_bin.1,st_Teff_bin.1,priority,highestp
0,1,2,1,,,LTT 1445 A b,,-16.593372,,,,,5.358820,,,,,,,,,,,0.280000,,1.380000,,,3337.00,,2.828427,,,,,0.260000,,,,11.220,7.294000,,,29.383827,2.200000,,,43.816647,36.378947,1,2,1,3.0,33
1,1,2,1,spoc,98796344.0,455.01,45.464200,-16.593400,8.6400,0.0180,1412.708786,0.000910,5.358807,0.000351,1.364837,0.188153,2498.079231,168.205340,4,two stars on the same pixel; could also be 987...,4.97389,0.060229,1.0,0.271000,0.008000,1.368307,0.364177,420.370338,3562.00,83.0000,7.379879,13.634800,False,2019-02-08T19:54:07+00:00,2019-10-17 00:41:41.598875+00:00,0.252032,98796344.0,45.462478,-16.594496,10.590,7.294000,6.774,6.496,30.046283,2.447183,2.245208,2.238639,43.269585,43.253700,1,2,1,1.0,11
2,1,2,1,,,GJ 357 b,,-21.660797,,,,,3.930720,,,,,,,,,,,0.340000,,1.217000,,,3505.00,,2.828427,,,,,0.340000,,,,10.920,7.337000,,,21.522429,1.840000,,,29.320884,19.835707,1,2,1,2.0,22
3,1,2,1,spoc,92226327.0,256.02,11.247108,-15.271294,11.2380,0.0700,1389.293276,0.002136,3.778378,0.000784,1.028338,0.287900,3334.776030,300.731080,3,LHS-1140c,5.05701,0.000000,2.0,0.190000,0.000000,1.136554,0.410558,379.011837,3131.00,0.0000,4.876768,10.993547,False,2018-11-30T22:06:23+00:00,2019-10-31 19:59:43.339723+00:00,0.150019,92226327.0,11.248632,-15.274109,14.150,9.612001,9.092,8.821,28.557982,1.536701,2.238591,2.232038,24.907571,24.898423,1,2,1,0.0,00
4,1,2,1,,,K2-3 d,,-1.454787,,,,,44.559830,,,,,,,,,,,0.560000,,1.510000,,,3896.00,,2.828427,,,,,0.600000,,,,12.170,9.421000,,,79.686956,2.893400,,,19.263145,22.558741,1,2,1,0.0,00
5,1,2,1,,,TOI 270 b,,-51.956233,,,,,3.360080,,,,,,,,,,,0.380000,,1.247000,,,3386.00,,2.828427,,,,,0.400000,,,,12.620,9.099000,,,18.310434,2.089900,,,10.343866,6.681258,1,2,1,0.0,00
6,1,2,1,,,K2-129 b,,-25.644964,,,,,8.239493,,,,,,,,,,,0.360000,,1.040000,,,3459.09,,2.828427,,,,,0.360000,,,,13.630,9.697000,,,33.933435,1.118300,,,7.119070,6.127570,1,2,1,0.0,00
7,1,2,2,,,HD 219134 c,,57.168354,,,,,6.764580,,,,,,,,,,,0.780000,,1.511000,,,4699.00,,2.828427,,,,,0.810000,,,,5.570,3.981000,,,17.993824,4.360000,,,205.218714,94.686105,1,2,2,1.0,11
8,1,2,2,,,GJ 9827 b,,-1.286273,,,,,1.208982,,,,,,,,,,,0.600000,,1.577000,,,4340.00,,2.828427,,,,,0.610000,,,,10.250,7.984000,,,6.752549,4.910000,,,83.545392,25.566992,1,2,2,2.0,22
9,1,2,2,,,K2-141 b,,-1.189274,,,,,0.280324,,,,,,,,,,,0.680000,,1.510000,,,4599.00,,2.828427,,,,,0.710000,,,,11.389,9.086000,,,2.365449,5.080000,,,59.485545,10.167586,1,2,2,3.0,33


In [209]:
#don't make V cuts until after we rank them - then we can be aware of good targets that are dim / M dwarves
#could we make a graphic where each square had a name/TOI number, Vmag, Jmag, priority (for top few / bin)
#6 characters: e.g. gj1214 or k20018 
#flags in NASA ExoArch for IsKepler, IsK2, 
#should also add KOI and K2 candidate lists to this (those will not change so should just be a single thing)
    #those are on NASA ExoArch, they have their own tables
#make 5 pages (one for each Rp bin) with boxes for each bin containing the info above 
#relax Vmag to 16 so we can get M dwarf targets.
#add "does it have a mass already"
#some observability informations: e.g., what quarters it can be seen in

'ab'

More from Natalie: 

make sure that we're actually getting the Sector 14, 15, 16 targets (SPOC)