In [1]:
import numpy as np
import pandas as pd

# Read the full FPP results table; the first CSV column becomes the row index
# (later cells look rows up by labels such as 'K00368.01').
fpp_all = pd.read_csv(filepath_or_buffer='fpp_final_table.csv', index_col=0)

# Per-column tally of non-null entries.
fpp_all.notnull().sum()

koi.1                    8826
rprs                     8440
secthresh                8440
maxrad                   8440
pr_heb                   8145
pr_heb_Px2               8145
pr_eb                    8145
pr_eb_Px2                8145
pr_beb                   8145
pr_beb_Px2               8145
L_tot                    8148
fp                       8148
FPP                      8145
kepid                    8616
period                   8616
rp                       8321
disposition              8616
prob_ontarget            6786
pos_prob_score           7470
not_transitlike          8826
significant_secondary    8826
centroid_offset          8826
ephem_match              8826
MES                      7260
exception                 678
has_ttv                  8556
dtype: int64

In [40]:
from keputils.koiutils import koiname

# Column names assigned to the parsed table, in file order.
columns = ['kepid', 'koi', 'kepler_pl', 'period', 'depth', 'aR', 'Kp',
           'Teff', 'logg', 'feh', 'nature', 'reference']

# Cells in the .tex table are separated by '&' with optional surrounding
# whitespace.  The pattern is a raw string so that '\s' reaches the regex
# engine untouched, and engine='python' is named explicitly because the
# C parser cannot handle regex separators (pandas would otherwise warn and
# fall back on its own).
santerne = pd.read_table('TargetSelection.tex', delimiter=r'\s*&\s*',
                         names=columns, engine='python')

# Normalise every KOI identifier with keputils' `koiname` so that it can be
# used as a row label into `fpp_all`.
santerne['koi'] = santerne['koi'].apply(koiname)

# Attach the FPP of each KOI by label.  `reindex` replaces the removed `.ix`
# indexer and leaves NaN for any KOI that has no row in `fpp_all` instead of
# raising.
santerne['FPP'] = fpp_all['FPP'].reindex(santerne['koi']).values

In [41]:
# Preview the identifier, the classification and the attached FPP
# for the first few rows.
preview_cols = ['koi', 'nature', 'FPP']
santerne.loc[:, preview_cols].head()

Unnamed: 0,koi,nature,FPP
0,K00001.01,planet,0.0156
1,K00002.01,planet,2.09e-07
2,K00003.01,planet,8.34e-05
3,K00010.01,planet,8.45e-06
4,K00012.01,planet,0.015


Below are the summarized results of the `vespa` false positive probability (FPP) calculations for the KOI giant-planet sample presented in Santerne et al. (2015; arXiv:1511.00643v1), who find a 54.6 +/- 6.5% false positive rate in this sample.

In [50]:
# Mean and median FPP within each `nature` class.  The grouping is built
# once and reused for both statistics.  print() with a single parenthesised
# argument behaves the same on Python 2 and Python 3.
fpp_by_nature = santerne.groupby('nature')['FPP']
print(fpp_by_nature.mean())
print(fpp_by_nature.median())

nature
?         0.194506
BD        0.001406
CEB       0.666857
EB        0.776810
planet    0.106562
Name: FPP, dtype: float64
nature
?         0.002660
BD        0.000848
CEB       0.991000
EB        0.966500
planet    0.000242
Name: FPP, dtype: float64


In [46]:
# Mean FPP over the whole sample, regardless of `nature`.
santerne.loc[:, 'FPP'].mean()

0.41968902067324709

In [51]:
# Write the sample, including the attached FPP column, to disk.
santerne.to_csv(path_or_buf='santerne_sample_with_fpp.csv')

In [52]:
# Label rows by KOI name; the `koi` column itself is kept.
santerne.index = santerne['koi']

In [53]:
# Inspect a single KOI by row label.  `.loc` is the label-based indexer;
# `.ix` is deprecated and was removed in pandas 1.0.
santerne.loc['K00614.01']

kepid                              7368664
koi                              K00614.01
kepler_pl                             434b
period                              12.875
depth                                 0.43
aR           22.90$^{_{+1.20}}_{^{-1.20}}$
Kp                                    14.5
Teff            5926$^{_{+154}}_{^{-189}}$
logg          4.51$^{_{+0.04}}_{^{-0.24}}$
feh          -0.04$^{_{+0.20}}_{^{-0.30}}$
nature                              planet
reference                             Al15
FPP                                  0.529
Name: K00614.01, dtype: object

In [54]:
# Rows classified as planets whose FPP is nevertheless above 0.3.
is_planet = santerne['nature'] == "planet"
high_fpp = santerne['FPP'] > 0.3
santerne[is_planet & high_fpp]

Unnamed: 0_level_0,kepid,koi,kepler_pl,period,depth,aR,Kp,Teff,logg,feh,nature,reference,FPP
koi,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
K00377.01,3323887,K00377.01,9b,19.271,0.7,36.84$^{_{+4.30}}_{^{-4.30}}$,13.8,5779$^{_{+110}}_{^{-128}}$,4.49$^{_{+0.03}}_{^{-0.16}}$,0.12$^{_{+0.10}}_{^{-0.14}}$,planet,Ho10,0.994
K00377.02,3323887,K00377.02,9c,38.908,0.62,54.34$^{_{+5.60}}_{^{-5.60}}$,13.8,5779$^{_{+110}}_{^{-128}}$,4.49$^{_{+0.03}}_{^{-0.16}}$,0.12$^{_{+0.10}}_{^{-0.14}}$,planet,Ho10,1.0
K00614.01,7368664,K00614.01,434b,12.875,0.43,22.90$^{_{+1.20}}_{^{-1.20}}$,14.5,5926$^{_{+154}}_{^{-189}}$,4.51$^{_{+0.04}}_{^{-0.24}}$,-0.04$^{_{+0.20}}_{^{-0.30}}$,planet,Al15,0.529
K01426.02,11122894,K01426.02,297c,74.928,0.42,82.40$^{_{+14.90}}_{^{-14.90}}$,14.2,6150$^{_{+151}}_{^{-193}}$,4.42$^{_{+0.06}}_{^{-0.30}}$,-0.12$^{_{+0.22}}_{^{-0.30}}$,planet,Ro14,0.666
K01474.01,12365184,K01474.01,419b,69.727,0.46,45.17$^{_{+7.80}}_{^{-7.80}}$,13.0,6287$^{_{+106}}_{^{-153}}$,4.24$^{_{+0.10}}_{^{-0.18}}$,0.22$^{_{+0.14}}_{^{-0.20}}$,planet,Da14,0.993


In [55]:
# Full record for one KOI from the complete FPP table.  `.loc` is the
# label-based indexer; `.ix` is deprecated and was removed in pandas 1.0.
fpp_all.loc['K00368.01']

koi.1                         K00368.01
rprs                              0.084
secthresh                            40
maxrad                              0.6
pr_heb                         0.000192
pr_heb_Px2                     2.14e-22
pr_eb                            0.0221
pr_eb_Px2                      8.11e-25
pr_beb                         3.07e-06
pr_beb_Px2                     3.21e-31
L_tot                             3.672
fp                                0.055
FPP                              0.0223
kepid                           6603043
period                         110.3217
rp                             16.14879
disposition              FALSE POSITIVE
prob_ontarget                         1
pos_prob_score                        1
not_transitlike                   False
significant_secondary              True
centroid_offset                   False
ephem_match                       False
MES                            1688.579
exception                           NaN


In [57]:
import koiutils as ku

In [60]:
# Look up a candidate count for every KOI in the table via koiutils.
# NOTE(review): presumably get_ncands returns the number of candidates in the
# KOI's system -- confirm against koiutils.
n_cands = []
for k in fpp_all.index:
    try:
        n_cands.append(ku.get_ncands(k))
    except Exception:
        # Best effort: a failed lookup is recorded as missing.  Catching
        # Exception (not a bare `except:`) lets KeyboardInterrupt and
        # SystemExit still stop this loop.
        n_cands.append(np.nan)

fpp_all['n_cands'] = n_cands

In [62]:
# FPP summary statistics for rows with n_cands == 1 and a CANDIDATE disposition.
single_cand = fpp_all['n_cands'] == 1
is_candidate = fpp_all['disposition'] == "CANDIDATE"
fpp_all.loc[single_cand & is_candidate, 'FPP'].describe()

count    2402.000000
mean        0.215587
std         0.353618
min         0.000000
25%         0.000452
50%         0.012250
75%         0.253000
max         1.000000
Name: FPP, dtype: float64