In [1]:
import pandas as pd

In [2]:
# Load the gzip-compressed CSV into a DataFrame.
# The first 53 lines of the file are skipped, so the next line is parsed as
# the column header (presumably those lines are a descriptive preamble --
# TODO confirm against the data file).
df = pd.read_csv(
    filepath_or_buffer="kepler.csv.gz",
    skiprows=53,
)

In [3]:
# Preview a handful of identifying columns; max_rows=4 truncates the
# rendered table so only the first and last rows are printed.
cols = [
    'kepid',
    'kepoi_name',
    'kepler_name',
    'koi_disposition',
    'koi_score',
]
snippet = df.to_string(columns=cols, max_rows=4)
print(snippet)


         kepid kepoi_name   kepler_name koi_disposition  koi_score
0     10797460  K00752.01  Kepler-227 b       CONFIRMED      1.000
1     10797460  K00752.02  Kepler-227 c       CONFIRMED      0.969
...        ...        ...           ...             ...        ...
9562  10155286  K07988.01           NaN       CANDIDATE      0.092
9563  10156110  K07989.01           NaN  FALSE POSITIVE      0.000


In [4]:
# List every column label in the dataframe. As the last expression in the
# cell, the resulting Index is displayed as the cell's output.
df.columns

Index(['kepid', 'kepoi_name', 'kepler_name', 'koi_disposition',
       'koi_pdisposition', 'koi_score', 'koi_fpflag_nt', 'koi_fpflag_ss',
       'koi_fpflag_co', 'koi_fpflag_ec', 'koi_period', 'koi_period_err1',
       'koi_period_err2', 'koi_time0bk', 'koi_time0bk_err1',
       'koi_time0bk_err2', 'koi_impact', 'koi_impact_err1', 'koi_impact_err2',
       'koi_duration', 'koi_duration_err1', 'koi_duration_err2', 'koi_depth',
       'koi_depth_err1', 'koi_depth_err2', 'koi_prad', 'koi_prad_err1',
       'koi_prad_err2', 'koi_teq', 'koi_teq_err1', 'koi_teq_err2', 'koi_insol',
       'koi_insol_err1', 'koi_insol_err2', 'koi_model_snr', 'koi_tce_plnt_num',
       'koi_tce_delivname', 'koi_steff', 'koi_steff_err1', 'koi_steff_err2',
       'koi_slogg', 'koi_slogg_err1', 'koi_slogg_err2', 'koi_srad',
       'koi_srad_err1', 'koi_srad_err2', 'ra', 'dec', 'koi_kepmag'],
      dtype='object')

In [5]:
# Render only the chosen columns as text, truncated to 4 rows:
cols = [
    'kepid', 'kepoi_name', 'kepler_name',
    'koi_disposition', 'koi_score',
]
preview = df.to_string(columns=cols, max_rows=4)
print(preview)

         kepid kepoi_name   kepler_name koi_disposition  koi_score
0     10797460  K00752.01  Kepler-227 b       CONFIRMED      1.000
1     10797460  K00752.02  Kepler-227 c       CONFIRMED      0.969
...        ...        ...           ...             ...        ...
9562  10155286  K07988.01           NaN       CANDIDATE      0.092
9563  10156110  K07989.01           NaN  FALSE POSITIVE      0.000


In [6]:
# Keep only the rows whose 'koi_disposition' is CONFIRMED and whose
# 'koi_score' is exactly 1.0, then preview a few columns of the result.
# Note: the preview lists 'koi_pdisposition', not the 'koi_disposition'
# column that the filter tests, so the printed values need not read CONFIRMED.
cols = [
    'kepid',
    'kepoi_name',
    'kepler_name',
    'koi_pdisposition',
    'koi_score',
    'koi_period',
]
is_confirmed = df["koi_disposition"].eq("CONFIRMED")
has_top_score = df["koi_score"].eq(1.0)
df_confirmed = df[is_confirmed & has_top_score]
print(df_confirmed.to_string(columns=cols, max_rows=4))


         kepid kepoi_name    kepler_name koi_pdisposition  koi_score  koi_period
0     10797460  K00752.01   Kepler-227 b        CANDIDATE        1.0    9.488036
4     10854555  K00755.01   Kepler-664 b        CANDIDATE        1.0    2.525592
...        ...        ...            ...              ...        ...         ...
7612  11125797  K03371.02  Kepler-1482 b        CANDIDATE        1.0   12.253843
8817   7350067  K06863.01  Kepler-1646 b        CANDIDATE        1.0    4.485592


In [7]:
# Show every column up to and including 'koi_score'
# (a .loc label slice keeps its end label):
leading_cols = df.loc[:, :'koi_score']
print(leading_cols.to_string(max_rows=4))


         kepid kepoi_name   kepler_name koi_disposition koi_pdisposition  koi_score
0     10797460  K00752.01  Kepler-227 b       CONFIRMED        CANDIDATE      1.000
1     10797460  K00752.02  Kepler-227 c       CONFIRMED        CANDIDATE      0.969
...        ...        ...           ...             ...              ...        ...
9562  10155286  K07988.01           NaN       CANDIDATE        CANDIDATE      0.092
9563  10156110  K07989.01           NaN  FALSE POSITIVE   FALSE POSITIVE      0.000


In [8]:
# Pick rows and columns in a single .loc call: the rows where both
# conditions hold, and the label-based column slice from 'kepid' through
# 'koi_score' (the end label is included in the slice).
cond1 = df["koi_disposition"].eq("CONFIRMED")
cond2 = df["koi_score"].eq(1.0)
row_mask = cond1 & cond2
df_interest = df.loc[row_mask, 'kepid':'koi_score']
print(df_interest.to_string(max_rows=4))

         kepid kepoi_name    kepler_name koi_disposition koi_pdisposition  koi_score
0     10797460  K00752.01   Kepler-227 b       CONFIRMED        CANDIDATE        1.0
4     10854555  K00755.01   Kepler-664 b       CONFIRMED        CANDIDATE        1.0
...        ...        ...            ...             ...              ...        ...
7612  11125797  K03371.02  Kepler-1482 b       CONFIRMED        CANDIDATE        1.0
8817   7350067  K06863.01  Kepler-1646 b       CONFIRMED        CANDIDATE        1.0
