In [1]:
import pandas as pd
import numpy as np

from os import path

In [2]:
# Configuration: data location and which download of the tables to use.

# Directory holding the CKS data files.
# Alternative location used on another machine:
#   "~/Scarlett/OneDrive - Liverpool John Moores University/SEPHI_data/CKS/"
data_dir = "~/OneDrive/SEPHI_data/CKS/"

# Date stamp embedded in the input/output file names
# (a previous download used "2022_04_13").
data_date = "2022_04_28"

# Number of leading lines skipped when the confirmed-names CSV is read.
# NOTE(review): this value was noted for the 2022_04_13 file -- re-check it
# whenever data_date changes.
header_length = 8

In [3]:
# The Kepler Confirmed Names table can be found on the NASA Exoplanet Archive (NASA EA),
# under the tab Data -> Kepler Confirmed Names:
# https://exoplanetarchive.ipac.caltech.edu/cgi-bin/TblView/nph-tblView?app=ExoTbls&config=kep_conf_names

# Read in rosetta, skipping the header lines at the top of the downloaded CSV:
rosetta = pd.read_csv(path.join(data_dir, f"kep_conf_names_{data_date}.csv"), skiprows=header_length)
rosetta_len = rosetta["pl_name"].size

# Planet names in NEA format examples:
# KOI-13 b
# Kepler-10 c
# KIC 5095269 b

# Prefix the raw columns with pl_ (planet-level) or st_ (star-level) so it is
# clear which object each identifier refers to.
cols_renamed = {"kepler_name": "pl_kepler_name",
                "koi_name": "pl_koi_name",
                "kepid": "st_kepid"}

# Assign the result instead of renaming in place, so the cell does not mutate
# a frame it did not create.
rosetta = rosetta.rename(columns=cols_renamed)

# Creating new columns in rosetta that hold the identifiers in the same format
# that they are in in the NASA EA.

# Star's Kepler Input Catalogue number, e.g. 5095269 -> "KIC 5095269":
rosetta["st_kepid_NEA"] = "KIC " + rosetta["st_kepid"].astype(str)
# The planet's KIC name is the star's KIC name + the planet letter
# (last character of the Kepler name), e.g. "KIC 5095269 b":
rosetta["pl_kepid_NEA"] = rosetta["st_kepid_NEA"] + " " + rosetta["pl_kepler_name"].str[-1]

# Drop the trailing ".NN" planet suffix to get the star's KOI, e.g. "K00072.01" -> "K00072":
rosetta["st_koi_name"] = rosetta["pl_koi_name"].str[:-3]
# Strip the leading "K" and the zero padding, then add the "KOI-" prefix
# (letter O, matching the NEA example "KOI-13" above), e.g. "K00072" -> "KOI-72":
rosetta["st_koi_NEA"] = "KOI-" + rosetta["st_koi_name"].str[1:].str.lstrip("0").astype(str)

# Drop the planet letter (everything after the last space) to get the star names:
rosetta["st_kepler_name"] = rosetta["pl_kepler_name"].str.rsplit(" ", n=1, expand=True)[0]  # Kepler- star name
rosetta["st_name"] = rosetta["pl_name"].str.rsplit(" ", n=1, expand=True)[0]  # generic star name (that should be in the NASA EA)

# The pl_kepler_name and pl_name are unique to each planet and are listed for all confirmed planets

print("Rosetta:\n", rosetta)

Rosetta:
       st_kepid pl_koi_name pl_kepler_name       pl_name  st_kepid_NEA  \
0     11446443   K00001.01     Kepler-1 b      TrES-2 b  KIC 11446443   
1     11904151   K00072.01    Kepler-10 b   Kepler-10 b  KIC 11904151   
2     11904151   K00072.02    Kepler-10 c   Kepler-10 c  KIC 11904151   
3      6521045   K00041.02   Kepler-100 b  Kepler-100 b   KIC 6521045   
4      6521045   K00041.01   Kepler-100 c  Kepler-100 c   KIC 6521045   
...        ...         ...            ...           ...           ...   
2727   4035640   K01881.01   Kepler-995 b  Kepler-995 b   KIC 4035640   
2728   6205228   K01882.01   Kepler-996 b  Kepler-996 b   KIC 6205228   
2729  11758544   K01883.01   Kepler-997 b  Kepler-997 b  KIC 11758544   
2730  11413812   K01885.01   Kepler-998 b  Kepler-998 b  KIC 11413812   
2731   9549648   K01886.01   Kepler-999 b  Kepler-999 b   KIC 9549648   

        pl_kepid_NEA st_koi_name st_koi_NEA st_kepler_name     st_name  
0     KIC 11446443 b      K00001      K0

In [4]:
# Write the augmented rosetta table next to the input data, stamped with the
# same download date; the DataFrame index is not written.
rosetta_csv_path = path.join(data_dir, "rosetta_" + data_date + ".csv")
rosetta.to_csv(rosetta_csv_path, index=False)