In [29]:
import pandas as pd
import numpy as np

# Build the sub-sample written to data/AMUSING_CCSNe.dat: rows of the input
# table that have a redshift, whose SN type does not contain "Ia", and that
# fall below both the redshift cut-off and the offset cut-off.

# --- Configuration -----------------------------------------------------------
filename = 'data/AMUSINGSample.csv'
output_filename = 'data/AMUSING_CCSNe.dat'
redshift_cutoff = 0.01  # keep rows with z strictly below this value
offset_cutoff = 8       # keep rows with Offset strictly below this value

# A cell counts as "missing" only when it is entirely blank or entirely a dash
# placeholder such as '--'. The pattern is anchored on purpose: with a
# non-string replacement value, DataFrame.replace blanks the whole cell as soon
# as the regex matches anywhere in it, so an unanchored r'^\s+' or r'--' would
# also wipe real values that merely start with a space or contain '--'.
missing_pattern = r'^\s*(?:-{2,})?\s*$'

# Input column name -> short name used in the output table.
column_names = {
    'def_name': 'Host', 'SN_name': 'SN', 'SN_type': 'SNType',
    'redshift_amusing': 'z', 'type': 'GType', 'bt': 'bmag', 'e_bt': 'berr',
}
# Columns kept in the output, in display order (Offset is appended afterwards).
output_columns = ['Host', 'SN', 'SNType', 'GType', 'z', 'bmag', 'berr',
                  'RA_DSS', 'DEC_DSS', 'RA_SN', 'DEC_SN', 'offset_RA', 'offset_DEC']

# --- Load and normalise missing values ---------------------------------------
sample_raw = pd.read_csv(filename).replace(missing_pattern, np.nan, regex=True)

# --- Row selection on the raw columns ----------------------------------------
has_redshift = sample_raw['redshift_amusing'].notna()
# na=False is required: the placeholder clean-up above can leave NaN in
# SN_type, for which str.contains returns NaN by default, and negating that
# with `~` raises TypeError.
# NOTE(review): rows without an SN type are therefore kept (they do not contain
# "Ia"); drop them explicitly if untyped events must not reach the output.
is_type_ia = sample_raw['SN_type'].str.contains('Ia', case=False, na=False)

# --- Rename, trim and derive the combined offset -----------------------------
# Built as one chain so every step returns a fresh frame; assigning columns
# onto a slice of another frame would trigger SettingWithCopyWarning.
sample_clean = (
    sample_raw[has_redshift & ~is_type_ia]
    .sort_values(by='redshift_amusing')
    .rename(columns=column_names)
    .loc[:, output_columns]
    .astype({'offset_RA': 'float64', 'offset_DEC': 'float64'})
    # Offset is the Euclidean norm of the two offset components.
    .assign(Offset=lambda df: (df['offset_RA'] ** 2 + df['offset_DEC'] ** 2) ** 0.5)
)

# --- Apply the cut-offs and order the result ---------------------------------
# Comparisons with NaN are False, so rows with a missing offset are dropped here.
within_cuts = (sample_clean['z'] < redshift_cutoff) & (sample_clean['Offset'] < offset_cutoff)

# Primary key Offset, ties broken by SNType. A single multi-key sort is stable,
# so rows tied on both keys keep their redshift order instead of depending on
# an unstable intermediate sort.
data_df = sample_clean[within_cuts].sort_values(by=['Offset', 'SNType'])

data_df.to_csv(output_filename, sep='\t')
data_df

Unnamed: 0,Host,SN,SNType,GType,z,bmag,berr,RA_DSS,DEC_DSS,RA_SN,DEC_SN,offset_RA,offset_DEC
500,IC3476,SN1970A,II,Sm,0.000564,13.306,0.074,12:32:41.85,14:03:01.86,12:32:42,14:03:04,2.1924,2.13952
166,UGC7798,SN2007rw,II,I,0.006716,14.338,0.043,12:38:03.29,-02:15:50.42,12:38:04,-2:15:40,10.7106,10.42412
508,NGC4965,SN2000P,II,SABc,0.007542,12.785,0.202,13:07:09.38,-28:13:41.28,13:07:11,-28:14:03,24.3714,-21.7176
548,NGC4603,SN2008cn,II,SABc,0.008647,12.462,0.23,12:40:55.19,-40:58:034.9,12:40:55.66,-40:58:12.1,7.008,22.80428
181,IC4582,SN2006be,II,SBbc,0.008896,14.834,0.322,15:45:39.31,28:05:18.68,15:45:39,28:05:19,-4.5936,0.31864
186,UGC11214,SN2006ca,II,Sc,0.008903,15.0,0.5,18:22:53.22,12:25:46.74,18:22:54,12:26:03,11.727,16.2618
109,ESO319-G015,ASASSN14dp,II,Sm,0.009159,15.15,0.5,11:21:58.05,-37:54:03.63,11:21:58,-37:54:24,-0.7662,-20.37012
309,NGC3318,SN2017ahn,II,Sbc,0.009255,12.326,0.179,10:37:15.51,-41:37:039.2,10:37:17.450,-41:37:05.27,29.046,33.92872
493,NGC3120,SN2010F,II,SABb,0.00931,13.511,0.036,10:05:23.06,-34:13:12.05,10:05:21,-34:13:21,-30.9384,-8.94564
574,NGC7755,SN2004cx,II,Sc,0.009867,12.462,0.193,23:47:51.77,-30:31:19.43,23:47:52.86,-30:31:32.6,16.317,-13.17176


In [30]:
# Show the offset_RA column of data_df on its own.
data_df.loc[:, 'offset_RA']

500      2.1924
166     10.7106
508     24.3714
548      7.0080
181     -4.5936
186     11.7270
109     -0.7662
309     29.0460
493    -30.9384
574     16.3170
509      5.5170
496    -28.9020
501    -24.9018
498      6.8880
513     -5.8122
337    -15.8622
536      8.3238
495    -28.8942
503    147.2256
155     -2.6016
497      0.8316
296     36.4572
617    -30.8202
504     -2.3658
569    -21.5562
567     -7.5774
510    -22.2384
321     10.4232
132    -18.2586
583     -0.4098
285    113.7798
499     68.0490
514     28.1820
507     42.0804
167      8.8488
274      0.3966
265    -56.0016
534      2.2374
566      1.6584
502      4.9890
184      5.5410
568      3.7770
572      8.5524
280     -0.3798
545    -42.8994
301    103.7478
511    -15.7626
549    -15.6462
505     -1.3032
546    -42.8994
268     17.9988
512    -21.1482
494    -20.8650
506     23.6910
612     -3.3750
272     32.4384
Name: offset_RA, dtype: float64