# V5 of cleaning data
- drop any column with 50% or more nans
- still use ordinal data, 
- changed ordinal ranking scores
- drop zipcd,
- clean src_div_id, 
- no normalization for tree-based methods

In [1]:
import sys
print("Python version")
print (sys.version)

Python version
3.6.13 |Anaconda, Inc.| (default, Jun  4 2021, 14:25:59) 
[GCC 7.5.0]


In [2]:
import pandas as pd
import numpy as np

In [3]:
pd.set_option('display.max_columns', None)

## Load training set

In [4]:
train_df = pd.read_csv('data/2021_Competition_Training.csv', low_memory=False)
train_df = train_df.drop('Unnamed: 0', axis=1)
train_df = train_df.set_index('ID', drop=True)
train_df = train_df.replace({'*': np.nan})

In [5]:
y_name = ['covid_vaccination']

In [6]:
# put y in the first column
cols = list(train_df.columns)
cols.remove('covid_vaccination')
cols = y_name + cols

In [7]:
train_df = train_df[cols]

In [8]:
train_df.shape

(974842, 366)

In [9]:
train_df['covid_vaccination'].value_counts()

no_vacc    805389
vacc       169453
Name: covid_vaccination, dtype: int64

## Drop columns with >=50% nan

In [10]:
# check na numbers
for i in np.arange(0, 1, 0.1):
    print(f'{i:.1f}', train_df.dropna(axis=1, how='any', thresh=int(train_df.shape[0]*i)).shape)

0.0 (974842, 366)
0.1 (974842, 366)
0.2 (974842, 366)
0.3 (974842, 365)
0.4 (974842, 364)
0.5 (974842, 364)
0.6 (974842, 364)
0.7 (974842, 362)
0.8 (974842, 340)
0.9 (974842, 335)


In [10]:
for col in train_df.columns:
    if train_df[col].count() < int(train_df.shape[0]*0.5):
        print(col, f'has {(train_df.shape[0]-train_df[col].count())/train_df.shape[0]} nans')

mabh_seg has 0.649258033609549 nans
lang_spoken_cd has 0.7421182099253008 nans


In [11]:
# drop columns with > 50% na
train_df = train_df.dropna(axis=1, how='any', thresh=int(train_df.shape[0]*0.5))

In [12]:
train_df.shape

(974842, 364)

## Drop cols with only one value

In [13]:
for name in train_df.columns:
    if train_df[name].nunique() == 1:
        train_df.drop(name, axis=1, inplace=True)
train_df.shape

(974842, 310)

## Drop zipcd (since they were artificially generated)

In [14]:
train_df = train_df.drop('zip_cd', axis=1)

In [15]:
train_df.shape

(974842, 309)

## Find numerical/categorical features

In [16]:
cd_set = []
for name in train_df.columns.values:
    if '_cd' in name:
        print(name)
        cd_set.append(name)

cms_orig_reas_entitle_cd
sex_cd
race_cd


In [17]:
id_set = []
for name in train_df.columns.values:
    if '_id' in name:
        print(name)
        id_set.append(name)

src_div_id


In [18]:
categorical_features = ( set(train_df.columns) - set(train_df.describe().columns) - set(y_name) ) | set(cd_set)
len(categorical_features)

86

In [19]:
for col in categorical_features:
    train_df[col] = train_df[col].astype(float, errors='ignore')

In [20]:
categorical_features = ( set(train_df.columns) - set(train_df.describe().columns) - set(y_name) ) | set(cd_set)
len(categorical_features)

52

In [21]:
train_df['src_div_id'] = train_df['src_div_id'].fillna(0).astype(int, errors='ignore')

In [22]:
train_df['covid_vaccination'] = train_df['covid_vaccination'].map({'vacc': 1, 'no_vacc': 0})

## Add missing values

In [23]:
# how many columns with missing values
train_df.isnull().any().sum()

181

In [24]:
# Use mean or mode
for name in train_df.columns:
    if train_df[name].hasnans:
        if name in categorical_features:
            print('categorical:', name)
            train_df[name].fillna(train_df[name].mode()[0], inplace=True)
        elif train_df[name].dtypes == float:
            print('numerical:', name)
            train_df[name].fillna(train_df[name].mean(), inplace=True)
        else:
            print(name)

numerical: atlas_pct_laccess_child15
numerical: atlas_recfacpth14
numerical: atlas_pct_fmrkt_frveg16
numerical: atlas_pct_free_lunch14
numerical: cons_chmi
categorical: mcc_ano_pmpm_ct_t_9-6-3m_b4
numerical: cons_ltmedicr
numerical: rx_gpi4_6110_pmpm_ct
numerical: atlas_pc_snapben15
numerical: credit_bal_nonmtgcredit_60dpd
numerical: atlas_pct_laccess_nhna15
numerical: credit_hh_nonmtgcredit_60dpd
numerical: rx_bh_pmpm_ct_0to3m_b4
numerical: cons_lwcm10
numerical: atlas_fsrpth14
numerical: auth_3mth_dc_home
numerical: atlas_wicspth12
categorical: rx_gpi2_17_pmpm_cost_t_12-9-6m_b4
numerical: cons_hxmioc
numerical: atlas_ghveg_farms12
numerical: credit_hh_bankcardcredit_60dpd
numerical: total_outpatient_allowed_pmpm_cost_6to9m_b4
numerical: cons_cwht
numerical: atlas_netmigrationrate1016
numerical: atlas_pct_laccess_snap15
numerical: atlas_retirement_destination_2015_upda
numerical: atlas_naturalchangerate1016
numerical: atlas_pct_laccess_hisp15
numerical: auth_3mth_dc_no_ref
numerical: 

In [25]:
# how many columns with missing values after filling na
train_df.isnull().any().sum()

0

In [26]:
# save cleaned dataset without missing value
train_df.to_csv('data/training_removed_missing_v5.csv')

In [27]:
train_df.shape

(974842, 309)

## Transform ordinal features

In [28]:
# to restart only
if 0:
    train_df = pd.read_csv('data/training_removed_missing_v5.csv', index_col='ID')

In [29]:
ordered_cat_set = set([])
ordered_cat = []
for name in categorical_features:
    if 'No Activity' in train_df[name].unique():
        ordered_cat_set = ordered_cat_set | set(train_df[name].unique())
        ordered_cat.append(name)
print(ordered_cat_set)

  after removing the cwd from sys.path.


{'No Activity', 'No_Change', 'Inc_1x-2x', 'Dec_1x-2x', 'Inc_4x-8x', 'New', 'Dec_4x-8x', 'Resolved', 'Dec_2x-4x', 'Dec_over_8x', 'Inc_over_8x', 'Inc_2x-4x'}


In [30]:
len(ordered_cat)

45

In [31]:
len(ordered_cat_set)

12

In [32]:
train_df[ordered_cat].head()

Unnamed: 0_level_0,rx_nonotc_pmpm_cost_t_6-3-0m_b4,rx_mail_net_paid_pmpm_cost_t_6-3-0m_b4,rx_nonbh_pmpm_ct_t_9-6-3m_b4,bh_urgent_care_copay_pmpm_cost_t_12-9-6m_b4,rx_nonmail_dist_gpi6_pmpm_ct_t_9-6-3m_b4,rx_gpi2_17_pmpm_cost_t_12-9-6m_b4,rej_med_er_net_paid_pmpm_cost_t_9-6-3m_b4,rej_med_ip_snf_coins_pmpm_cost_t_9-6-3m_b4,rx_maint_net_paid_pmpm_cost_t_12-9-6m_b4,rx_generic_pmpm_cost_t_6-3-0m_b4,total_allowed_pmpm_cost_t_9-6-3m_b4,total_physician_office_net_paid_pmpm_cost_t_9-6-3m_b4,total_physician_office_mbr_resp_pmpm_cost_t_9-6-3m_b4,med_outpatient_deduct_pmpm_cost_t_9-6-3m_b4,rx_nonbh_pmpm_cost_t_9-6-3m_b4,rx_phar_cat_humana_pmpm_ct_t_9-6-3m_b4,rx_maint_pmpm_cost_t_12-9-6m_b4,total_ip_maternity_net_paid_pmpm_cost_t_12-9-6m_b4,rx_nonbh_net_paid_pmpm_cost_t_6-3-0m_b4,med_physician_office_allowed_pmpm_cost_t_9-6-3m_b4,rx_gpi2_62_pmpm_cost_t_9-6-3m_b4,total_physician_office_visit_ct_pmpm_t_6-3-0m_b4,rx_nonmaint_dist_gpi6_pmpm_ct_t_12-9-6m_b4,rx_maint_pmpm_cost_t_6-3-0m_b4,rx_maint_pmpm_ct_t_6-3-0m_b4,rx_overall_mbr_resp_pmpm_cost_t_6-3-0m_b4,rx_maint_net_paid_pmpm_cost_t_9-6-3m_b4,rx_generic_dist_gpi6_pmpm_ct_t_9-6-3m_b4,bh_ip_snf_admit_days_pmpm_t_9-6-3m_b4,rx_overall_dist_gpi6_pmpm_ct_t_6-3-0m_b4,total_med_net_paid_pmpm_cost_t_6-3-0m_b4,med_ambulance_coins_pmpm_cost_t_9-6-3m_b4,rx_gpi2_39_pmpm_cost_t_6-3-0m_b4,med_outpatient_mbr_resp_pmpm_cost_t_9-6-3m_b4,rx_overall_gpi_pmpm_ct_t_6-3-0m_b4,rx_branded_pmpm_ct_t_6-3-0m_b4,med_outpatient_visit_ct_pmpm_t_12-9-6m_b4,rej_med_outpatient_visit_ct_pmpm_t_6-3-0m_b4,oontwk_mbr_resp_pmpm_cost_t_6-3-0m_b4,rx_mail_mbr_resp_pmpm_cost_t_9-6-3m_b4,rx_phar_cat_cvs_pmpm_ct_t_9-6-3m_b4,total_bh_copay_pmpm_cost_t_9-6-3m_b4,mcc_chf_pmpm_ct_t_9-6-3m_b4,rx_overall_gpi_pmpm_ct_t_12-9-6m_b4,mcc_ano_pmpm_ct_t_9-6-3m_b4
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1
1MObcfaSTac85Lca0Y8bbA6I,Dec_1x-2x,Inc_1x-2x,Inc_1x-2x,No Activity,Inc_1x-2x,No Activity,No Activity,No Activity,Inc_1x-2x,Dec_1x-2x,No Activity,No Activity,No Activity,No Activity,Dec_1x-2x,No_Change,Inc_1x-2x,No Activity,Dec_1x-2x,No Activity,No Activity,No Activity,No Activity,Dec_1x-2x,Dec_1x-2x,Dec_1x-2x,Dec_2x-4x,Inc_1x-2x,No Activity,Dec_1x-2x,No Activity,No Activity,No_Change,No Activity,Dec_1x-2x,No Activity,No Activity,No Activity,No Activity,Inc_1x-2x,No Activity,No Activity,No Activity,Dec_1x-2x,No Activity
5M89OSTL580dYeA849d3480I,Inc_1x-2x,Inc_1x-2x,New,No_Change,No Activity,No Activity,No Activity,No Activity,No Activity,Inc_over_8x,No Activity,No Activity,No Activity,No Activity,New,New,No Activity,No_Change,Inc_1x-2x,No Activity,No Activity,No Activity,No Activity,Inc_1x-2x,Dec_1x-2x,Inc_1x-2x,New,New,No Activity,Inc_1x-2x,No Activity,No Activity,Dec_1x-2x,No Activity,Inc_1x-2x,No Activity,No_Change,No Activity,No Activity,New,No Activity,No Activity,No Activity,No Activity,No Activity
MdOS23TLe18Y60043Acfa2I9,Inc_1x-2x,New,New,No Activity,Inc_1x-2x,No Activity,No Activity,No Activity,Dec_2x-4x,Inc_1x-2x,Dec_4x-8x,Dec_2x-4x,Dec_2x-4x,No Activity,New,No Activity,Dec_2x-4x,No Activity,Inc_2x-4x,Dec_4x-8x,No Activity,Inc_1x-2x,No Activity,No_Change,No_Change,Inc_1x-2x,Dec_1x-2x,Inc_1x-2x,No Activity,Inc_1x-2x,Inc_1x-2x,No Activity,No Activity,Dec_2x-4x,Inc_1x-2x,No Activity,Dec_4x-8x,No Activity,Dec_1x-2x,No_Change,No Activity,No Activity,No Activity,No_Change,No Activity
2ccMO510abSaT79cLfaYAIe4,Dec_4x-8x,Resolved,Dec_1x-2x,No Activity,Dec_4x-8x,No Activity,No Activity,No Activity,Inc_2x-4x,New,Resolved,No Activity,No Activity,No Activity,Dec_1x-2x,No Activity,Inc_1x-2x,No Activity,Dec_over_8x,No Activity,No Activity,No Activity,No Activity,Dec_2x-4x,Dec_1x-2x,Dec_2x-4x,Dec_1x-2x,Dec_1x-2x,No Activity,No_Change,No Activity,No Activity,No Activity,No Activity,Dec_1x-2x,No Activity,No Activity,No Activity,No Activity,Inc_1x-2x,No Activity,No Activity,No Activity,Inc_1x-2x,No Activity
0M9811Ocb1ST94LY3f5A9I00,Dec_1x-2x,Dec_1x-2x,Inc_1x-2x,No Activity,No Activity,Resolved,No Activity,No Activity,Inc_1x-2x,Dec_1x-2x,No Activity,No Activity,No Activity,No Activity,Inc_2x-4x,Inc_1x-2x,Inc_1x-2x,No Activity,Dec_1x-2x,No Activity,No Activity,No Activity,Resolved,Dec_2x-4x,Dec_2x-4x,No Activity,Inc_1x-2x,Dec_1x-2x,No Activity,No_Change,No Activity,No Activity,Dec_2x-4x,No Activity,No_Change,No Activity,Resolved,No Activity,No Activity,No Activity,No Activity,No Activity,No Activity,No_Change,No Activity


### Set ordinal scores

These trend variables compare the numerator to the denominator, so 0-3-6 compares 3 months prior to score date (0-3, numerator) to the 3-6 months prior to the score date (3-6, denominator).  
For 3-6-9, it’s 3-6 months prior to score date as numerator and 6-9 months prior to score date as denominator.  
We’ll use numerator and denominator to help explain things below.  
- Is there a difference between the values of "Not_Activity" and "No_Change"?
No Activity = No claims in numerator or denominator; No change = claims in both numerator and denominator, but ratio between 0.99 and 1.01
- What does the value of "Resolved" mean?
Resolved = Had claims in denominator, but none in numerator
- We are assuming "New" means the patient had the cost incurred for the first time, is that a correct assumption?
New = had claims in numerator, but not denominator


In [33]:
ordered_cat_transform_tab = {'Inc_over_8x': 8,
                             'Inc_4x-8x': 6,
                             'Inc_2x-4x': 3,
                             'Inc_1x-2x': 1.5,
                             'No_Change': 0,
                             'Dec_1x-2x': -1.5,
                             'Dec_2x-4x': -3,
                             'Dec_4x-8x': -6,
                             'Dec_over_8x': -8,
                             'Resolved': -10, 
                             'No Activity': 0.5,
                             'New': 10}

In [34]:
# check trend
train_df.groupby('rx_gpi2_62_pmpm_cost_t_9-6-3m_b4')[y_name].mean().sort_values(y_name)

Unnamed: 0_level_0,covid_vaccination
rx_gpi2_62_pmpm_cost_t_9-6-3m_b4,Unnamed: 1_level_1
Dec_4x-8x,0.1625
Resolved,0.162727
No Activity,0.17273
New,0.192548
Inc_2x-4x,0.202619
Dec_over_8x,0.212121
Inc_4x-8x,0.218935
Inc_1x-2x,0.226991
Dec_2x-4x,0.235988
No_Change,0.241322


In [35]:
for name in ordered_cat:
    train_df[name] = train_df[name].map(ordered_cat_transform_tab)

## Transform categorical features

In [36]:
categorical_features = (set(categorical_features)-set(ordered_cat)) | set(['src_div_id'])
categorical_features

{'cms_orig_reas_entitle_cd',
 'cons_hhcomp',
 'cons_mobplus',
 'hedis_dia_hba1c_ge9',
 'hum_region',
 'race_cd',
 'sex_cd',
 'src_div_id'}

In [37]:
train_df[categorical_features].sample(20)

Unnamed: 0_level_0,cons_hhcomp,race_cd,cons_mobplus,src_div_id,cms_orig_reas_entitle_cd,hedis_dia_hba1c_ge9,sex_cd,hum_region
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
40M99fO294Sd1eT2LY9dA15I,A,1.0,P,0,0.0,N,M,TEXAS
5fMO5Sb3T3a3Lbfd4eYfA54I,L,1.0,U,0,0.0,N,F,TEXAS
MO20S751T3654L42Y25AId89,L,1.0,S,0,1.0,N,F,TEXAS
MO9a2d96eS2ddTf1L12YAI74,A,5.0,S,0,1.0,N,M,FLORIDA
0dMOadf0STLd1a5aY5fAd9Ib,J,1.0,U,0,1.0,N,M,MID-ATLANTIC/NORTH CAROLINA
eM65aO8S588TfL7Y9e38cAfI,B,1.0,M,0,0.0,N,F,GREAT LAKES/CENTRAL NORTH
fMbd3O18eSdcT8LYfa7A7I73,L,1.0,M,0,0.0,N,F,INTERMOUNTAIN
MO200S96cTL857aY9Adf4I4b,A,1.0,M,0,0.0,N,F,CENTRAL WEST
McO9STc3aL6abfYd9d5A7I5a,J,4.0,M,0,0.0,N,M,CENTRAL WEST
dMeaO656S31TdfLbeY2AI9c4,U,1.0,M,0,1.0,N,M,CENTRAL


In [38]:
train_df[id_set].value_counts()

0    898148
1     69291
2      5536
3       841
5       526
4       500
Name: src_div_id, dtype: int64

In [40]:
for name in categorical_features:
    train_df = pd.concat([train_df.drop(name, axis=1), pd.get_dummies(train_df[name], prefix=name, dummy_na=True)], axis=1)
    print(name, train_df.shape)

cons_hhcomp (974842, 322)
race_cd (974842, 329)
cons_mobplus (974842, 333)
src_div_id (974842, 339)
cms_orig_reas_entitle_cd (974842, 343)
hedis_dia_hba1c_ge9 (974842, 345)
sex_cd (974842, 347)
hum_region (974842, 363)


In [41]:
train_df.shape

(974842, 363)

## Save cleaned dataset

In [42]:
train_df.head()

Unnamed: 0_level_0,covid_vaccination,rx_gpi2_72_pmpm_cost_6to9m_b4,atlas_pct_laccess_child15,atlas_recfacpth14,atlas_pct_fmrkt_frveg16,atlas_pct_free_lunch14,bh_ncal_pmpm_ct,total_bh_copay_pmpm_cost_t_9-6-3m_b4,cons_chmi,mcc_ano_pmpm_ct_t_9-6-3m_b4,rx_maint_pmpm_cost_t_12-9-6m_b4,cons_ltmedicr,rx_gpi4_6110_pmpm_ct,atlas_pc_snapben15,credit_bal_nonmtgcredit_60dpd,rx_bh_mbr_resp_pmpm_cost_9to12m_b4,rx_nonbh_pmpm_cost_t_9-6-3m_b4,atlas_pct_laccess_nhna15,credit_hh_nonmtgcredit_60dpd,rx_bh_pmpm_ct_0to3m_b4,cons_lwcm10,atlas_fsrpth14,auth_3mth_dc_home,atlas_wicspth12,rx_gpi2_17_pmpm_cost_t_12-9-6m_b4,cons_hxmioc,rx_generic_pmpm_cost_t_6-3-0m_b4,cmsd2_sns_digest_abdomen_pmpm_ct,atlas_ghveg_farms12,credit_hh_bankcardcredit_60dpd,total_outpatient_allowed_pmpm_cost_6to9m_b4,cons_cwht,atlas_netmigrationrate1016,atlas_pct_laccess_snap15,bh_ncdm_ind,rx_nonmaint_mbr_resp_pmpm_cost_9to12m_b4,atlas_retirement_destination_2015_upda,rx_overall_mbr_resp_pmpm_cost_t_6-3-0m_b4,atlas_naturalchangerate1016,ccsp_236_pct,rx_overall_dist_gpi6_pmpm_ct_t_6-3-0m_b4,atlas_pct_laccess_hisp15,auth_3mth_dc_no_ref,rx_overall_mbr_resp_pmpm_cost,rx_overall_gpi_pmpm_ct_0to3m_b4,auth_3mth_dc_snf,rx_phar_cat_humana_pmpm_ct_t_9-6-3m_b4,atlas_pct_laccess_hhnv15,auth_3mth_acute_end,auth_3mth_psychic,atlas_hiamenity,auth_3mth_bh_acute,credit_bal_consumerfinance,auth_3mth_acute_chf,rx_overall_gpi_pmpm_ct_t_6-3-0m_b4,rwjf_uninsured_pct,mcc_chf_pmpm_ct_t_9-6-3m_b4,rx_mail_mbr_resp_pmpm_cost_0to3m_b4,bh_urgent_care_copay_pmpm_cost_t_12-9-6m_b4,atlas_pct_wic15,ccsp_193_pct,auth_3mth_dc_hospice,atlas_pct_fmrkt_baked16,rx_nonmaint_mbr_resp_pmpm_cost,auth_3mth_acute_skn,atlas_veg_farms12,atlas_vlfoodsec_13_15,rx_gpi2_34_dist_gpi6_pmpm_ct,bh_ip_snf_net_paid_pmpm_cost,credit_hh_bankcard_severederog,rx_hum_16_pmpm_ct,est_age,rx_maint_pmpm_cost_t_6-3-0m_b4,cnt_cp_webstatement_pmpm_ct,atlas_pct_laccess_seniors15,phy_em_px_pct,atlas_percapitainc,rwjf_uninsured_adults_pct,rx_generic_mbr_resp_pmpm_cost_0to3m_b4,rwjf_air_pollute_density,rx_gpi2_02_pmpm_cost,atlas_recfac14,lab_albumin_loinc_pmpm_ct,atlas_pct_obese_adults13,rx_maint_net_paid_pmpm_cost_t_12-9-6m_b4,rev_pm_obsrm_pmpm_ct,atlas_pct_sfsp15,total_physician_office_net_paid_pmpm_cost_9to12m_b4,atlas_pc_dirsales12,med_ip_snf_admit_days_pmpm,rej_med_outpatient_visit_ct_pmpm_t_6-3-0m_b4,cms_tot_partd_payment_amt,rx_nonotc_dist_gpi6_pmpm_ct,rx_nonmaint_pmpm_ct,rx_nonbh_mbr_resp_pmpm_cost_6to9m_b4,cons_stlnindx,atlas_hipov_1115,rx_nonbh_mbr_resp_pmpm_cost,atlas_redemp_snaps16,atlas_berry_farms12,rej_med_ip_snf_coins_pmpm_cost_t_9-6-3m_b4,rwjf_inactivity_pct,rx_gpi2_72_pmpm_ct_6to9m_b4,cons_n2pmr,med_physician_office_allowed_pmpm_cost_t_9-6-3m_b4,auth_3mth_acute_res,rev_cms_ct_pmpm_ct,atlas_foodhub16,total_physician_office_copay_pmpm_cost,auth_3mth_acute_dig,auth_3mth_dc_acute_rehab,atlas_pct_fmrkt_anmlprod16,credit_num_agencyfirstmtg,total_physician_office_net_paid_pmpm_cost_t_9-6-3m_b4,atlas_type_2015_mining_no,atlas_agritrsm_rct12,rx_days_since_last_script,atlas_pct_laccess_pop15,auth_3mth_post_acute_res,auth_3mth_acute_inf,rx_gpi2_01_pmpm_cost_0to3m_b4,atlas_povertyallagespct,rwjf_uninsured_child_pct,rx_branded_pmpm_ct_t_6-3-0m_b4,med_outpatient_deduct_pmpm_cost_t_9-6-3m_b4,credit_bal_mtgcredit_new,atlas_low_employment_2015_update,atlas_pct_diabetes_adults13,atlas_pct_laccess_nhasian15,atlas_deep_pov_all,atlas_net_international_migration_rate,atlas_deep_pov_children,bh_ncdm_pct,auth_3mth_non_er,atlas_foodinsec_child_03_11,rx_branded_mbr_resp_pmpm_cost,atlas_pc_wic_redemp12,rwjf_mv_deaths_rate,auth_3mth_acute_cad,atlas_pct_reduced_lunch14,cons_nwperadult,total_allowed_pmpm_cost_t_9-6-3m_b4,rx_hum_28_pmpm_cost,atlas_totalocchu,med_physician_office_ds_clm_6to9m_b4,atlas_pct_loclfarm12,rx_generic_mbr_resp_pmpm_cost,total_outpatient_mbr_resp_pmpm_cost_6to9m_b4,rx_gpi4_3400_pmpm_ct,lab_dist_loinc_pmpm_ct,atlas_pct_nslp15,rx_generic_pmpm_ct_0to3m_b4,oontwk_mbr_resp_pmpm_cost_t_6-3-0m_b4,atlas_pct_laccess_lowi15,bh_ncal_ind,atlas_pct_fmrkt_sfmnp16,rx_nonmail_dist_gpi6_pmpm_ct_t_9-6-3m_b4,atlas_pct_loclsale12,rej_med_er_net_paid_pmpm_cost_t_9-6-3m_b4,credit_bal_autobank,med_outpatient_mbr_resp_pmpm_cost_t_9-6-3m_b4,rx_overall_mbr_resp_pmpm_cost_0to3m_b4,rx_tier_2_pmpm_ct_3to6m_b4,rx_nonbh_net_paid_pmpm_cost,rx_maint_pmpm_ct_9to12m_b4,rx_nonbh_net_paid_pmpm_cost_t_6-3-0m_b4,atlas_type_2015_recreation_no,rx_gpi2_39_pmpm_cost_t_6-3-0m_b4,atlas_type_2015_update,cms_risk_adjustment_factor_a_amt,total_ip_maternity_net_paid_pmpm_cost_t_12-9-6m_b4,rx_generic_pmpm_cost,cmsd2_eye_retina_pmpm_ct,auth_3mth_post_acute,auth_3mth_facility,rx_days_since_last_script_0to3m_b4,atlas_population_loss_2015_update,rx_maint_pmpm_ct_t_6-3-0m_b4,auth_3mth_acute_mean_los,credit_num_autofinance,cons_rxmaint,rx_mail_net_paid_pmpm_cost_t_6-3-0m_b4,auth_3mth_home,rx_maint_mbr_resp_pmpm_cost_6to9m_b4,cons_hxwearbl,total_physician_office_mbr_resp_pmpm_cost_t_9-6-3m_b4,atlas_pct_laccess_black15,atlas_hh65plusalonepct,atlas_farm_to_school13,auth_3mth_acute_inj,rej_days_since_last_clm,bh_outpatient_net_paid_pmpm_cost,atlas_dirsales_farms12,rx_generic_pmpm_cost_6to9m_b4,rev_cms_ansth_pmpm_ct,atlas_convspth14,total_med_allowed_pmpm_cost_9to12m_b4,rx_mail_mbr_resp_pmpm_cost_t_9-6-3m_b4,med_outpatient_visit_ct_pmpm_t_12-9-6m_b4,rx_nonbh_pmpm_ct_t_9-6-3m_b4,auth_3mth_acute,rx_nonbh_pmpm_ct_0to3m_b4,atlas_pc_ffrsales12,auth_3mth_dc_left_ama,credit_bal_bankcard_severederog,atlas_povertyunder18pct,rx_tier_1_pmpm_ct_0to3m_b4,cons_estinv30_rc,auth_3mth_bh_acute_men,rx_gpi2_34_pmpm_ct,auth_3mth_dc_custodial,atlas_veg_acrespth12,atlas_grocpth14,total_med_net_paid_pmpm_cost_t_6-3-0m_b4,rx_gpi2_90_dist_gpi6_pmpm_ct_9to12m_b4,atlas_csa12,rx_gpi2_62_pmpm_cost_t_9-6-3m_b4,rx_overall_gpi_pmpm_ct_t_12-9-6m_b4,auth_3mth_acute_hdz,cons_rxadhs,atlas_pct_fmrkt_snap16,met_obe_diag_pct,cms_partd_ra_factor_amt,atlas_pct_sbp15,rwjf_resident_seg_black_inx,atlas_pct_cacfp15,auth_3mth_rehab,pdc_lip,atlas_ffrpth14,credit_num_autobank_new,rx_tier_2_pmpm_ct,cons_n2pwh,rx_nonmaint_dist_gpi6_pmpm_ct_t_12-9-6m_b4,atlas_berry_acrespth12,atlas_pct_fmrkt_credit16,atlas_slhouse12,atlas_pc_fsrsales12,credit_hh_1stmtgcredit,auth_3mth_snf_post_hsp,atlas_pct_fmrkt_wiccash16,atlas_foodinsec_13_15,cons_rxadhm,atlas_fmrktpth16,rx_nonotc_pmpm_cost_t_6-3-0m_b4,cci_dia_m_pmpm_ct,cons_n2phi,bh_physician_office_copay_pmpm_cost_6to9m_b4,rwjf_income_inequ_ratio,rej_total_physician_office_visit_ct_pmpm_0to3m_b4,credit_num_nonmtgcredit_60dpd,credit_bal_autofinance_new,rwjf_men_hlth_prov_ratio,auth_3mth_dc_home_health,rx_gpi2_56_dist_gpi6_pmpm_ct_3to6m_b4,cmsd2_sns_genitourinary_pmpm_ct,auth_3mth_acute_cir,med_ambulance_coins_pmpm_cost_t_9-6-3m_b4,bh_ncal_pct,atlas_pct_snap16,ccsp_227_pct,atlas_ghveg_sqftpth12,rx_days_since_last_script_6to9m_b4,atlas_orchard_acrespth12,atlas_persistentchildpoverty_1980_2011,atlas_pct_laccess_multir15,cons_cgqs,ccsp_065_pmpm_ct,atlas_medhhinc,rx_maint_net_paid_pmpm_cost_t_9-6-3m_b4,rwjf_mental_distress_pct,bh_ip_snf_admit_days_pmpm_t_9-6-3m_b4,rx_phar_cat_cvs_pmpm_ct_t_9-6-3m_b4,atlas_pct_laccess_nhpi15,auth_3mth_post_er,credit_num_consumerfinance_new,rx_gpi2_49_pmpm_cost_0to3m_b4,cons_chva,atlas_avghhsize,rx_overall_net_paid_pmpm_cost_6to9m_b4,atlas_ownhomepct,atlas_orchard_farms12,total_physician_office_visit_ct_pmpm_t_6-3-0m_b4,atlas_pct_fmrkt_wic16,rx_gpi2_33_pmpm_ct_0to3m_b4,rwjf_social_associate_rate,atlas_freshveg_farms12,auth_3mth_acute_sns,days_since_last_clm_0to3m_b4,auth_3mth_dc_other,auth_3mth_bh_acute_mean_los,mcc_end_pct,cons_lwcm07,atlas_pct_fmrkt_otherfood16,auth_3mth_acute_mus,atlas_perpov_1980_0711,atlas_pct_laccess_white15,auth_3mth_post_acute_mean_los,rx_gpi2_66_pmpm_ct,auth_3mth_acute_gus,rx_generic_dist_gpi6_pmpm_ct_t_9-6-3m_b4,atlas_low_education_2015_update,cons_hhcomp_A,cons_hhcomp_B,cons_hhcomp_C,cons_hhcomp_D,cons_hhcomp_E,cons_hhcomp_F,cons_hhcomp_G,cons_hhcomp_H,cons_hhcomp_I,cons_hhcomp_J,cons_hhcomp_K,cons_hhcomp_L,cons_hhcomp_U,cons_hhcomp_nan,race_cd_0.0,race_cd_1.0,race_cd_2.0,race_cd_3.0,race_cd_4.0,race_cd_5.0,race_cd_6.0,race_cd_nan,cons_mobplus_M,cons_mobplus_P,cons_mobplus_S,cons_mobplus_U,cons_mobplus_nan,src_div_id_0.0,src_div_id_1.0,src_div_id_2.0,src_div_id_3.0,src_div_id_4.0,src_div_id_5.0,src_div_id_nan,cms_orig_reas_entitle_cd_0.0,cms_orig_reas_entitle_cd_1.0,cms_orig_reas_entitle_cd_2.0,cms_orig_reas_entitle_cd_3.0,cms_orig_reas_entitle_cd_nan,hedis_dia_hba1c_ge9_N,hedis_dia_hba1c_ge9_Y,hedis_dia_hba1c_ge9_nan,sex_cd_F,sex_cd_M,sex_cd_nan,hum_region_CALIFORNIA/NEVADA,hum_region_CENTRAL,hum_region_CENTRAL WEST,hum_region_EAST,hum_region_EAST CENTRAL,hum_region_FLORIDA,hum_region_GREAT LAKES/CENTRAL NORTH,hum_region_GULF STATES,hum_region_INTERMOUNTAIN,hum_region_MID-ATLANTIC/NORTH CAROLINA,hum_region_MID-SOUTH,hum_region_NORTHEAST,hum_region_PACIFIC,hum_region_PR,hum_region_SOUTHEAST,hum_region_TEXAS,hum_region_nan
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1,Unnamed: 289_level_1,Unnamed: 290_level_1,Unnamed: 291_level_1,Unnamed: 292_level_1,Unnamed: 293_level_1,Unnamed: 294_level_1,Unnamed: 295_level_1,Unnamed: 296_level_1,Unnamed: 297_level_1,Unnamed: 298_level_1,Unnamed: 299_level_1,Unnamed: 300_level_1,Unnamed: 301_level_1,Unnamed: 302_level_1,Unnamed: 303_level_1,Unnamed: 304_level_1,Unnamed: 305_level_1,Unnamed: 306_level_1,Unnamed: 307_level_1,Unnamed: 308_level_1,Unnamed: 309_level_1,Unnamed: 310_level_1,Unnamed: 311_level_1,Unnamed: 312_level_1,Unnamed: 313_level_1,Unnamed: 314_level_1,Unnamed: 315_level_1,Unnamed: 316_level_1,Unnamed: 317_level_1,Unnamed: 318_level_1,Unnamed: 319_level_1,Unnamed: 320_level_1,Unnamed: 321_level_1,Unnamed: 322_level_1,Unnamed: 323_level_1,Unnamed: 324_level_1,Unnamed: 325_level_1,Unnamed: 326_level_1,Unnamed: 327_level_1,Unnamed: 328_level_1,Unnamed: 329_level_1,Unnamed: 330_level_1,Unnamed: 331_level_1,Unnamed: 332_level_1,Unnamed: 333_level_1,Unnamed: 334_level_1,Unnamed: 335_level_1,Unnamed: 336_level_1,Unnamed: 337_level_1,Unnamed: 338_level_1,Unnamed: 339_level_1,Unnamed: 340_level_1,Unnamed: 341_level_1,Unnamed: 342_level_1,Unnamed: 343_level_1,Unnamed: 344_level_1,Unnamed: 345_level_1,Unnamed: 346_level_1,Unnamed: 347_level_1,Unnamed: 348_level_1,Unnamed: 349_level_1,Unnamed: 350_level_1,Unnamed: 351_level_1,Unnamed: 352_level_1,Unnamed: 353_level_1,Unnamed: 354_level_1,Unnamed: 355_level_1,Unnamed: 356_level_1,Unnamed: 357_level_1,Unnamed: 358_level_1,Unnamed: 359_level_1,Unnamed: 360_level_1,Unnamed: 361_level_1,Unnamed: 362_level_1,Unnamed: 363_level_1
1MObcfaSTac85Lca0Y8bbA6I,0,0.0,7.910346,0.049413,0.0,46.839102,0.0,0.5,67.0,0.5,1.5,4.0,0.0,8.068443,2366.225593,0.0,-1.5,0.03655,22.614359,0.0,0.26716,0.904069,0.0,0.248279,0.5,9.0,-1.5,0.0,5.0,9.803185,0.0,70.0,9.775188,1.458254,0,0.0,0.0,-1.5,2.255148,0.0,-1.5,1.190413,0.0,14.424166,2.0,0.0,0.0,1.150322,0,0.0,0.0,0.0,832.960852,0.0,-1.5,0.071574,0.5,1.266667,0.5,2.032116,0.0,0,25.0,4.394167,0,30.0,6.1,0.083333,0.0,7.551157,0.833333,78,-1.5,1.416667,5.521413,0.0,28021.0,0.065172,12.37,8.0,0.595833,3.0,0.0,33.2,1.5,0.0,0.534684,0.0,5.674145,0.0,0.5,28.89,0.5,0.166667,50.546665,9.0,0.0,14.1775,152649.765535,2.0,0.5,0.234,0.0,52.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,20.0,0.200841,0.5,0.0,210873.0,17,26.891725,0,0,0.0,11.4,0.058867,0.5,0.5,5559.328994,0.0,11.7,0.071579,4.598999,0.083808,6.946784,0.0,0.0,8.3,0.0,7.444571,13.008691,0,8.014182,104166.666667,0.5,0.0,16416.0,120,3.359617,14.174166,0.0,0.333333,0.0,12.218996,2.0,0.5,8.809361,0,0.0,1.5,0.042699,0.5,6434.326769,0.5,12.383333,1.0,24.014165,1.333333,-1.5,0.0,0.0,3.0,0.0,0.5,40.331667,0.0,0.0,0.0,11,1.0,-1.5,0.0,0.115556,2.0,1.5,0.0,12.716667,8.0,0.5,0.031035,12.005285,1.0,0,480,0.0,17.0,72.27333,0.0,0.504157,0.0,1.5,0.5,1.5,0.0,2.0,479.49278,0.0,336.631069,18.3,1.0,175000.0,0,0.333333,0.0,4.181879,0.008268,0.5,0.0,1.0,0.5,-1.5,0,5.0,0.0,0.0,0.736,3.145443,83.762117,1.412746,0,1.0,0.81708,0.10478,0.75,95.0,0.5,0.207904,0.0,0.0,534.961996,33.213855,0.0,0.0,14.8,2.0,0.070159,-1.5,0.0,3.0,0.0,3.621404,0.0,0.621714,1389.427219,0.0004,0.0,0.0,0.0,0,0.5,0.0,12.083352,0.0,147.994686,217,0.0,0.0,1.260405,88.0,0.0,56861.0,-3.0,0.103341,0.5,0.5,0.0,0.0,0.073287,3.956667,158.0,2.12,38.32,73.922397,0.0,0.5,0.0,0.333333,23.839718,5.0,0,120,0.0,0.0,0.0,0.23359,0.0,0.0,0.0,26.842903,0.0,0.0,0,1.5,0.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0
5M89OSTL580dYeA849d3480I,0,0.0,1.730272,0.095624,60.0,36.721923,0.0,0.5,69.0,0.5,0.5,3.0,0.0,12.354272,2926.079093,0.0,10.0,0.028851,19.627044,0.0,0.14265,0.721653,0.0,0.08781,0.5,9.0,8.0,0.0,6.0,10.081917,0.0,75.0,9.931234,1.063555,0,0.0,0.0,1.5,3.093653,0.0,1.5,1.251418,0.0,27.2675,3.666667,0.0,10.0,2.447362,0,0.0,0.0,0.0,814.885956,0.0,1.5,0.080894,0.5,15.0,0.0,2.378146,0.0,0,50.0,11.9675,0,63.0,3.8,0.0,0.0,8.550448,1.25,75,1.5,1.5,2.518561,0.0,29859.0,0.090135,39.64,10.3,0.8275,28.0,0.0,32.9,0.5,0.0,0.961838,18.992024,3.954437,0.0,0.5,28.81,1.25,0.625,0.0,9.0,0.0,47.8625,233871.961736,14.0,0.5,0.239,0.0,56.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,43.0,0.419854,0.5,0.0,14000.0,12,12.019081,0,0,0.0,13.3,0.032037,0.5,0.5,13848.662109,0.0,10.0,0.280467,7.640235,0.475498,1.502318,0.0,0.0,7.1,0.0,22.96716,13.32628,0,5.009556,437500.0,0.5,0.0,99660.0,120,10.251445,37.615,0.0,0.0,0.0,11.18006,3.666667,0.5,4.217246,0,70.0,0.5,0.929615,0.5,7183.751526,0.5,49.34,1.666667,9.4975,0.0,1.5,0.0,-1.5,0.0,0.0,0.0,53.745,0.0,0.0,0.0,18,0.0,-1.5,0.0,0.331104,1.0,1.5,0.0,0.0,9.0,0.5,0.669094,11.286925,1.0,0,480,0.0,116.0,0.0,0.0,0.30099,350.915216,10.0,0.0,10.0,0.0,3.666667,521.2382,0.0,348.886552,12.6,2.666667,875000.0,0,0.0,0.0,0.646902,0.129287,0.5,0.0,4.0,0.5,0.5,0,0.0,40.0,0.0,0.544,3.913049,48.515137,1.704639,0,1.0,0.619212,0.145811,1.5,93.0,0.5,0.04339,40.0,2.0,690.520343,41.87406,0.0,0.0,9.9,2.0,0.025133,1.5,0.0,1.0,0.0,4.430692,0.0,0.549206,1795.154717,0.001456,0.0,0.333333,0.0,0,0.5,0.0,8.67772,0.0,80.357201,120,0.156425,0.0,0.310503,82.0,0.0,55828.0,10.0,0.106975,0.5,0.5,0.002699,0.0,0.228002,7.793334,254.0,2.58,0.0,68.704457,21.0,0.5,0.0,0.333333,12.576445,69.0,0,120,0.0,0.0,0.0,0.19198,50.0,0.0,0.0,11.405128,0.0,0.0,0,10.0,0.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0
MdOS23TLe18Y60043Acfa2I9,0,0.0,5.015501,0.022398,30.0,39.605015,0.0,0.5,76.0,0.5,-3.0,5.422812,0.0,14.18409,4522.696898,0.17,10.0,0.08674,36.273675,0.0,0.25904,0.444301,0.0,0.103268,0.5,3.0,1.5,0.0,1.0,15.611655,4192.19,55.0,5.55576,2.51632,0,0.0,0.0,1.5,3.323222,0.0,1.5,1.715413,0.0,23.571666,1.333333,0.0,0.5,2.212277,0,0.0,0.0,0.0,1796.896312,0.0,1.5,0.110481,0.5,2.5,0.5,2.339832,0.0,0,0.0,11.381667,0,10.0,4.6,0.0,0.0,13.68484,0.0,41,0.0,8.583333,2.418513,1.568324,28725.0,0.164377,6.716667,9.0,0.0,2.0,0.0,35.0,-3.0,0.3,1.359437,125.33,7.440498,0.0,0.5,151.83,0.333333,0.416667,0.0,7.0,0.0,26.849167,236625.461866,10.0,0.5,0.271,0.0,48.0,-6.0,0.0,0.0,0.0,10.833333,0.0,0.0,0.0,0.280883,-3.0,0.0,210873.0,61,19.188011,0,0,0.0,10.3,0.059742,0.5,0.5,7172.199109,0.0,13.1,0.000395,6.64755,0.384934,8.625882,0.0,0.0,9.8,0.0,18.92932,15.423137,0,6.299918,1250.0,-6.0,0.0,23811.0,214,5.168731,12.001666,154.423333,0.0,2.75,9.865436,1.333333,-1.5,7.809896,0,0.0,1.5,0.075195,0.5,4952.314364,-3.0,10.116667,0.0,4.733333,0.333333,3.0,0.0,0.5,3.0,0.749,0.5,34.0975,0.0,0.0,0.0,17,0.0,0.0,0.0,0.381622,7.0,10.0,0.0,4.666667,2.0,-3.0,1.466227,10.10489,1.0,0,180,0.0,33.0,7.733333,0.25,0.640569,7369.42,0.0,-6.0,10.0,0.0,1.333333,632.196141,0.0,324.401536,17.3,0.666667,32500.0,0,0.0,0.0,7.431193,0.299296,1.5,0.0,2.0,0.5,0.0,0,9.0,0.0,0.0,0.952,5.437714,20.332516,0.800732,0,1.1,0.56106,0.105058,0.0,26.0,0.5,0.040506,0.0,0.0,688.251535,31.331165,0.0,0.0,13.2,6.0,0.018161,1.5,0.0,6.0,0.0,3.682825,0.0,1.167164,1989.082598,0.000981,0.0,0.0,0.0,0,0.5,0.0,15.466672,1.958872,60.517063,231,1.03751,0.0,0.773873,98.0,0.0,61903.0,-1.5,0.113497,0.5,0.5,0.0,0.0,0.502758,0.0,118.0,2.57,1.186667,68.700726,10.0,1.5,0.0,0.0,9.649039,14.0,0,36,0.0,0.0,0.0,0.44111,0.0,0.0,0.0,1.713138,0.0,0.083333,0,1.5,0.0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0
2ccMO510abSaT79cLfaYAIe4,0,2.266667,4.049586,0.070407,50.0,93.694818,0.0,0.5,46.0,0.5,1.5,8.0,0.0,25.22,3993.478363,0.0,-1.5,0.167049,34.035432,0.0,0.27952,0.696737,0.0,0.087032,0.5,6.0,10.0,0.0,0.0,22.732829,0.0,66.0,2.118735,5.050701,0,0.0,0.0,-3.0,3.725334,0.0,0.0,1.879706,0.0,6.016667,1.333333,0.0,0.5,1.527418,0,0.0,0.0,0.0,961.13878,0.0,-1.5,0.155642,0.5,8.383333,0.5,2.587396,0.0,0,0.0,0.0,0,15.0,5.6,0.0,0.0,18.194131,0.416667,67,-3.0,0.583333,3.429659,0.0,24971.0,0.224473,8.28,10.7,0.0,18.0,0.0,37.1,3.0,0.0,0.991095,0.0,0.156201,0.0,0.5,83.67,0.416667,0.0,27.413333,9.0,0.0,7.061667,302974.081188,0.0,0.5,0.247,0.333333,30.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.254306,0.5,0.0,5000.0,39,28.96755,0,0,0.0,16.3,0.08192,0.5,0.5,3686.592588,0.0,11.5,0.849008,6.820686,0.145067,10.999059,0.0,0.0,10.5,0.0,27.75764,13.809701,0,6.507174,625000.0,-10.0,0.0,70150.0,120,4.0006,7.066667,0.0,0.0,0.0,12.101522,1.333333,0.5,10.317817,0,0.0,-6.0,0.1001,0.5,3840.454257,0.5,9.02,0.0,1.6975,1.333333,-8.0,0.0,0.5,0.0,0.0,0.5,7.994167,0.0,0.0,0.0,35,0.0,-1.5,0.0,0.465225,2.0,-10.0,0.0,18.733334,6.0,0.5,5.392784,7.023556,0.0,0,480,0.0,3.0,11.95,0.0,0.585325,0.0,1.5,0.5,-1.5,0.0,1.333333,666.146008,0.0,422.525637,33.7,1.333333,175000.0,0,0.0,0.0,0.027,0.184512,0.5,0.0,4.0,0.5,1.5,0,4.0,0.0,0.0,0.828,6.137434,40.74969,1.387364,0,1.1,0.630592,0.064825,0.75,38.0,0.5,0.0,0.0,0.0,649.837136,24.131826,0.0,0.0,14.9,3.0,0.017912,-6.0,0.0,15.0,0.0,4.228425,0.0,1.021212,1832.369829,0.000883,0.0,0.0,0.0,0,0.5,0.0,16.414948,0.0,0.0,199,9.094149,0.0,1.950803,86.0,0.0,41694.0,-1.5,0.122726,0.5,0.5,0.023008,0.0,0.330044,0.0,185.0,2.82,2.926667,53.014194,20.0,0.5,0.0,0.0,11.351209,10.0,0,120,0.0,0.0,0.0,0.15418,0.0,0.0,0.0,11.853595,0.0,0.0,0,-1.5,0.0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0
0M9811Ocb1ST94LY3f5A9I00,0,0.0,0.618606,0.074862,88.272489,36.298252,0.0,0.5,111.0,0.5,1.5,4.0,0.0,2.080756,1336.755009,0.0,3.0,0.03595,11.661509,0.0,0.26716,0.759512,0.0,0.160382,-10.0,8.0,-1.5,0.0,17.0,7.175145,0.0,64.0,6.841375,0.018473,0,0.0,0.0,0.5,1.592511,0.0,0.0,2.637248,0.0,0.0,1.666667,0.0,1.5,0.208543,0,0.0,1.0,0.0,540.459213,0.0,0.0,0.093018,0.5,0.0,0.5,3.231603,0.0,0,79.271429,0.0,0,283.0,4.5,0.083333,0.0,6.021257,1.25,70,-3.0,0.333333,1.730244,6.0,38982.0,0.094049,0.0,8.7,0.0,38.0,0.0,24.1,1.5,0.0,0.327121,0.0,5.434265,0.0,0.5,76.15,0.833333,0.416667,0.0,9.0,0.0,0.0,206260.065041,64.0,0.5,0.108,0.0,57.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,16.278134,0.431809,0.5,0.0,1747000.0,45,5.248898,0,0,0.0,11.7,0.039492,0.5,0.5,21211.640393,0.0,7.1,0.885394,7.59274,0.449443,5.735983,0.0,0.0,10.8,0.0,10.44615,7.609376,0,7.556822,1000000.0,0.5,0.0,106124.0,120,17.864455,0.0,0.0,0.416667,0.0,8.358339,1.666667,0.5,3.923556,0,0.0,0.5,0.757533,0.5,6185.36902,0.5,0.0,0.333333,48.255,1.333333,-1.5,0.0,-3.0,0.0,0.3,0.5,22.905834,0.0,0.0,0.0,31,0.0,-3.0,0.0,0.323137,4.0,-1.5,0.0,0.0,9.0,0.5,0.155782,9.750538,1.0,0,480,0.0,195.0,46.816667,0.0,0.260929,0.0,0.5,-10.0,1.5,0.0,1.666667,642.487457,0.0,316.407643,16.5,1.333333,875000.0,0,0.416667,0.0,0.245965,0.284236,0.5,0.0,28.0,0.5,0.0,0,5.0,30.0,0.0,0.548,4.321251,42.702891,1.438477,0,1.0,0.709837,0.115028,0.0,88.0,-10.0,0.322768,66.666667,5.0,750.318646,41.662242,0.0,0.0,12.6,3.0,0.012339,-1.5,0.0,13.0,0.0,4.307094,0.0,0.247203,1564.619184,0.003372,0.0,0.0,0.0,0,0.5,0.0,10.961725,6.0,480.118347,273,0.853436,0.0,1.061934,124.0,0.0,86014.0,1.5,0.108619,0.5,0.5,0.033882,0.0,0.108163,0.0,640.0,2.76,34.02,52.552074,58.0,0.5,30.0,0.666667,7.573321,163.0,0,120,0.0,0.0,0.0,0.16355,19.45,0.0,0.0,33.795298,0.0,0.0,0,-1.5,0.0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [43]:
train_df.to_csv('data/training_cleaned_v5.csv')