In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
sns.set()
%matplotlib inline

import gc
import os
import warnings
warnings.filterwarnings('ignore')
pd.set_option('max_columns', None)

In [2]:
PATH_TO_DATA = ('D:/Py/DataFrames/Home_Credit_Default_Risk(KAGGLE)/')

# Preprocessing

In [3]:
# One-hot encoding for categorical columns with get_dummies
def one_hot_encoder(df, nan_as_category=False):
    original_columns = list(df.columns)
    categorical_columns = [col for col in df.columns if df[col].dtype == 'object']
    df = pd.get_dummies(df, columns=categorical_columns, dummy_na=nan_as_category)
    new_columns = [c for c in df.columns if c not in original_columns]
    return df, new_columns

In [4]:
# Preprocess application_train.csv and application_test.csv
def application_train_test():
    df = pd.read_csv(os.path.join(PATH_TO_DATA, 'application_train.csv'))
    test_df = pd.read_csv(os.path.join(PATH_TO_DATA, 'application_test.csv'))
    df = df.append(test_df).reset_index(drop=True)
    # Remove 4 applications with XNA CODE_GENDER (train set)
    df = df[df['CODE_GENDER'] != 'XNA']
    
    
    # Preprocessing
    df['NAME_FAMILY_STATUS'].replace('Unknown', 'Single / not married', inplace=True)
    df['ORGANIZATION_TYPE'].replace('XNA', np.nan, inplace=True)
    # NaN values for DAYS_EMPLOYED: 365243 -> nan
    for col in ['DAYS_BIRTH', 'DAYS_EMPLOYED', 'DAYS_REGISTRATION', 'DAYS_ID_PUBLISH']:
        df[col].replace(365243, np.nan, inplace=True)
    
    # Categorical features with Binary encode (0 or 1)
    for bin_feature in ['CODE_GENDER', 'FLAG_OWN_CAR', 'FLAG_OWN_REALTY']:
        df[bin_feature], uniques = pd.factorize(df[bin_feature])
    
    # OHE for other categorical features
    df, cat_cols = one_hot_encoder(df, nan_as_category=False)

    
    # [FEATURES]
    df['birth_employed_gap'] = df['DAYS_BIRTH'] - df['DAYS_EMPLOYED']
    df['birth_registration_gap'] = df['DAYS_BIRTH'] - df['DAYS_REGISTRATION']
    df['birth_car_age_gap'] = df['DAYS_BIRTH'] - df['OWN_CAR_AGE']
    df['birth_last_phone_gap'] = df['DAYS_BIRTH'] - df['DAYS_LAST_PHONE_CHANGE']
    df['last_phone_employed_perc'] = df['DAYS_LAST_PHONE_CHANGE'] / df['DAYS_EMPLOYED']
    
    df['PAYMENT_RATE'] = df['AMT_CREDIT'] / df['AMT_ANNUITY']
    df['CREDIT_INCOME_PERC'] = df['AMT_CREDIT'] / df['AMT_INCOME_TOTAL']
    df['ANNUITY_INCOME_PERC'] = df['AMT_ANNUITY'] / df['AMT_INCOME_TOTAL']
    df['GOODS_PRICE_INCOME_PERC'] = df['AMT_GOODS_PRICE'] / df['AMT_INCOME_TOTAL']
    df['ANNUITY_GOODS_PRICE_PERC'] = df['AMT_ANNUITY'] / df['AMT_GOODS_PRICE']
    df['GOODS_PRICE_CREDIT_PERC'] = df['AMT_CREDIT'] / df['AMT_GOODS_PRICE']
    
    df['INCOME_PER_PERSON'] = df['AMT_INCOME_TOTAL'] / df['CNT_FAM_MEMBERS']
    df['INCOME_PER_CHILD'] = df['AMT_INCOME_TOTAL'] / (1 + df['CNT_CHILDREN']) # to avoid +-np.inf
    df['CREDIT_PER_PERSON'] = df['AMT_CREDIT'] / df['CNT_FAM_MEMBERS']
    df['CREDIT_PER_CHILD'] = df['AMT_CREDIT'] / (1 + df['CNT_CHILDREN']) # to avoid +-np.inf
    df['cnt_non_child'] = df['CNT_FAM_MEMBERS'] - df['CNT_CHILDREN']
    df['child_to_non_child_ratio'] = df['CNT_CHILDREN'] / df['cnt_non_child']
    df['income_per_non_child'] = df['AMT_INCOME_TOTAL'] / df['cnt_non_child']
    df['credit_per_non_child'] = df['AMT_CREDIT'] / df['cnt_non_child']
    
    flags = [_f for _f in df.columns if 'FLAG_' in _f]
    for agg in ['sum', 'mean']:
        df['flags_{}'.format(agg)] = eval('np.{}'.format(agg))(df[flags], axis=1)
    
    sources = ['EXT_SOURCE_1', 'EXT_SOURCE_2', 'EXT_SOURCE_3']
    for agg in ['sum', 'mean', 'median', 'std']:
        df['ext_sources_{}'.format(agg)] = eval('np.{}'.format(agg))(df[sources], axis=1)
    df['ext_sources_prod'] = df['EXT_SOURCE_1'] * df['EXT_SOURCE_2'] * df['EXT_SOURCE_3']
    
    df.drop([
        'FLAG_DOCUMENT_2','FLAG_DOCUMENT_4', 'FLAG_DOCUMENT_5',
        'FLAG_DOCUMENT_6','FLAG_DOCUMENT_7', 'FLAG_DOCUMENT_8',
        'FLAG_DOCUMENT_9','FLAG_DOCUMENT_10', 'FLAG_DOCUMENT_11',
        'FLAG_DOCUMENT_12','FLAG_DOCUMENT_13', 'FLAG_DOCUMENT_14',
        'FLAG_DOCUMENT_15','FLAG_DOCUMENT_16', 'FLAG_DOCUMENT_17',
        'FLAG_DOCUMENT_18','FLAG_DOCUMENT_19', 'FLAG_DOCUMENT_20',
        'FLAG_DOCUMENT_21'], axis=1, inplace=True) #useless
    
    
    del test_df
    gc.collect()
    
    return df

In [5]:
# Preprocess bureau.csv and bureau_balance.csv
def bureau_and_balance():
    bureau = pd.read_csv(os.path.join(PATH_TO_DATA, 'bureau.csv'))
    bb = pd.read_csv(os.path.join(PATH_TO_DATA, 'bureau_balance.csv'))
    
    # [FEATURES]
    bureau['CREDIT_ACTIVE_BINARY'] = (bureau['CREDIT_ACTIVE'] != 'Closed').astype(int)
    bureau['CREDIT_ENDDATE_BINARY'] = (bureau['DAYS_CREDIT_ENDDATE'] > 0).astype(int)
    
    bb, bb_cat_features = one_hot_encoder(bb)
    bureau, bureau_cat_features = one_hot_encoder(bureau)
    
    # Bureau balance: Perform aggregations and merge with bureau.csv
    bb_agregations = {'MONTHS_BALANCE': ['min', 'max', 'size']}
    for col in bb_cat_features: bb_agregations[col] = ['mean']
    bb_agg = bb.groupby('SK_ID_BUREAU').agg(bb_agregations)
    bb_agg.columns = pd.Index([e[0] + "_" + e[1].upper() for e in bb_agg.columns.tolist()])
    bureau = bureau.join(bb_agg, on='SK_ID_BUREAU')
    bureau.drop('SK_ID_BUREAU', axis=1, inplace=True)
    del bb, bb_agg
    gc.collect()
    
    
    # Bureau and bureau_balance numeric features
    num_aggregations = {
        'DAYS_CREDIT': ['count', 'mean', 'var'],
        'DAYS_CREDIT_ENDDATE': ['mean'],
        'DAYS_CREDIT_UPDATE': ['mean'],
        'CREDIT_DAY_OVERDUE': ['mean'],
        'AMT_CREDIT_MAX_OVERDUE': ['mean', 'sum'],
        'AMT_CREDIT_SUM': ['mean', 'sum'],
        'AMT_CREDIT_SUM_DEBT': ['mean', 'sum'],
        'AMT_CREDIT_SUM_OVERDUE': ['mean', 'sum'],
        'AMT_CREDIT_SUM_LIMIT': ['mean', 'sum'],
        'AMT_ANNUITY': ['max', 'mean', 'sum'],
        'CNT_CREDIT_PROLONG': ['sum'],
        'MONTHS_BALANCE_MIN': ['min'],
        'MONTHS_BALANCE_MAX': ['max'],
        'MONTHS_BALANCE_SIZE': ['mean', 'sum'],
        
        'CREDIT_ACTIVE_BINARY': ['mean'],
        'CREDIT_ENDDATE_BINARY': ['mean']
    }
    
    cat_aggregations = {}
    for col in bureau_cat_features: cat_aggregations[col] = ['mean']
    for col in bb_cat_features: cat_aggregations[col + '_MEAN'] = ['mean']
    bureau_agg = bureau.groupby('SK_ID_CURR').agg({**num_aggregations, **cat_aggregations})
    bureau_agg.columns = pd.Index(['BUREAU_' + e[0] + "_" + e[1].upper() for e in bureau_agg.columns.tolist()])
    
    # Bureau: Active credits - using only numerical aggregations
    active = bureau[bureau['CREDIT_ACTIVE_Active'] == 1]
    active_agg = active.groupby('SK_ID_CURR').agg(num_aggregations)
    active_agg.columns = pd.Index(['ACTIVE_' + e[0] + "_" + e[1] for e in active_agg.columns.tolist()])
    bureau_agg = bureau_agg.join(active_agg, on='SK_ID_CURR')
    del active, active_agg
    gc.collect()
    
    # Bureau: Closed credits - using only numerical aggregations
    closed = bureau[bureau['CREDIT_ACTIVE_Closed'] == 1]
    closed_agg = closed.groupby('SK_ID_CURR').agg(num_aggregations)
    closed_agg.columns = pd.Index(['CLOSED_' + e[0] + "_" + e[1] for e in closed_agg.columns.tolist()])
    bureau_agg = bureau_agg.join(closed_agg, on='SK_ID_CURR')
    del closed, closed_agg
    
    
    del bureau
    gc.collect()
    
    return bureau_agg

In [6]:
# Preprocess credit_card_balance.csv
def credit_card_balance():
    cc = pd.read_csv(os.path.join(PATH_TO_DATA, 'credit_card_balance.csv'))
    
    
    # Preprocessing
    for col in ['AMT_BALANCE', 'AMT_DRAWINGS_ATM_CURRENT', 'AMT_DRAWINGS_CURRENT',
                'AMT_RECEIVABLE_PRINCIPAL', 'AMT_RECIVABLE', 'AMT_TOTAL_RECEIVABLE']:
        cc[col] = cc[col].apply(lambda x: x if x > 0 else 0) 
    cc, cc_cat_features = one_hot_encoder(cc)
    
    
    # [FEATURES]
    cc['dpddef_dpd_gap'] = cc['SK_DPD_DEF'] - cc['SK_DPD']
    
    # General aggregations
    cc.drop('SK_ID_PREV', axis=1, inplace=True)
    cc_agg = cc.groupby('SK_ID_CURR').agg(['max', 'mean', 'sum', 'var'])
    cc_agg.columns = pd.Index(['CC_' + e[0] + "_" + e[1] for e in cc_agg.columns.tolist()])
    
    # [FEATURES]
    cc_agg['cc_count'] = cc.groupby('SK_ID_CURR').size()
    
    
    del cc
    gc.collect()
    
    return cc_agg

In [7]:
# Preprocess installments_payments.csv
def installments_payments():
    ins = pd.read_csv(os.path.join(PATH_TO_DATA, 'installments_payments.csv'))
    ins, ins_cat_features = one_hot_encoder(ins)
    
    
    # [FEATURES]
    ins['PAYMENT_PERC'] = ins['AMT_PAYMENT'] / ins['AMT_INSTALMENT']
    ins['PAYMENT_DIFF'] = ins['AMT_PAYMENT'] - ins['AMT_INSTALMENT']
    ins['PAID_OVER'] = (ins['PAYMENT_DIFF'] > 0).astype(int)
    
    # Days past due and days before due (no negative values)
    ins['DPD'] = ins['DAYS_ENTRY_PAYMENT'] - ins['DAYS_INSTALMENT']
    ins['DPD_LATE'] = (ins['DPD'] > 0).astype(int)
    ins['DPD'] = ins['DPD'].apply(lambda x: x if x > 0 else 0)
    ins['DBD'] = ins['DAYS_INSTALMENT'] - ins['DAYS_ENTRY_PAYMENT']
    ins['DBD'] = ins['DBD'].apply(lambda x: x if x > 0 else 0)
    
    # Perform aggregations
    aggregations = {
        'NUM_INSTALMENT_VERSION': ['nunique'],
        'AMT_INSTALMENT': ['max', 'mean', 'sum', 'std'],
        'AMT_PAYMENT': ['min', 'max', 'mean', 'sum', 'std'],
        'DAYS_ENTRY_PAYMENT': ['max', 'mean', 'sum', 'std'],
        
        'PAYMENT_PERC': ['max', 'mean', 'sum', 'std'],
        'PAYMENT_DIFF': ['max', 'mean', 'sum', 'std'],
        'PAID_OVER': ['mean', 'sum'],
        'DPD': ['max', 'mean', 'sum', 'std'],
        'DPD_LATE': ['mean', 'sum'],
        'DBD': ['max', 'mean', 'sum', 'std'],
    }
    
    for col in ins_cat_features: aggregations[col] = ['mean']
    ins_agg = ins.groupby('SK_ID_CURR').agg(aggregations)
    ins_agg.columns = pd.Index(['INSTAL_' + e[0] + "_" + e[1].upper() for e in ins_agg.columns.tolist()])
    
    # [FEATURES]
    ins_agg['install_count'] = ins.groupby('SK_ID_CURR').size()
    
    
    del ins
    gc.collect()
    
    return ins_agg

In [8]:
# Preprocess POS_CASH_balance.csv
def pos_cash():
    pos = pd.read_csv(os.path.join(PATH_TO_DATA, 'POS_CASH_balance.csv'))
    pos, pos_cat_features = one_hot_encoder(pos)
    
    
    # Some aggregations
    aggregations = {
        'MONTHS_BALANCE': ['max', 'mean', 'size'],
        'SK_DPD': ['max', 'mean'],
        'SK_DPD_DEF': ['max', 'mean']
    }
    for col in pos_cat_features: aggregations[col] = ['mean']
    pos_agg = pos.groupby('SK_ID_CURR').agg(aggregations)
    pos_agg.columns = pd.Index(['POS_' + e[0] + "_" + e[1].upper() for e in pos_agg.columns.tolist()])
    
    # [FEATURES]
    pos_agg['pos_cash_acc_count'] = pos.groupby('SK_ID_CURR').size()
    
    del pos
    gc.collect()
    
    return pos_agg

In [9]:
# Preprocess previous_applications.csv
def previous_application():
    prev = pd.read_csv(os.path.join(PATH_TO_DATA, 'previous_application.csv'))
    
    
    # Preprocessing
    # Days 365243 values -> nan
    prev.replace(365243, np.nan, inplace= True)
    prev, prev_cat_features = one_hot_encoder(prev)
    
    
    # [FEATURES]
    prev['APP_CREDIT_PERC'] = prev['AMT_APPLICATION'] / prev['AMT_CREDIT']
    prev['PAYMENT_RATE'] = prev['AMT_ANNUITY'] / prev['AMT_CREDIT'] # my
    prev['ANNUITY_GOODS_PRICE_PERC'] = prev['AMT_ANNUITY'] / prev['AMT_GOODS_PRICE'] #my
    
    # Previous applications numeric features
    num_aggregations = {
        'AMT_ANNUITY': ['max', 'mean'],
        'AMT_APPLICATION': ['max', 'mean'],
        'AMT_CREDIT': ['max', 'mean'],
        'AMT_DOWN_PAYMENT': ['max', 'mean'],
        'AMT_GOODS_PRICE': ['max', 'mean'],
        'HOUR_APPR_PROCESS_START': ['max', 'mean'],
        'RATE_DOWN_PAYMENT': ['max', 'mean'],
        'DAYS_DECISION': ['max', 'mean'],
        'CNT_PAYMENT': ['mean', 'sum'],
        
        'APP_CREDIT_PERC': ['max', 'mean'],
        'PAYMENT_RATE': ['max', 'mean'],
        'ANNUITY_GOODS_PRICE_PERC': ['max', 'mean']
    }
    # Previous applications categorical features
    cat_aggregations = {}
    for col in prev_cat_features: cat_aggregations[col] = ['mean']
    prev_agg = prev.groupby('SK_ID_CURR').agg({**num_aggregations, **cat_aggregations})
    prev_agg.columns = pd.Index(['PREV_' + e[0] + "_" + e[1].upper() for e in prev_agg.columns.tolist()])
    
    # Previous Applications: Approved Applications - only numerical features
    approved = prev[prev['NAME_CONTRACT_STATUS_Approved'] == 1]
    approved_agg = approved.groupby('SK_ID_CURR').agg(num_aggregations)
    approved_agg.columns = pd.Index(['APPROVED_' + e[0] + "_" + e[1].upper() for e in approved_agg.columns.tolist()])
    prev_agg = prev_agg.join(approved_agg, on='SK_ID_CURR')
    del approved, approved_agg
    gc.collect()
    
    # Previous Applications: Refused Applications - only numerical features
    refused = prev[prev['NAME_CONTRACT_STATUS_Refused'] == 1]
    refused_agg = refused.groupby('SK_ID_CURR').agg(num_aggregations)
    refused_agg.columns = pd.Index(['REFUSED_' + e[0] + "_" + e[1].upper() for e in refused_agg.columns.tolist()])
    prev_agg = prev_agg.join(refused_agg, on='SK_ID_CURR')
    
    
    del refused, refused_agg, prev
    gc.collect()
    
    return prev_agg

# Merge and Save

In [25]:
%%time
df = application_train_test()

bureau = bureau_and_balance()
df = df.join(bureau, on='SK_ID_CURR')
del bureau
gc.collect()

prev = previous_application()
df = df.join(prev, on='SK_ID_CURR')
del prev
gc.collect()

pos = pos_cash()
df = df.join(pos, on='SK_ID_CURR')
del pos
gc.collect()

ins = installments_payments()
df = df.join(ins, on='SK_ID_CURR')
del ins
gc.collect()

cc = credit_card_balance()
df = df.join(cc, on='SK_ID_CURR')
del cc
gc.collect()

print('Full DF shape: ', df.shape)

Full DF shape:  (356251, 761)
Wall time: 2min 23s


In [26]:
df.to_csv(os.path.join(PATH_TO_DATA, 'df_all_files.csv'), index=False)

In [33]:
df.head(3)

Unnamed: 0,AMT_ANNUITY,AMT_CREDIT,AMT_GOODS_PRICE,AMT_INCOME_TOTAL,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_YEAR,APARTMENTS_AVG,APARTMENTS_MEDI,APARTMENTS_MODE,BASEMENTAREA_AVG,BASEMENTAREA_MEDI,BASEMENTAREA_MODE,CNT_CHILDREN,CNT_FAM_MEMBERS,CODE_GENDER,COMMONAREA_AVG,COMMONAREA_MEDI,COMMONAREA_MODE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_ID_PUBLISH,DAYS_LAST_PHONE_CHANGE,DAYS_REGISTRATION,DEF_30_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,ELEVATORS_AVG,ELEVATORS_MEDI,ELEVATORS_MODE,ENTRANCES_AVG,ENTRANCES_MEDI,ENTRANCES_MODE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,FLAG_CONT_MOBILE,FLAG_DOCUMENT_3,FLAG_EMAIL,FLAG_EMP_PHONE,FLAG_MOBIL,FLAG_OWN_CAR,FLAG_OWN_REALTY,FLAG_PHONE,FLAG_WORK_PHONE,FLOORSMAX_AVG,FLOORSMAX_MEDI,FLOORSMAX_MODE,FLOORSMIN_AVG,FLOORSMIN_MEDI,FLOORSMIN_MODE,HOUR_APPR_PROCESS_START,LANDAREA_AVG,LANDAREA_MEDI,LANDAREA_MODE,LIVE_CITY_NOT_WORK_CITY,LIVE_REGION_NOT_WORK_REGION,LIVINGAPARTMENTS_AVG,LIVINGAPARTMENTS_MEDI,LIVINGAPARTMENTS_MODE,LIVINGAREA_AVG,LIVINGAREA_MEDI,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_AVG,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_AVG,NONLIVINGAREA_MEDI,NONLIVINGAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE,REGION_POPULATION_RELATIVE,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,SK_ID_CURR,TARGET,TOTALAREA_MODE,YEARS_BEGINEXPLUATATION_AVG,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_AVG,YEARS_BUILD_MEDI,YEARS_BUILD_MODE,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,FONDKAPREMONT_MODE_not specified,FONDKAPREMONT_MODE_org spec account,FONDKAPREMONT_MODE_reg oper account,FONDKAPREMONT_MODE_reg oper spec account,HOUSETYPE_MODE_block of flats,HOUSETYPE_MODE_specific housing,HOUSETYPE_MODE_terraced house,NAME_CONTRACT_TYPE_Cash loans,NAME_CONTRACT_TYPE_Revolving loans,NAME_EDUCATION_TYPE_Academic degree,NAME_EDUCATION_TYPE_Higher education,NAME_EDUCATION_TYPE_Incomplete higher,NAME_EDUCATION_TYPE_Lower secondary,NAME_EDUCATION_TYPE_Secondary / secondary special,NAME_FAMILY_STATUS_Civil marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single / not married,NAME_FAMILY_STATUS_Widow,NAME_HOUSING_TYPE_Co-op apartment,NAME_HOUSING_TYPE_House / apartment,NAME_HOUSING_TYPE_Municipal apartment,NAME_HOUSING_TYPE_Office apartment,NAME_HOUSING_TYPE_Rented apartment,NAME_HOUSING_TYPE_With parents,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial associate,NAME_INCOME_TYPE_Maternity leave,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group of people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse, partner",NAME_TYPE_SUITE_Unaccompanied,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning staff,OCCUPATION_TYPE_Cooking staff,OCCUPATION_TYPE_Core staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR staff,OCCUPATION_TYPE_High skill tech staff,OCCUPATION_TYPE_IT staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine staff,OCCUPATION_TYPE_Private service staff,OCCUPATION_TYPE_Realty agents,OCCUPATION_TYPE_Sales staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security staff,OCCUPATION_TYPE_Waiters/barmen staff,ORGANIZATION_TYPE_Advertising,ORGANIZATION_TYPE_Agriculture,ORGANIZATION_TYPE_Bank,ORGANIZATION_TYPE_Business Entity Type 1,ORGANIZATION_TYPE_Business Entity Type 2,ORGANIZATION_TYPE_Business Entity Type 3,ORGANIZATION_TYPE_Cleaning,ORGANIZATION_TYPE_Construction,ORGANIZATION_TYPE_Culture,ORGANIZATION_TYPE_Electricity,ORGANIZATION_TYPE_Emergency,ORGANIZATION_TYPE_Government,ORGANIZATION_TYPE_Hotel,ORGANIZATION_TYPE_Housing,ORGANIZATION_TYPE_Industry: type 1,ORGANIZATION_TYPE_Industry: type 10,ORGANIZATION_TYPE_Industry: type 11,ORGANIZATION_TYPE_Industry: type 12,ORGANIZATION_TYPE_Industry: type 13,ORGANIZATION_TYPE_Industry: type 2,ORGANIZATION_TYPE_Industry: type 3,ORGANIZATION_TYPE_Industry: type 4,ORGANIZATION_TYPE_Industry: type 5,ORGANIZATION_TYPE_Industry: type 6,ORGANIZATION_TYPE_Industry: type 7,ORGANIZATION_TYPE_Industry: type 8,ORGANIZATION_TYPE_Industry: type 9,ORGANIZATION_TYPE_Insurance,ORGANIZATION_TYPE_Kindergarten,ORGANIZATION_TYPE_Legal Services,ORGANIZATION_TYPE_Medicine,ORGANIZATION_TYPE_Military,ORGANIZATION_TYPE_Mobile,ORGANIZATION_TYPE_Other,ORGANIZATION_TYPE_Police,ORGANIZATION_TYPE_Postal,ORGANIZATION_TYPE_Realtor,ORGANIZATION_TYPE_Religion,ORGANIZATION_TYPE_Restaurant,ORGANIZATION_TYPE_School,ORGANIZATION_TYPE_Security,ORGANIZATION_TYPE_Security Ministries,ORGANIZATION_TYPE_Self-employed,ORGANIZATION_TYPE_Services,ORGANIZATION_TYPE_Telecom,ORGANIZATION_TYPE_Trade: type 1,ORGANIZATION_TYPE_Trade: type 2,ORGANIZATION_TYPE_Trade: type 3,ORGANIZATION_TYPE_Trade: type 4,ORGANIZATION_TYPE_Trade: type 5,ORGANIZATION_TYPE_Trade: type 6,ORGANIZATION_TYPE_Trade: type 7,ORGANIZATION_TYPE_Transport: type 1,ORGANIZATION_TYPE_Transport: type 2,ORGANIZATION_TYPE_Transport: type 3,ORGANIZATION_TYPE_Transport: type 4,ORGANIZATION_TYPE_University,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone, brick",WALLSMATERIAL_MODE_Wooden,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,birth_employed_gap,birth_registration_gap,birth_car_age_gap,birth_last_phone_gap,last_phone_employed_perc,PAYMENT_RATE,CREDIT_INCOME_PERC,ANNUITY_INCOME_PERC,GOODS_PRICE_INCOME_PERC,ANNUITY_GOODS_PRICE_PERC,GOODS_PRICE_CREDIT_PERC,INCOME_PER_PERSON,INCOME_PER_CHILD,CREDIT_PER_PERSON,CREDIT_PER_CHILD,cnt_non_child,child_to_non_child_ratio,income_per_non_child,credit_per_non_child,flags_sum,flags_mean,ext_sources_sum,ext_sources_mean,ext_sources_median,ext_sources_std,ext_sources_prod,BUREAU_DAYS_CREDIT_COUNT,BUREAU_DAYS_CREDIT_MEAN,BUREAU_DAYS_CREDIT_VAR,BUREAU_DAYS_CREDIT_ENDDATE_MEAN,BUREAU_DAYS_CREDIT_UPDATE_MEAN,BUREAU_CREDIT_DAY_OVERDUE_MEAN,BUREAU_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_AMT_CREDIT_MAX_OVERDUE_SUM,BUREAU_AMT_CREDIT_SUM_MEAN,BUREAU_AMT_CREDIT_SUM_SUM,BUREAU_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_OVERDUE_SUM,BUREAU_AMT_CREDIT_SUM_LIMIT_MEAN,BUREAU_AMT_CREDIT_SUM_LIMIT_SUM,BUREAU_AMT_ANNUITY_MAX,BUREAU_AMT_ANNUITY_MEAN,BUREAU_AMT_ANNUITY_SUM,BUREAU_CNT_CREDIT_PROLONG_SUM,BUREAU_MONTHS_BALANCE_MIN_MIN,BUREAU_MONTHS_BALANCE_MAX_MAX,BUREAU_MONTHS_BALANCE_SIZE_MEAN,BUREAU_MONTHS_BALANCE_SIZE_SUM,BUREAU_CREDIT_ACTIVE_BINARY_MEAN,BUREAU_CREDIT_ENDDATE_BINARY_MEAN,BUREAU_CREDIT_ACTIVE_Active_MEAN,BUREAU_CREDIT_ACTIVE_Bad debt_MEAN,BUREAU_CREDIT_ACTIVE_Closed_MEAN,BUREAU_CREDIT_ACTIVE_Sold_MEAN,BUREAU_CREDIT_ACTIVE_nan_MEAN,BUREAU_CREDIT_CURRENCY_currency 1_MEAN,BUREAU_CREDIT_CURRENCY_currency 2_MEAN,BUREAU_CREDIT_CURRENCY_currency 3_MEAN,BUREAU_CREDIT_CURRENCY_currency 4_MEAN,BUREAU_CREDIT_CURRENCY_nan_MEAN,BUREAU_CREDIT_TYPE_Another type of loan_MEAN,BUREAU_CREDIT_TYPE_Car loan_MEAN,BUREAU_CREDIT_TYPE_Cash loan (non-earmarked)_MEAN,BUREAU_CREDIT_TYPE_Consumer credit_MEAN,BUREAU_CREDIT_TYPE_Credit card_MEAN,BUREAU_CREDIT_TYPE_Interbank credit_MEAN,BUREAU_CREDIT_TYPE_Loan for business development_MEAN,BUREAU_CREDIT_TYPE_Loan for purchase of shares (margin lending)_MEAN,BUREAU_CREDIT_TYPE_Loan for the purchase of equipment_MEAN,BUREAU_CREDIT_TYPE_Loan for working capital replenishment_MEAN,BUREAU_CREDIT_TYPE_Microloan_MEAN,BUREAU_CREDIT_TYPE_Mobile operator loan_MEAN,BUREAU_CREDIT_TYPE_Mortgage_MEAN,BUREAU_CREDIT_TYPE_Real estate loan_MEAN,BUREAU_CREDIT_TYPE_Unknown type of loan_MEAN,BUREAU_CREDIT_TYPE_nan_MEAN,BUREAU_STATUS_0_MEAN_MEAN,BUREAU_STATUS_1_MEAN_MEAN,BUREAU_STATUS_2_MEAN_MEAN,BUREAU_STATUS_3_MEAN_MEAN,BUREAU_STATUS_4_MEAN_MEAN,BUREAU_STATUS_5_MEAN_MEAN,BUREAU_STATUS_C_MEAN_MEAN,BUREAU_STATUS_X_MEAN_MEAN,BUREAU_STATUS_nan_MEAN_MEAN,ACTIVE_DAYS_CREDIT_count,ACTIVE_DAYS_CREDIT_mean,ACTIVE_DAYS_CREDIT_var,ACTIVE_DAYS_CREDIT_ENDDATE_mean,ACTIVE_DAYS_CREDIT_UPDATE_mean,ACTIVE_CREDIT_DAY_OVERDUE_mean,ACTIVE_AMT_CREDIT_MAX_OVERDUE_mean,ACTIVE_AMT_CREDIT_MAX_OVERDUE_sum,ACTIVE_AMT_CREDIT_SUM_mean,ACTIVE_AMT_CREDIT_SUM_sum,ACTIVE_AMT_CREDIT_SUM_DEBT_mean,ACTIVE_AMT_CREDIT_SUM_DEBT_sum,ACTIVE_AMT_CREDIT_SUM_OVERDUE_mean,ACTIVE_AMT_CREDIT_SUM_OVERDUE_sum,ACTIVE_AMT_CREDIT_SUM_LIMIT_mean,ACTIVE_AMT_CREDIT_SUM_LIMIT_sum,ACTIVE_AMT_ANNUITY_max,ACTIVE_AMT_ANNUITY_mean,ACTIVE_AMT_ANNUITY_sum,ACTIVE_CNT_CREDIT_PROLONG_sum,ACTIVE_MONTHS_BALANCE_MIN_min,ACTIVE_MONTHS_BALANCE_MAX_max,ACTIVE_MONTHS_BALANCE_SIZE_mean,ACTIVE_MONTHS_BALANCE_SIZE_sum,ACTIVE_CREDIT_ACTIVE_BINARY_mean,ACTIVE_CREDIT_ENDDATE_BINARY_mean,CLOSED_DAYS_CREDIT_count,CLOSED_DAYS_CREDIT_mean,CLOSED_DAYS_CREDIT_var,CLOSED_DAYS_CREDIT_ENDDATE_mean,CLOSED_DAYS_CREDIT_UPDATE_mean,CLOSED_CREDIT_DAY_OVERDUE_mean,CLOSED_AMT_CREDIT_MAX_OVERDUE_mean,CLOSED_AMT_CREDIT_MAX_OVERDUE_sum,CLOSED_AMT_CREDIT_SUM_mean,CLOSED_AMT_CREDIT_SUM_sum,CLOSED_AMT_CREDIT_SUM_DEBT_mean,CLOSED_AMT_CREDIT_SUM_DEBT_sum,CLOSED_AMT_CREDIT_SUM_OVERDUE_mean,CLOSED_AMT_CREDIT_SUM_OVERDUE_sum,CLOSED_AMT_CREDIT_SUM_LIMIT_mean,CLOSED_AMT_CREDIT_SUM_LIMIT_sum,CLOSED_AMT_ANNUITY_max,CLOSED_AMT_ANNUITY_mean,CLOSED_AMT_ANNUITY_sum,CLOSED_CNT_CREDIT_PROLONG_sum,CLOSED_MONTHS_BALANCE_MIN_min,CLOSED_MONTHS_BALANCE_MAX_max,CLOSED_MONTHS_BALANCE_SIZE_mean,CLOSED_MONTHS_BALANCE_SIZE_sum,CLOSED_CREDIT_ACTIVE_BINARY_mean,CLOSED_CREDIT_ENDDATE_BINARY_mean,PREV_AMT_ANNUITY_MAX,PREV_AMT_ANNUITY_MEAN,PREV_AMT_APPLICATION_MAX,PREV_AMT_APPLICATION_MEAN,PREV_AMT_CREDIT_MAX,PREV_AMT_CREDIT_MEAN,PREV_AMT_DOWN_PAYMENT_MAX,PREV_AMT_DOWN_PAYMENT_MEAN,PREV_AMT_GOODS_PRICE_MAX,PREV_AMT_GOODS_PRICE_MEAN,PREV_HOUR_APPR_PROCESS_START_MAX,PREV_HOUR_APPR_PROCESS_START_MEAN,PREV_RATE_DOWN_PAYMENT_MAX,PREV_RATE_DOWN_PAYMENT_MEAN,PREV_DAYS_DECISION_MAX,PREV_DAYS_DECISION_MEAN,PREV_CNT_PAYMENT_MEAN,PREV_CNT_PAYMENT_SUM,PREV_APP_CREDIT_PERC_MAX,PREV_APP_CREDIT_PERC_MEAN,PREV_PAYMENT_RATE_MAX,PREV_PAYMENT_RATE_MEAN,PREV_ANNUITY_GOODS_PRICE_PERC_MAX,PREV_ANNUITY_GOODS_PRICE_PERC_MEAN,PREV_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_NAME_CONTRACT_TYPE_XNA_MEAN,PREV_NAME_CONTRACT_TYPE_nan_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_nan_MEAN,PREV_FLAG_LAST_APPL_PER_CONTRACT_N_MEAN,PREV_FLAG_LAST_APPL_PER_CONTRACT_Y_MEAN,PREV_FLAG_LAST_APPL_PER_CONTRACT_nan_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Building a house or an annex_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Business development_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a garage_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a holiday home / land_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a home_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a new car_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a used car_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Car repairs_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Education_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Everyday expenses_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Furniture_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Gasification / water supply_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Hobby_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Journey_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Medicine_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Money for a third person_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Other_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Payments on other loans_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Purchase of electronic equipment_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Refusal to name the goal_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Repairs_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Urgent needs_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Wedding / gift / holiday_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_XAP_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_XNA_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_nan_MEAN,PREV_NAME_CONTRACT_STATUS_Approved_MEAN,PREV_NAME_CONTRACT_STATUS_Canceled_MEAN,PREV_NAME_CONTRACT_STATUS_Refused_MEAN,PREV_NAME_CONTRACT_STATUS_Unused offer_MEAN,PREV_NAME_CONTRACT_STATUS_nan_MEAN,PREV_NAME_PAYMENT_TYPE_Cash through the bank_MEAN,PREV_NAME_PAYMENT_TYPE_Cashless from the account of the employer_MEAN,PREV_NAME_PAYMENT_TYPE_Non-cash from your account_MEAN,PREV_NAME_PAYMENT_TYPE_XNA_MEAN,PREV_NAME_PAYMENT_TYPE_nan_MEAN,PREV_CODE_REJECT_REASON_CLIENT_MEAN,PREV_CODE_REJECT_REASON_HC_MEAN,PREV_CODE_REJECT_REASON_LIMIT_MEAN,PREV_CODE_REJECT_REASON_SCO_MEAN,PREV_CODE_REJECT_REASON_SCOFR_MEAN,PREV_CODE_REJECT_REASON_SYSTEM_MEAN,PREV_CODE_REJECT_REASON_VERIF_MEAN,PREV_CODE_REJECT_REASON_XAP_MEAN,PREV_CODE_REJECT_REASON_XNA_MEAN,PREV_CODE_REJECT_REASON_nan_MEAN,PREV_NAME_TYPE_SUITE_Children_MEAN,PREV_NAME_TYPE_SUITE_Family_MEAN,PREV_NAME_TYPE_SUITE_Group of people_MEAN,PREV_NAME_TYPE_SUITE_Other_A_MEAN,PREV_NAME_TYPE_SUITE_Other_B_MEAN,"PREV_NAME_TYPE_SUITE_Spouse, partner_MEAN",PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN,PREV_NAME_TYPE_SUITE_nan_MEAN,PREV_NAME_CLIENT_TYPE_New_MEAN,PREV_NAME_CLIENT_TYPE_Refreshed_MEAN,PREV_NAME_CLIENT_TYPE_Repeater_MEAN,PREV_NAME_CLIENT_TYPE_XNA_MEAN,PREV_NAME_CLIENT_TYPE_nan_MEAN,PREV_NAME_GOODS_CATEGORY_Additional Service_MEAN,PREV_NAME_GOODS_CATEGORY_Animals_MEAN,PREV_NAME_GOODS_CATEGORY_Audio/Video_MEAN,PREV_NAME_GOODS_CATEGORY_Auto Accessories_MEAN,PREV_NAME_GOODS_CATEGORY_Clothing and Accessories_MEAN,PREV_NAME_GOODS_CATEGORY_Computers_MEAN,PREV_NAME_GOODS_CATEGORY_Construction Materials_MEAN,PREV_NAME_GOODS_CATEGORY_Consumer Electronics_MEAN,PREV_NAME_GOODS_CATEGORY_Direct Sales_MEAN,PREV_NAME_GOODS_CATEGORY_Education_MEAN,PREV_NAME_GOODS_CATEGORY_Fitness_MEAN,PREV_NAME_GOODS_CATEGORY_Furniture_MEAN,PREV_NAME_GOODS_CATEGORY_Gardening_MEAN,PREV_NAME_GOODS_CATEGORY_Homewares_MEAN,PREV_NAME_GOODS_CATEGORY_House Construction_MEAN,PREV_NAME_GOODS_CATEGORY_Insurance_MEAN,PREV_NAME_GOODS_CATEGORY_Jewelry_MEAN,PREV_NAME_GOODS_CATEGORY_Medical Supplies_MEAN,PREV_NAME_GOODS_CATEGORY_Medicine_MEAN,PREV_NAME_GOODS_CATEGORY_Mobile_MEAN,PREV_NAME_GOODS_CATEGORY_Office Appliances_MEAN,PREV_NAME_GOODS_CATEGORY_Other_MEAN,PREV_NAME_GOODS_CATEGORY_Photo / Cinema Equipment_MEAN,PREV_NAME_GOODS_CATEGORY_Sport and Leisure_MEAN,PREV_NAME_GOODS_CATEGORY_Tourism_MEAN,PREV_NAME_GOODS_CATEGORY_Vehicles_MEAN,PREV_NAME_GOODS_CATEGORY_Weapon_MEAN,PREV_NAME_GOODS_CATEGORY_XNA_MEAN,PREV_NAME_GOODS_CATEGORY_nan_MEAN,PREV_NAME_PORTFOLIO_Cards_MEAN,PREV_NAME_PORTFOLIO_Cars_MEAN,PREV_NAME_PORTFOLIO_Cash_MEAN,PREV_NAME_PORTFOLIO_POS_MEAN,PREV_NAME_PORTFOLIO_XNA_MEAN,PREV_NAME_PORTFOLIO_nan_MEAN,PREV_NAME_PRODUCT_TYPE_XNA_MEAN,PREV_NAME_PRODUCT_TYPE_walk-in_MEAN,PREV_NAME_PRODUCT_TYPE_x-sell_MEAN,PREV_NAME_PRODUCT_TYPE_nan_MEAN,PREV_CHANNEL_TYPE_AP+ (Cash loan)_MEAN,PREV_CHANNEL_TYPE_Car dealer_MEAN,PREV_CHANNEL_TYPE_Channel of corporate sales_MEAN,PREV_CHANNEL_TYPE_Contact center_MEAN,PREV_CHANNEL_TYPE_Country-wide_MEAN,PREV_CHANNEL_TYPE_Credit and cash offices_MEAN,PREV_CHANNEL_TYPE_Regional / Local_MEAN,PREV_CHANNEL_TYPE_Stone_MEAN,PREV_CHANNEL_TYPE_nan_MEAN,PREV_NAME_SELLER_INDUSTRY_Auto technology_MEAN,PREV_NAME_SELLER_INDUSTRY_Clothing_MEAN,PREV_NAME_SELLER_INDUSTRY_Connectivity_MEAN,PREV_NAME_SELLER_INDUSTRY_Construction_MEAN,PREV_NAME_SELLER_INDUSTRY_Consumer electronics_MEAN,PREV_NAME_SELLER_INDUSTRY_Furniture_MEAN,PREV_NAME_SELLER_INDUSTRY_Industry_MEAN,PREV_NAME_SELLER_INDUSTRY_Jewelry_MEAN,PREV_NAME_SELLER_INDUSTRY_MLM partners_MEAN,PREV_NAME_SELLER_INDUSTRY_Tourism_MEAN,PREV_NAME_SELLER_INDUSTRY_XNA_MEAN,PREV_NAME_SELLER_INDUSTRY_nan_MEAN,PREV_NAME_YIELD_GROUP_XNA_MEAN,PREV_NAME_YIELD_GROUP_high_MEAN,PREV_NAME_YIELD_GROUP_low_action_MEAN,PREV_NAME_YIELD_GROUP_low_normal_MEAN,PREV_NAME_YIELD_GROUP_middle_MEAN,PREV_NAME_YIELD_GROUP_nan_MEAN,PREV_PRODUCT_COMBINATION_Card Street_MEAN,PREV_PRODUCT_COMBINATION_Card X-Sell_MEAN,PREV_PRODUCT_COMBINATION_Cash_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: high_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: low_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: middle_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: high_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: low_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: middle_MEAN,PREV_PRODUCT_COMBINATION_POS household with interest_MEAN,PREV_PRODUCT_COMBINATION_POS household without interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry with interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry without interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile with interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile without interest_MEAN,PREV_PRODUCT_COMBINATION_POS other with interest_MEAN,PREV_PRODUCT_COMBINATION_POS others without interest_MEAN,PREV_PRODUCT_COMBINATION_nan_MEAN,APPROVED_AMT_ANNUITY_MAX,APPROVED_AMT_ANNUITY_MEAN,APPROVED_AMT_APPLICATION_MAX,APPROVED_AMT_APPLICATION_MEAN,APPROVED_AMT_CREDIT_MAX,APPROVED_AMT_CREDIT_MEAN,APPROVED_AMT_DOWN_PAYMENT_MAX,APPROVED_AMT_DOWN_PAYMENT_MEAN,APPROVED_AMT_GOODS_PRICE_MAX,APPROVED_AMT_GOODS_PRICE_MEAN,APPROVED_HOUR_APPR_PROCESS_START_MAX,APPROVED_HOUR_APPR_PROCESS_START_MEAN,APPROVED_RATE_DOWN_PAYMENT_MAX,APPROVED_RATE_DOWN_PAYMENT_MEAN,APPROVED_DAYS_DECISION_MAX,APPROVED_DAYS_DECISION_MEAN,APPROVED_CNT_PAYMENT_MEAN,APPROVED_CNT_PAYMENT_SUM,APPROVED_APP_CREDIT_PERC_MAX,APPROVED_APP_CREDIT_PERC_MEAN,APPROVED_PAYMENT_RATE_MAX,APPROVED_PAYMENT_RATE_MEAN,APPROVED_ANNUITY_GOODS_PRICE_PERC_MAX,APPROVED_ANNUITY_GOODS_PRICE_PERC_MEAN,REFUSED_AMT_ANNUITY_MAX,REFUSED_AMT_ANNUITY_MEAN,REFUSED_AMT_APPLICATION_MAX,REFUSED_AMT_APPLICATION_MEAN,REFUSED_AMT_CREDIT_MAX,REFUSED_AMT_CREDIT_MEAN,REFUSED_AMT_DOWN_PAYMENT_MAX,REFUSED_AMT_DOWN_PAYMENT_MEAN,REFUSED_AMT_GOODS_PRICE_MAX,REFUSED_AMT_GOODS_PRICE_MEAN,REFUSED_HOUR_APPR_PROCESS_START_MAX,REFUSED_HOUR_APPR_PROCESS_START_MEAN,REFUSED_RATE_DOWN_PAYMENT_MAX,REFUSED_RATE_DOWN_PAYMENT_MEAN,REFUSED_DAYS_DECISION_MAX,REFUSED_DAYS_DECISION_MEAN,REFUSED_CNT_PAYMENT_MEAN,REFUSED_CNT_PAYMENT_SUM,REFUSED_APP_CREDIT_PERC_MAX,REFUSED_APP_CREDIT_PERC_MEAN,REFUSED_PAYMENT_RATE_MAX,REFUSED_PAYMENT_RATE_MEAN,REFUSED_ANNUITY_GOODS_PRICE_PERC_MAX,REFUSED_ANNUITY_GOODS_PRICE_PERC_MEAN,POS_MONTHS_BALANCE_MAX,POS_MONTHS_BALANCE_MEAN,POS_MONTHS_BALANCE_SIZE,POS_SK_DPD_MAX,POS_SK_DPD_MEAN,POS_SK_DPD_DEF_MAX,POS_SK_DPD_DEF_MEAN,POS_NAME_CONTRACT_STATUS_Active_MEAN,POS_NAME_CONTRACT_STATUS_Amortized debt_MEAN,POS_NAME_CONTRACT_STATUS_Approved_MEAN,POS_NAME_CONTRACT_STATUS_Canceled_MEAN,POS_NAME_CONTRACT_STATUS_Completed_MEAN,POS_NAME_CONTRACT_STATUS_Demand_MEAN,POS_NAME_CONTRACT_STATUS_Returned to the store_MEAN,POS_NAME_CONTRACT_STATUS_Signed_MEAN,POS_NAME_CONTRACT_STATUS_XNA_MEAN,POS_NAME_CONTRACT_STATUS_nan_MEAN,pos_cash_acc_count,INSTAL_NUM_INSTALMENT_VERSION_NUNIQUE,INSTAL_AMT_INSTALMENT_MAX,INSTAL_AMT_INSTALMENT_MEAN,INSTAL_AMT_INSTALMENT_SUM,INSTAL_AMT_INSTALMENT_STD,INSTAL_AMT_PAYMENT_MIN,INSTAL_AMT_PAYMENT_MAX,INSTAL_AMT_PAYMENT_MEAN,INSTAL_AMT_PAYMENT_SUM,INSTAL_AMT_PAYMENT_STD,INSTAL_DAYS_ENTRY_PAYMENT_MAX,INSTAL_DAYS_ENTRY_PAYMENT_MEAN,INSTAL_DAYS_ENTRY_PAYMENT_SUM,INSTAL_DAYS_ENTRY_PAYMENT_STD,INSTAL_PAYMENT_PERC_MAX,INSTAL_PAYMENT_PERC_MEAN,INSTAL_PAYMENT_PERC_SUM,INSTAL_PAYMENT_PERC_STD,INSTAL_PAYMENT_DIFF_MAX,INSTAL_PAYMENT_DIFF_MEAN,INSTAL_PAYMENT_DIFF_SUM,INSTAL_PAYMENT_DIFF_STD,INSTAL_PAID_OVER_MEAN,INSTAL_PAID_OVER_SUM,INSTAL_DPD_MAX,INSTAL_DPD_MEAN,INSTAL_DPD_SUM,INSTAL_DPD_STD,INSTAL_DPD_LATE_MEAN,INSTAL_DPD_LATE_SUM,INSTAL_DBD_MAX,INSTAL_DBD_MEAN,INSTAL_DBD_SUM,INSTAL_DBD_STD,install_count,CC_MONTHS_BALANCE_max,CC_MONTHS_BALANCE_mean,CC_MONTHS_BALANCE_sum,CC_MONTHS_BALANCE_var,CC_AMT_BALANCE_max,CC_AMT_BALANCE_mean,CC_AMT_BALANCE_sum,CC_AMT_BALANCE_var,CC_AMT_CREDIT_LIMIT_ACTUAL_max,CC_AMT_CREDIT_LIMIT_ACTUAL_mean,CC_AMT_CREDIT_LIMIT_ACTUAL_sum,CC_AMT_CREDIT_LIMIT_ACTUAL_var,CC_AMT_DRAWINGS_ATM_CURRENT_max,CC_AMT_DRAWINGS_ATM_CURRENT_mean,CC_AMT_DRAWINGS_ATM_CURRENT_sum,CC_AMT_DRAWINGS_ATM_CURRENT_var,CC_AMT_DRAWINGS_CURRENT_max,CC_AMT_DRAWINGS_CURRENT_mean,CC_AMT_DRAWINGS_CURRENT_sum,CC_AMT_DRAWINGS_CURRENT_var,CC_AMT_DRAWINGS_OTHER_CURRENT_max,CC_AMT_DRAWINGS_OTHER_CURRENT_mean,CC_AMT_DRAWINGS_OTHER_CURRENT_sum,CC_AMT_DRAWINGS_OTHER_CURRENT_var,CC_AMT_DRAWINGS_POS_CURRENT_max,CC_AMT_DRAWINGS_POS_CURRENT_mean,CC_AMT_DRAWINGS_POS_CURRENT_sum,CC_AMT_DRAWINGS_POS_CURRENT_var,CC_AMT_INST_MIN_REGULARITY_max,CC_AMT_INST_MIN_REGULARITY_mean,CC_AMT_INST_MIN_REGULARITY_sum,CC_AMT_INST_MIN_REGULARITY_var,CC_AMT_PAYMENT_CURRENT_max,CC_AMT_PAYMENT_CURRENT_mean,CC_AMT_PAYMENT_CURRENT_sum,CC_AMT_PAYMENT_CURRENT_var,CC_AMT_PAYMENT_TOTAL_CURRENT_max,CC_AMT_PAYMENT_TOTAL_CURRENT_mean,CC_AMT_PAYMENT_TOTAL_CURRENT_sum,CC_AMT_PAYMENT_TOTAL_CURRENT_var,CC_AMT_RECEIVABLE_PRINCIPAL_max,CC_AMT_RECEIVABLE_PRINCIPAL_mean,CC_AMT_RECEIVABLE_PRINCIPAL_sum,CC_AMT_RECEIVABLE_PRINCIPAL_var,CC_AMT_RECIVABLE_max,CC_AMT_RECIVABLE_mean,CC_AMT_RECIVABLE_sum,CC_AMT_RECIVABLE_var,CC_AMT_TOTAL_RECEIVABLE_max,CC_AMT_TOTAL_RECEIVABLE_mean,CC_AMT_TOTAL_RECEIVABLE_sum,CC_AMT_TOTAL_RECEIVABLE_var,CC_CNT_DRAWINGS_ATM_CURRENT_max,CC_CNT_DRAWINGS_ATM_CURRENT_mean,CC_CNT_DRAWINGS_ATM_CURRENT_sum,CC_CNT_DRAWINGS_ATM_CURRENT_var,CC_CNT_DRAWINGS_CURRENT_max,CC_CNT_DRAWINGS_CURRENT_mean,CC_CNT_DRAWINGS_CURRENT_sum,CC_CNT_DRAWINGS_CURRENT_var,CC_CNT_DRAWINGS_OTHER_CURRENT_max,CC_CNT_DRAWINGS_OTHER_CURRENT_mean,CC_CNT_DRAWINGS_OTHER_CURRENT_sum,CC_CNT_DRAWINGS_OTHER_CURRENT_var,CC_CNT_DRAWINGS_POS_CURRENT_max,CC_CNT_DRAWINGS_POS_CURRENT_mean,CC_CNT_DRAWINGS_POS_CURRENT_sum,CC_CNT_DRAWINGS_POS_CURRENT_var,CC_CNT_INSTALMENT_MATURE_CUM_max,CC_CNT_INSTALMENT_MATURE_CUM_mean,CC_CNT_INSTALMENT_MATURE_CUM_sum,CC_CNT_INSTALMENT_MATURE_CUM_var,CC_SK_DPD_max,CC_SK_DPD_mean,CC_SK_DPD_sum,CC_SK_DPD_var,CC_SK_DPD_DEF_max,CC_SK_DPD_DEF_mean,CC_SK_DPD_DEF_sum,CC_SK_DPD_DEF_var,CC_NAME_CONTRACT_STATUS_Active_max,CC_NAME_CONTRACT_STATUS_Active_mean,CC_NAME_CONTRACT_STATUS_Active_sum,CC_NAME_CONTRACT_STATUS_Active_var,CC_NAME_CONTRACT_STATUS_Approved_max,CC_NAME_CONTRACT_STATUS_Approved_mean,CC_NAME_CONTRACT_STATUS_Approved_sum,CC_NAME_CONTRACT_STATUS_Approved_var,CC_NAME_CONTRACT_STATUS_Completed_max,CC_NAME_CONTRACT_STATUS_Completed_mean,CC_NAME_CONTRACT_STATUS_Completed_sum,CC_NAME_CONTRACT_STATUS_Completed_var,CC_NAME_CONTRACT_STATUS_Demand_max,CC_NAME_CONTRACT_STATUS_Demand_mean,CC_NAME_CONTRACT_STATUS_Demand_sum,CC_NAME_CONTRACT_STATUS_Demand_var,CC_NAME_CONTRACT_STATUS_Refused_max,CC_NAME_CONTRACT_STATUS_Refused_mean,CC_NAME_CONTRACT_STATUS_Refused_sum,CC_NAME_CONTRACT_STATUS_Refused_var,CC_NAME_CONTRACT_STATUS_Sent proposal_max,CC_NAME_CONTRACT_STATUS_Sent proposal_mean,CC_NAME_CONTRACT_STATUS_Sent proposal_sum,CC_NAME_CONTRACT_STATUS_Sent proposal_var,CC_NAME_CONTRACT_STATUS_Signed_max,CC_NAME_CONTRACT_STATUS_Signed_mean,CC_NAME_CONTRACT_STATUS_Signed_sum,CC_NAME_CONTRACT_STATUS_Signed_var,CC_NAME_CONTRACT_STATUS_nan_max,CC_NAME_CONTRACT_STATUS_nan_mean,CC_NAME_CONTRACT_STATUS_nan_sum,CC_NAME_CONTRACT_STATUS_nan_var,CC_dpddef_dpd_gap_max,CC_dpddef_dpd_gap_mean,CC_dpddef_dpd_gap_sum,CC_dpddef_dpd_gap_var,cc_count
0,24700.5,406597.5,351000.0,202500.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0247,0.025,0.0252,0.0369,0.0369,0.0383,0,1.0,0,0.0143,0.0144,0.0144,-9461,-637.0,-2120,-1134.0,-3648.0,2.0,2.0,0.0,0.0,0.0,0.069,0.069,0.069,0.083037,0.262949,0.139376,1,1,0,1,1,0,0,1,0,0.0833,0.0833,0.0833,0.125,0.125,0.125,10,0.0369,0.0375,0.0377,0,0,0.0202,0.0205,0.022,0.019,0.0193,0.0198,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,,0.018801,2,2,0,0,0,0,100002,1.0,0.0149,0.9722,0.9722,0.9722,0.6192,0.6243,0.6341,1,0,0,0,1,0,1,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,-8824.0,-5813.0,,-8327.0,1.78022,16.461104,2.007889,0.121978,1.733333,0.070372,1.158397,202500.0,202500.0,406597.5,406597.5,1.0,0.0,202500.0,406597.5,5,0.178571,0.485361,0.161787,0.139376,0.075139,0.003043,8.0,-874.0,186150.0,-349.0,-499.875,0.0,1681.029,8405.145,108131.945625,865055.565,49156.2,245781.0,0.0,0.0,7997.14125,31988.565,0.0,0.0,0.0,0.0,-47.0,0.0,13.75,110.0,0.25,0.375,0.25,0.0,0.75,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.40696,0.255682,0.0,0.0,0.0,0.0,0.175426,0.161932,0.0,2.0,-572.5,440860.5,780.0,-15.5,0.0,40.5,40.5,240994.2825,481988.565,122890.5,245781.0,0.0,0.0,15994.2825,31988.565,0.0,0.0,0.0,0.0,-34.0,0.0,10.0,20.0,1.0,0.5,6.0,-974.5,123956.7,-574.8,-661.333333,0.0,2091.16125,8364.645,63844.5,383067.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-47.0,0.0,15.0,90.0,0.0,0.333333,9251.775,9251.775,179055.0,179055.0,179055.0,179055.0,0.0,0.0,179055.0,179055.0,9.0,9.0,0.0,0.0,-606.0,-606.0,24.0,24.0,1.0,1.0,0.05167,0.05167,0.05167,0.05167,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,9251.775,9251.775,179055.0,179055.0,179055.0,179055.0,0.0,0.0,179055.0,179055.0,9.0,9.0,0.0,0.0,-606.0,-606.0,24.0,24.0,1.0,1.0,0.05167,0.05167,0.05167,0.05167,,,,,,,,,,,,,,,,,,,,,,,,,-1.0,-10.0,19.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,2.0,53093.745,11559.247105,219625.695,10058.037722,9251.775,53093.745,11559.247105,219625.695,10058.037722,-49.0,-315.421053,-5993.0,172.058877,1.0,1.0,19.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,31.0,20.421053,388.0,4.925171,19.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,35698.5,1293502.5,1129500.0,270000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0959,0.0968,0.0924,0.0529,0.0529,0.0538,0,2.0,1,0.0605,0.0608,0.0497,-16765,-1188.0,-291,-828.0,-1186.0,0.0,0.0,0.08,0.08,0.0806,0.0345,0.0345,0.0345,0.311267,0.622246,,1,1,0,1,1,0,1,1,0,0.2917,0.2917,0.2917,0.3333,0.3333,0.3333,11,0.013,0.0132,0.0128,0,0,0.0773,0.0787,0.079,0.0549,0.0558,0.0554,0.0039,0.0039,0.0,0.0098,0.01,0.0,1.0,1.0,,0.003541,1,1,0,0,0,0,100003,0.0,0.0714,0.9851,0.9851,0.9851,0.796,0.7987,0.804,1,0,0,0,1,0,1,0,0,1,0,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,-15577.0,-15579.0,,-15937.0,0.69697,36.234085,4.79075,0.132217,4.183333,0.031606,1.145199,135000.0,270000.0,646751.25,1293502.5,2.0,0.0,135000.0,646751.25,6,0.214286,0.933513,0.466757,,0.155489,,4.0,-1400.75,827783.583333,-544.5,-816.0,0.0,0.0,0.0,254350.125,1017400.5,0.0,0.0,0.0,0.0,202500.0,810000.0,,,0.0,0.0,,,,0.0,0.25,0.25,0.25,0.0,0.75,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,1.0,-606.0,,1216.0,-43.0,0.0,0.0,0.0,810000.0,810000.0,0.0,0.0,0.0,0.0,810000.0,810000.0,,,0.0,0.0,,,,0.0,1.0,1.0,3.0,-1665.666667,820590.333333,-1131.333333,-1073.666667,0.0,0.0,0.0,69133.5,207400.5,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,,,,0.0,0.0,0.0,98356.995,56553.99,900000.0,435436.5,1035882.0,484191.0,6885.0,3442.5,900000.0,435436.5,17.0,14.666667,0.100061,0.05003,-746.0,-1305.0,10.0,30.0,1.011109,0.949329,0.1852,0.126383,0.191312,0.132837,0.333333,0.666667,0.0,0.0,0.0,0.333333,0.0,0.333333,0.333333,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.666667,0.333333,0.0,1.0,0.0,0.0,0.0,0.0,0.666667,0.0,0.0,0.333333,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.666667,0.0,0.0,0.0,0.0,0.333333,0.0,0.0,0.666667,0.333333,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.333333,0.0,0.0,0.0,0.333333,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.333333,0.0,0.0,0.0,0.333333,0.666667,0.0,0.0,0.666667,0.0,0.333333,0.0,0.0,0.0,0.0,0.0,0.333333,0.333333,0.0,0.333333,0.0,0.0,0.0,0.0,0.0,0.333333,0.333333,0.0,0.0,0.0,0.0,0.333333,0.0,0.0,0.0,0.0,0.333333,0.666667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.333333,0.0,0.333333,0.0,0.333333,0.0,0.0,0.0,0.0,0.0,0.0,98356.995,56553.99,900000.0,435436.5,1035882.0,484191.0,6885.0,3442.5,900000.0,435436.5,17.0,14.666667,0.100061,0.05003,-746.0,-1305.0,10.0,30.0,1.011109,0.949329,0.1852,0.126383,0.191312,0.132837,,,,,,,,,,,,,,,,,,,,,,,,,-18.0,-43.785714,28.0,0.0,0.0,0.0,0.0,0.928571,0.0,0.0,0.0,0.071429,0.0,0.0,0.0,0.0,0.0,28.0,2.0,560835.36,64754.586,1618864.65,110542.5923,6662.97,560835.36,64754.586,1618864.65,110542.5923,-544.0,-1385.32,-34633.0,757.325432,1.0,1.0,25.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,14.0,7.16,179.0,3.726929,25.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,6750.0,135000.0,135000.0,67500.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,0,1.0,0,,,,-19046,-225.0,-2531,-815.0,-4260.0,0.0,0.0,,,,,,,,0.555912,0.729567,1,0,0,1,1,1,0,1,1,,,,,,,9,,,,0,0,,,,,,,,,,,,,0.0,0.0,26.0,0.010032,2,2,0,0,0,0,100004,0.0,,,,,,,,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,-18821.0,-14786.0,-19072.0,-18231.0,3.622222,20.0,2.0,0.1,2.0,0.05,1.0,67500.0,67500.0,135000.0,135000.0,1.0,0.0,67500.0,135000.0,6,0.214286,1.285479,0.642739,,0.086827,,2.0,-867.0,421362.0,-488.5,-532.0,0.0,0.0,0.0,94518.9,189037.8,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,,,,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,-867.0,421362.0,-488.5,-532.0,0.0,0.0,0.0,94518.9,189037.8,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,,,,0.0,0.0,0.0,5357.25,5357.25,24282.0,24282.0,20106.0,20106.0,4860.0,4860.0,24282.0,24282.0,5.0,5.0,0.212008,0.212008,-815.0,-815.0,4.0,4.0,1.207699,1.207699,0.26645,0.26645,0.220626,0.220626,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,5357.25,5357.25,24282.0,24282.0,20106.0,20106.0,4860.0,4860.0,24282.0,24282.0,5.0,5.0,0.212008,0.212008,-815.0,-815.0,4.0,4.0,1.207699,1.207699,0.26645,0.26645,0.220626,0.220626,,,,,,,,,,,,,,,,,,,,,,,,,-24.0,-25.5,4.0,0.0,0.0,0.0,0.0,0.75,0.0,0.0,0.0,0.25,0.0,0.0,0.0,0.0,0.0,4.0,2.0,10573.965,7096.155,21288.465,3011.87181,5357.25,10573.965,7096.155,21288.465,3011.87181,-727.0,-761.666667,-2285.0,34.019602,1.0,1.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11.0,7.666667,23.0,4.163332,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


---

# Feature Selection

1) Remove missing values

In [10]:
df = pd.read_csv(os.path.join(PATH_TO_DATA, 'df_all_files.csv'))
train = df[df['TARGET'].notnull()]
test = df[df['TARGET'].isnull()]
test.drop('TARGET', axis=1, inplace=True)
del df
gc.collect()

0

In [11]:
train_missing = (train.isnull().sum() / len(train)).sort_values(ascending = False)
train_missing.head()

REFUSED_RATE_DOWN_PAYMENT_MAX     0.853116
REFUSED_AMT_DOWN_PAYMENT_MAX      0.853116
REFUSED_RATE_DOWN_PAYMENT_MEAN    0.853116
REFUSED_AMT_DOWN_PAYMENT_MEAN     0.853116
CC_AMT_PAYMENT_CURRENT_var        0.802870
dtype: float64

In [12]:
test_missing = (test.isnull().sum() / len(test)).sort_values(ascending = False)
test_missing.head()

REFUSED_AMT_DOWN_PAYMENT_MAX      0.847468
REFUSED_RATE_DOWN_PAYMENT_MEAN    0.847468
REFUSED_RATE_DOWN_PAYMENT_MAX     0.847468
REFUSED_AMT_DOWN_PAYMENT_MEAN     0.847468
CC_AMT_PAYMENT_CURRENT_var        0.774680
dtype: float64

In [13]:
train_missing = train_missing.index[train_missing > 0.80]
test_missing = test_missing.index[test_missing > 0.80]

all_missing = list(set(set(train_missing) | set(test_missing)))
print('There are %d columns with more than 80%% missing values' % len(all_missing))

There are 24 columns with more than 80% missing values


In [14]:
train.drop(all_missing, axis=1, inplace=True)
test.drop(all_missing, axis=1, inplace=True)
print(train.shape, test.shape)

(307507, 737) (48744, 736)


2) Remove Collinear Variables

In [15]:
# i am dealing it with such a limited section of the data (~33%) because of waiting
mini_train = train.sample(100000)

In [16]:
%%time
# Absolute value correlation matrix
corr_matrix = mini_train.corr().abs()

Wall time: 6min 9s


In [17]:
# Upper triangle of correlations
upper = corr_matrix.where(np.triu(np.ones(corr_matrix.shape), k=1).astype(np.bool))
upper.head(3)

Unnamed: 0,AMT_ANNUITY,AMT_CREDIT,AMT_GOODS_PRICE,AMT_INCOME_TOTAL,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_YEAR,APARTMENTS_AVG,APARTMENTS_MEDI,APARTMENTS_MODE,BASEMENTAREA_AVG,BASEMENTAREA_MEDI,BASEMENTAREA_MODE,CNT_CHILDREN,CNT_FAM_MEMBERS,CODE_GENDER,COMMONAREA_AVG,COMMONAREA_MEDI,COMMONAREA_MODE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_ID_PUBLISH,DAYS_LAST_PHONE_CHANGE,DAYS_REGISTRATION,DEF_30_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,ELEVATORS_AVG,ELEVATORS_MEDI,ELEVATORS_MODE,ENTRANCES_AVG,ENTRANCES_MEDI,ENTRANCES_MODE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,FLAG_CONT_MOBILE,FLAG_DOCUMENT_3,FLAG_EMAIL,FLAG_EMP_PHONE,FLAG_MOBIL,FLAG_OWN_CAR,FLAG_OWN_REALTY,FLAG_PHONE,FLAG_WORK_PHONE,FLOORSMAX_AVG,FLOORSMAX_MEDI,FLOORSMAX_MODE,FLOORSMIN_AVG,FLOORSMIN_MEDI,FLOORSMIN_MODE,HOUR_APPR_PROCESS_START,LANDAREA_AVG,LANDAREA_MEDI,LANDAREA_MODE,LIVE_CITY_NOT_WORK_CITY,LIVE_REGION_NOT_WORK_REGION,LIVINGAPARTMENTS_AVG,LIVINGAPARTMENTS_MEDI,LIVINGAPARTMENTS_MODE,LIVINGAREA_AVG,LIVINGAREA_MEDI,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_AVG,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_AVG,NONLIVINGAREA_MEDI,NONLIVINGAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE,REGION_POPULATION_RELATIVE,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,SK_ID_CURR,TARGET,TOTALAREA_MODE,YEARS_BEGINEXPLUATATION_AVG,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_AVG,YEARS_BUILD_MEDI,YEARS_BUILD_MODE,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,FONDKAPREMONT_MODE_not specified,FONDKAPREMONT_MODE_org spec account,FONDKAPREMONT_MODE_reg oper account,FONDKAPREMONT_MODE_reg oper spec account,HOUSETYPE_MODE_block of flats,HOUSETYPE_MODE_specific housing,HOUSETYPE_MODE_terraced house,NAME_CONTRACT_TYPE_Cash loans,NAME_CONTRACT_TYPE_Revolving loans,NAME_EDUCATION_TYPE_Academic degree,NAME_EDUCATION_TYPE_Higher education,NAME_EDUCATION_TYPE_Incomplete higher,NAME_EDUCATION_TYPE_Lower secondary,NAME_EDUCATION_TYPE_Secondary / secondary special,NAME_FAMILY_STATUS_Civil marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single / not married,NAME_FAMILY_STATUS_Widow,NAME_HOUSING_TYPE_Co-op apartment,NAME_HOUSING_TYPE_House / apartment,NAME_HOUSING_TYPE_Municipal apartment,NAME_HOUSING_TYPE_Office apartment,NAME_HOUSING_TYPE_Rented apartment,NAME_HOUSING_TYPE_With parents,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial associate,NAME_INCOME_TYPE_Maternity leave,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group of people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse, partner",NAME_TYPE_SUITE_Unaccompanied,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning staff,OCCUPATION_TYPE_Cooking staff,OCCUPATION_TYPE_Core staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR staff,OCCUPATION_TYPE_High skill tech staff,OCCUPATION_TYPE_IT staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine staff,OCCUPATION_TYPE_Private service staff,OCCUPATION_TYPE_Realty agents,OCCUPATION_TYPE_Sales staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security staff,OCCUPATION_TYPE_Waiters/barmen staff,ORGANIZATION_TYPE_Advertising,ORGANIZATION_TYPE_Agriculture,ORGANIZATION_TYPE_Bank,ORGANIZATION_TYPE_Business Entity Type 1,ORGANIZATION_TYPE_Business Entity Type 2,ORGANIZATION_TYPE_Business Entity Type 3,ORGANIZATION_TYPE_Cleaning,ORGANIZATION_TYPE_Construction,ORGANIZATION_TYPE_Culture,ORGANIZATION_TYPE_Electricity,ORGANIZATION_TYPE_Emergency,ORGANIZATION_TYPE_Government,ORGANIZATION_TYPE_Hotel,ORGANIZATION_TYPE_Housing,ORGANIZATION_TYPE_Industry: type 1,ORGANIZATION_TYPE_Industry: type 10,ORGANIZATION_TYPE_Industry: type 11,ORGANIZATION_TYPE_Industry: type 12,ORGANIZATION_TYPE_Industry: type 13,ORGANIZATION_TYPE_Industry: type 2,ORGANIZATION_TYPE_Industry: type 3,ORGANIZATION_TYPE_Industry: type 4,ORGANIZATION_TYPE_Industry: type 5,ORGANIZATION_TYPE_Industry: type 6,ORGANIZATION_TYPE_Industry: type 7,ORGANIZATION_TYPE_Industry: type 8,ORGANIZATION_TYPE_Industry: type 9,ORGANIZATION_TYPE_Insurance,ORGANIZATION_TYPE_Kindergarten,ORGANIZATION_TYPE_Legal Services,ORGANIZATION_TYPE_Medicine,ORGANIZATION_TYPE_Military,ORGANIZATION_TYPE_Mobile,ORGANIZATION_TYPE_Other,ORGANIZATION_TYPE_Police,ORGANIZATION_TYPE_Postal,ORGANIZATION_TYPE_Realtor,ORGANIZATION_TYPE_Religion,ORGANIZATION_TYPE_Restaurant,ORGANIZATION_TYPE_School,ORGANIZATION_TYPE_Security,ORGANIZATION_TYPE_Security Ministries,ORGANIZATION_TYPE_Self-employed,ORGANIZATION_TYPE_Services,ORGANIZATION_TYPE_Telecom,ORGANIZATION_TYPE_Trade: type 1,ORGANIZATION_TYPE_Trade: type 2,ORGANIZATION_TYPE_Trade: type 3,ORGANIZATION_TYPE_Trade: type 4,ORGANIZATION_TYPE_Trade: type 5,ORGANIZATION_TYPE_Trade: type 6,ORGANIZATION_TYPE_Trade: type 7,ORGANIZATION_TYPE_Transport: type 1,ORGANIZATION_TYPE_Transport: type 2,ORGANIZATION_TYPE_Transport: type 3,ORGANIZATION_TYPE_Transport: type 4,ORGANIZATION_TYPE_University,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone, brick",WALLSMATERIAL_MODE_Wooden,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,birth_employed_gap,birth_registration_gap,birth_car_age_gap,birth_last_phone_gap,last_phone_employed_perc,PAYMENT_RATE,CREDIT_INCOME_PERC,ANNUITY_INCOME_PERC,GOODS_PRICE_INCOME_PERC,ANNUITY_GOODS_PRICE_PERC,GOODS_PRICE_CREDIT_PERC,INCOME_PER_PERSON,INCOME_PER_CHILD,CREDIT_PER_PERSON,CREDIT_PER_CHILD,cnt_non_child,child_to_non_child_ratio,income_per_non_child,credit_per_non_child,flags_sum,flags_mean,ext_sources_sum,ext_sources_mean,ext_sources_median,ext_sources_std,ext_sources_prod,BUREAU_DAYS_CREDIT_COUNT,BUREAU_DAYS_CREDIT_MEAN,BUREAU_DAYS_CREDIT_VAR,BUREAU_DAYS_CREDIT_ENDDATE_MEAN,BUREAU_DAYS_CREDIT_UPDATE_MEAN,BUREAU_CREDIT_DAY_OVERDUE_MEAN,BUREAU_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_AMT_CREDIT_MAX_OVERDUE_SUM,BUREAU_AMT_CREDIT_SUM_MEAN,BUREAU_AMT_CREDIT_SUM_SUM,BUREAU_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_OVERDUE_SUM,BUREAU_AMT_CREDIT_SUM_LIMIT_MEAN,BUREAU_AMT_CREDIT_SUM_LIMIT_SUM,BUREAU_AMT_ANNUITY_MAX,BUREAU_AMT_ANNUITY_MEAN,BUREAU_AMT_ANNUITY_SUM,BUREAU_CNT_CREDIT_PROLONG_SUM,BUREAU_MONTHS_BALANCE_MIN_MIN,BUREAU_MONTHS_BALANCE_MAX_MAX,BUREAU_MONTHS_BALANCE_SIZE_MEAN,BUREAU_MONTHS_BALANCE_SIZE_SUM,BUREAU_CREDIT_ACTIVE_BINARY_MEAN,BUREAU_CREDIT_ENDDATE_BINARY_MEAN,BUREAU_CREDIT_ACTIVE_Active_MEAN,BUREAU_CREDIT_ACTIVE_Bad debt_MEAN,BUREAU_CREDIT_ACTIVE_Closed_MEAN,BUREAU_CREDIT_ACTIVE_Sold_MEAN,BUREAU_CREDIT_ACTIVE_nan_MEAN,BUREAU_CREDIT_CURRENCY_currency 1_MEAN,BUREAU_CREDIT_CURRENCY_currency 2_MEAN,BUREAU_CREDIT_CURRENCY_currency 3_MEAN,BUREAU_CREDIT_CURRENCY_currency 4_MEAN,BUREAU_CREDIT_CURRENCY_nan_MEAN,BUREAU_CREDIT_TYPE_Another type of loan_MEAN,BUREAU_CREDIT_TYPE_Car loan_MEAN,BUREAU_CREDIT_TYPE_Cash loan (non-earmarked)_MEAN,BUREAU_CREDIT_TYPE_Consumer credit_MEAN,BUREAU_CREDIT_TYPE_Credit card_MEAN,BUREAU_CREDIT_TYPE_Interbank credit_MEAN,BUREAU_CREDIT_TYPE_Loan for business development_MEAN,BUREAU_CREDIT_TYPE_Loan for purchase of shares (margin lending)_MEAN,BUREAU_CREDIT_TYPE_Loan for the purchase of equipment_MEAN,BUREAU_CREDIT_TYPE_Loan for working capital replenishment_MEAN,BUREAU_CREDIT_TYPE_Microloan_MEAN,BUREAU_CREDIT_TYPE_Mobile operator loan_MEAN,BUREAU_CREDIT_TYPE_Mortgage_MEAN,BUREAU_CREDIT_TYPE_Real estate loan_MEAN,BUREAU_CREDIT_TYPE_Unknown type of loan_MEAN,BUREAU_CREDIT_TYPE_nan_MEAN,BUREAU_STATUS_0_MEAN_MEAN,BUREAU_STATUS_1_MEAN_MEAN,BUREAU_STATUS_2_MEAN_MEAN,BUREAU_STATUS_3_MEAN_MEAN,BUREAU_STATUS_4_MEAN_MEAN,BUREAU_STATUS_5_MEAN_MEAN,BUREAU_STATUS_C_MEAN_MEAN,BUREAU_STATUS_X_MEAN_MEAN,BUREAU_STATUS_nan_MEAN_MEAN,ACTIVE_DAYS_CREDIT_count,ACTIVE_DAYS_CREDIT_mean,ACTIVE_DAYS_CREDIT_var,ACTIVE_DAYS_CREDIT_ENDDATE_mean,ACTIVE_DAYS_CREDIT_UPDATE_mean,ACTIVE_CREDIT_DAY_OVERDUE_mean,ACTIVE_AMT_CREDIT_MAX_OVERDUE_mean,ACTIVE_AMT_CREDIT_MAX_OVERDUE_sum,ACTIVE_AMT_CREDIT_SUM_mean,ACTIVE_AMT_CREDIT_SUM_sum,ACTIVE_AMT_CREDIT_SUM_DEBT_mean,ACTIVE_AMT_CREDIT_SUM_DEBT_sum,ACTIVE_AMT_CREDIT_SUM_OVERDUE_mean,ACTIVE_AMT_CREDIT_SUM_OVERDUE_sum,ACTIVE_AMT_CREDIT_SUM_LIMIT_mean,ACTIVE_AMT_CREDIT_SUM_LIMIT_sum,ACTIVE_AMT_ANNUITY_sum,ACTIVE_CNT_CREDIT_PROLONG_sum,ACTIVE_MONTHS_BALANCE_MIN_min,ACTIVE_MONTHS_BALANCE_MAX_max,ACTIVE_MONTHS_BALANCE_SIZE_mean,ACTIVE_MONTHS_BALANCE_SIZE_sum,ACTIVE_CREDIT_ACTIVE_BINARY_mean,ACTIVE_CREDIT_ENDDATE_BINARY_mean,CLOSED_DAYS_CREDIT_count,CLOSED_DAYS_CREDIT_mean,CLOSED_DAYS_CREDIT_var,CLOSED_DAYS_CREDIT_ENDDATE_mean,CLOSED_DAYS_CREDIT_UPDATE_mean,CLOSED_CREDIT_DAY_OVERDUE_mean,CLOSED_AMT_CREDIT_MAX_OVERDUE_mean,CLOSED_AMT_CREDIT_MAX_OVERDUE_sum,CLOSED_AMT_CREDIT_SUM_mean,CLOSED_AMT_CREDIT_SUM_sum,CLOSED_AMT_CREDIT_SUM_DEBT_mean,CLOSED_AMT_CREDIT_SUM_DEBT_sum,CLOSED_AMT_CREDIT_SUM_OVERDUE_mean,CLOSED_AMT_CREDIT_SUM_OVERDUE_sum,CLOSED_AMT_CREDIT_SUM_LIMIT_mean,CLOSED_AMT_CREDIT_SUM_LIMIT_sum,CLOSED_AMT_ANNUITY_max,CLOSED_AMT_ANNUITY_mean,CLOSED_AMT_ANNUITY_sum,CLOSED_CNT_CREDIT_PROLONG_sum,CLOSED_MONTHS_BALANCE_MIN_min,CLOSED_MONTHS_BALANCE_MAX_max,CLOSED_MONTHS_BALANCE_SIZE_mean,CLOSED_MONTHS_BALANCE_SIZE_sum,CLOSED_CREDIT_ACTIVE_BINARY_mean,CLOSED_CREDIT_ENDDATE_BINARY_mean,PREV_AMT_ANNUITY_MAX,PREV_AMT_ANNUITY_MEAN,PREV_AMT_APPLICATION_MAX,PREV_AMT_APPLICATION_MEAN,PREV_AMT_CREDIT_MAX,PREV_AMT_CREDIT_MEAN,PREV_AMT_DOWN_PAYMENT_MAX,PREV_AMT_DOWN_PAYMENT_MEAN,PREV_AMT_GOODS_PRICE_MAX,PREV_AMT_GOODS_PRICE_MEAN,PREV_HOUR_APPR_PROCESS_START_MAX,PREV_HOUR_APPR_PROCESS_START_MEAN,PREV_RATE_DOWN_PAYMENT_MAX,PREV_RATE_DOWN_PAYMENT_MEAN,PREV_DAYS_DECISION_MAX,PREV_DAYS_DECISION_MEAN,PREV_CNT_PAYMENT_MEAN,PREV_CNT_PAYMENT_SUM,PREV_APP_CREDIT_PERC_MAX,PREV_APP_CREDIT_PERC_MEAN,PREV_PAYMENT_RATE_MAX,PREV_PAYMENT_RATE_MEAN,PREV_ANNUITY_GOODS_PRICE_PERC_MAX,PREV_ANNUITY_GOODS_PRICE_PERC_MEAN,PREV_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_NAME_CONTRACT_TYPE_XNA_MEAN,PREV_NAME_CONTRACT_TYPE_nan_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_nan_MEAN,PREV_FLAG_LAST_APPL_PER_CONTRACT_N_MEAN,PREV_FLAG_LAST_APPL_PER_CONTRACT_Y_MEAN,PREV_FLAG_LAST_APPL_PER_CONTRACT_nan_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Building a house or an annex_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Business development_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a garage_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a holiday home / land_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a home_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a new car_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Buying a used car_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Car repairs_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Education_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Everyday expenses_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Furniture_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Gasification / water supply_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Hobby_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Journey_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Medicine_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Money for a third person_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Other_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Payments on other loans_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Purchase of electronic equipment_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Refusal to name the goal_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Repairs_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Urgent needs_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_Wedding / gift / holiday_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_XAP_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_XNA_MEAN,PREV_NAME_CASH_LOAN_PURPOSE_nan_MEAN,PREV_NAME_CONTRACT_STATUS_Approved_MEAN,PREV_NAME_CONTRACT_STATUS_Canceled_MEAN,PREV_NAME_CONTRACT_STATUS_Refused_MEAN,PREV_NAME_CONTRACT_STATUS_Unused offer_MEAN,PREV_NAME_CONTRACT_STATUS_nan_MEAN,PREV_NAME_PAYMENT_TYPE_Cash through the bank_MEAN,PREV_NAME_PAYMENT_TYPE_Cashless from the account of the employer_MEAN,PREV_NAME_PAYMENT_TYPE_Non-cash from your account_MEAN,PREV_NAME_PAYMENT_TYPE_XNA_MEAN,PREV_NAME_PAYMENT_TYPE_nan_MEAN,PREV_CODE_REJECT_REASON_CLIENT_MEAN,PREV_CODE_REJECT_REASON_HC_MEAN,PREV_CODE_REJECT_REASON_LIMIT_MEAN,PREV_CODE_REJECT_REASON_SCO_MEAN,PREV_CODE_REJECT_REASON_SCOFR_MEAN,PREV_CODE_REJECT_REASON_SYSTEM_MEAN,PREV_CODE_REJECT_REASON_VERIF_MEAN,PREV_CODE_REJECT_REASON_XAP_MEAN,PREV_CODE_REJECT_REASON_XNA_MEAN,PREV_CODE_REJECT_REASON_nan_MEAN,PREV_NAME_TYPE_SUITE_Children_MEAN,PREV_NAME_TYPE_SUITE_Family_MEAN,PREV_NAME_TYPE_SUITE_Group of people_MEAN,PREV_NAME_TYPE_SUITE_Other_A_MEAN,PREV_NAME_TYPE_SUITE_Other_B_MEAN,"PREV_NAME_TYPE_SUITE_Spouse, partner_MEAN",PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN,PREV_NAME_TYPE_SUITE_nan_MEAN,PREV_NAME_CLIENT_TYPE_New_MEAN,PREV_NAME_CLIENT_TYPE_Refreshed_MEAN,PREV_NAME_CLIENT_TYPE_Repeater_MEAN,PREV_NAME_CLIENT_TYPE_XNA_MEAN,PREV_NAME_CLIENT_TYPE_nan_MEAN,PREV_NAME_GOODS_CATEGORY_Additional Service_MEAN,PREV_NAME_GOODS_CATEGORY_Animals_MEAN,PREV_NAME_GOODS_CATEGORY_Audio/Video_MEAN,PREV_NAME_GOODS_CATEGORY_Auto Accessories_MEAN,PREV_NAME_GOODS_CATEGORY_Clothing and Accessories_MEAN,PREV_NAME_GOODS_CATEGORY_Computers_MEAN,PREV_NAME_GOODS_CATEGORY_Construction Materials_MEAN,PREV_NAME_GOODS_CATEGORY_Consumer Electronics_MEAN,PREV_NAME_GOODS_CATEGORY_Direct Sales_MEAN,PREV_NAME_GOODS_CATEGORY_Education_MEAN,PREV_NAME_GOODS_CATEGORY_Fitness_MEAN,PREV_NAME_GOODS_CATEGORY_Furniture_MEAN,PREV_NAME_GOODS_CATEGORY_Gardening_MEAN,PREV_NAME_GOODS_CATEGORY_Homewares_MEAN,PREV_NAME_GOODS_CATEGORY_House Construction_MEAN,PREV_NAME_GOODS_CATEGORY_Insurance_MEAN,PREV_NAME_GOODS_CATEGORY_Jewelry_MEAN,PREV_NAME_GOODS_CATEGORY_Medical Supplies_MEAN,PREV_NAME_GOODS_CATEGORY_Medicine_MEAN,PREV_NAME_GOODS_CATEGORY_Mobile_MEAN,PREV_NAME_GOODS_CATEGORY_Office Appliances_MEAN,PREV_NAME_GOODS_CATEGORY_Other_MEAN,PREV_NAME_GOODS_CATEGORY_Photo / Cinema Equipment_MEAN,PREV_NAME_GOODS_CATEGORY_Sport and Leisure_MEAN,PREV_NAME_GOODS_CATEGORY_Tourism_MEAN,PREV_NAME_GOODS_CATEGORY_Vehicles_MEAN,PREV_NAME_GOODS_CATEGORY_Weapon_MEAN,PREV_NAME_GOODS_CATEGORY_XNA_MEAN,PREV_NAME_GOODS_CATEGORY_nan_MEAN,PREV_NAME_PORTFOLIO_Cards_MEAN,PREV_NAME_PORTFOLIO_Cars_MEAN,PREV_NAME_PORTFOLIO_Cash_MEAN,PREV_NAME_PORTFOLIO_POS_MEAN,PREV_NAME_PORTFOLIO_XNA_MEAN,PREV_NAME_PORTFOLIO_nan_MEAN,PREV_NAME_PRODUCT_TYPE_XNA_MEAN,PREV_NAME_PRODUCT_TYPE_walk-in_MEAN,PREV_NAME_PRODUCT_TYPE_x-sell_MEAN,PREV_NAME_PRODUCT_TYPE_nan_MEAN,PREV_CHANNEL_TYPE_AP+ (Cash loan)_MEAN,PREV_CHANNEL_TYPE_Car dealer_MEAN,PREV_CHANNEL_TYPE_Channel of corporate sales_MEAN,PREV_CHANNEL_TYPE_Contact center_MEAN,PREV_CHANNEL_TYPE_Country-wide_MEAN,PREV_CHANNEL_TYPE_Credit and cash offices_MEAN,PREV_CHANNEL_TYPE_Regional / Local_MEAN,PREV_CHANNEL_TYPE_Stone_MEAN,PREV_CHANNEL_TYPE_nan_MEAN,PREV_NAME_SELLER_INDUSTRY_Auto technology_MEAN,PREV_NAME_SELLER_INDUSTRY_Clothing_MEAN,PREV_NAME_SELLER_INDUSTRY_Connectivity_MEAN,PREV_NAME_SELLER_INDUSTRY_Construction_MEAN,PREV_NAME_SELLER_INDUSTRY_Consumer electronics_MEAN,PREV_NAME_SELLER_INDUSTRY_Furniture_MEAN,PREV_NAME_SELLER_INDUSTRY_Industry_MEAN,PREV_NAME_SELLER_INDUSTRY_Jewelry_MEAN,PREV_NAME_SELLER_INDUSTRY_MLM partners_MEAN,PREV_NAME_SELLER_INDUSTRY_Tourism_MEAN,PREV_NAME_SELLER_INDUSTRY_XNA_MEAN,PREV_NAME_SELLER_INDUSTRY_nan_MEAN,PREV_NAME_YIELD_GROUP_XNA_MEAN,PREV_NAME_YIELD_GROUP_high_MEAN,PREV_NAME_YIELD_GROUP_low_action_MEAN,PREV_NAME_YIELD_GROUP_low_normal_MEAN,PREV_NAME_YIELD_GROUP_middle_MEAN,PREV_NAME_YIELD_GROUP_nan_MEAN,PREV_PRODUCT_COMBINATION_Card Street_MEAN,PREV_PRODUCT_COMBINATION_Card X-Sell_MEAN,PREV_PRODUCT_COMBINATION_Cash_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: high_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: low_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: middle_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: high_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: low_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: middle_MEAN,PREV_PRODUCT_COMBINATION_POS household with interest_MEAN,PREV_PRODUCT_COMBINATION_POS household without interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry with interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry without interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile with interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile without interest_MEAN,PREV_PRODUCT_COMBINATION_POS other with interest_MEAN,PREV_PRODUCT_COMBINATION_POS others without interest_MEAN,PREV_PRODUCT_COMBINATION_nan_MEAN,APPROVED_AMT_ANNUITY_MAX,APPROVED_AMT_ANNUITY_MEAN,APPROVED_AMT_APPLICATION_MAX,APPROVED_AMT_APPLICATION_MEAN,APPROVED_AMT_CREDIT_MAX,APPROVED_AMT_CREDIT_MEAN,APPROVED_AMT_DOWN_PAYMENT_MAX,APPROVED_AMT_DOWN_PAYMENT_MEAN,APPROVED_AMT_GOODS_PRICE_MAX,APPROVED_AMT_GOODS_PRICE_MEAN,APPROVED_HOUR_APPR_PROCESS_START_MAX,APPROVED_HOUR_APPR_PROCESS_START_MEAN,APPROVED_RATE_DOWN_PAYMENT_MAX,APPROVED_RATE_DOWN_PAYMENT_MEAN,APPROVED_DAYS_DECISION_MAX,APPROVED_DAYS_DECISION_MEAN,APPROVED_CNT_PAYMENT_MEAN,APPROVED_CNT_PAYMENT_SUM,APPROVED_APP_CREDIT_PERC_MAX,APPROVED_APP_CREDIT_PERC_MEAN,APPROVED_PAYMENT_RATE_MAX,APPROVED_PAYMENT_RATE_MEAN,APPROVED_ANNUITY_GOODS_PRICE_PERC_MAX,APPROVED_ANNUITY_GOODS_PRICE_PERC_MEAN,REFUSED_AMT_ANNUITY_MAX,REFUSED_AMT_ANNUITY_MEAN,REFUSED_AMT_APPLICATION_MAX,REFUSED_AMT_APPLICATION_MEAN,REFUSED_AMT_CREDIT_MAX,REFUSED_AMT_CREDIT_MEAN,REFUSED_AMT_GOODS_PRICE_MAX,REFUSED_AMT_GOODS_PRICE_MEAN,REFUSED_HOUR_APPR_PROCESS_START_MAX,REFUSED_HOUR_APPR_PROCESS_START_MEAN,REFUSED_DAYS_DECISION_MAX,REFUSED_DAYS_DECISION_MEAN,REFUSED_CNT_PAYMENT_MEAN,REFUSED_CNT_PAYMENT_SUM,REFUSED_APP_CREDIT_PERC_MAX,REFUSED_APP_CREDIT_PERC_MEAN,REFUSED_PAYMENT_RATE_MAX,REFUSED_PAYMENT_RATE_MEAN,REFUSED_ANNUITY_GOODS_PRICE_PERC_MAX,REFUSED_ANNUITY_GOODS_PRICE_PERC_MEAN,POS_MONTHS_BALANCE_MAX,POS_MONTHS_BALANCE_MEAN,POS_MONTHS_BALANCE_SIZE,POS_SK_DPD_MAX,POS_SK_DPD_MEAN,POS_SK_DPD_DEF_MAX,POS_SK_DPD_DEF_MEAN,POS_NAME_CONTRACT_STATUS_Active_MEAN,POS_NAME_CONTRACT_STATUS_Amortized debt_MEAN,POS_NAME_CONTRACT_STATUS_Approved_MEAN,POS_NAME_CONTRACT_STATUS_Canceled_MEAN,POS_NAME_CONTRACT_STATUS_Completed_MEAN,POS_NAME_CONTRACT_STATUS_Demand_MEAN,POS_NAME_CONTRACT_STATUS_Returned to the store_MEAN,POS_NAME_CONTRACT_STATUS_Signed_MEAN,POS_NAME_CONTRACT_STATUS_XNA_MEAN,POS_NAME_CONTRACT_STATUS_nan_MEAN,pos_cash_acc_count,INSTAL_NUM_INSTALMENT_VERSION_NUNIQUE,INSTAL_AMT_INSTALMENT_MAX,INSTAL_AMT_INSTALMENT_MEAN,INSTAL_AMT_INSTALMENT_SUM,INSTAL_AMT_INSTALMENT_STD,INSTAL_AMT_PAYMENT_MIN,INSTAL_AMT_PAYMENT_MAX,INSTAL_AMT_PAYMENT_MEAN,INSTAL_AMT_PAYMENT_SUM,INSTAL_AMT_PAYMENT_STD,INSTAL_DAYS_ENTRY_PAYMENT_MAX,INSTAL_DAYS_ENTRY_PAYMENT_MEAN,INSTAL_DAYS_ENTRY_PAYMENT_SUM,INSTAL_DAYS_ENTRY_PAYMENT_STD,INSTAL_PAYMENT_PERC_MAX,INSTAL_PAYMENT_PERC_MEAN,INSTAL_PAYMENT_PERC_SUM,INSTAL_PAYMENT_PERC_STD,INSTAL_PAYMENT_DIFF_MAX,INSTAL_PAYMENT_DIFF_MEAN,INSTAL_PAYMENT_DIFF_SUM,INSTAL_PAYMENT_DIFF_STD,INSTAL_PAID_OVER_MEAN,INSTAL_PAID_OVER_SUM,INSTAL_DPD_MAX,INSTAL_DPD_MEAN,INSTAL_DPD_SUM,INSTAL_DPD_STD,INSTAL_DPD_LATE_MEAN,INSTAL_DPD_LATE_SUM,INSTAL_DBD_MAX,INSTAL_DBD_MEAN,INSTAL_DBD_SUM,INSTAL_DBD_STD,install_count,CC_MONTHS_BALANCE_max,CC_MONTHS_BALANCE_mean,CC_MONTHS_BALANCE_sum,CC_MONTHS_BALANCE_var,CC_AMT_BALANCE_max,CC_AMT_BALANCE_mean,CC_AMT_BALANCE_sum,CC_AMT_BALANCE_var,CC_AMT_CREDIT_LIMIT_ACTUAL_max,CC_AMT_CREDIT_LIMIT_ACTUAL_mean,CC_AMT_CREDIT_LIMIT_ACTUAL_sum,CC_AMT_CREDIT_LIMIT_ACTUAL_var,CC_AMT_DRAWINGS_ATM_CURRENT_max,CC_AMT_DRAWINGS_ATM_CURRENT_mean,CC_AMT_DRAWINGS_ATM_CURRENT_sum,CC_AMT_DRAWINGS_ATM_CURRENT_var,CC_AMT_DRAWINGS_CURRENT_max,CC_AMT_DRAWINGS_CURRENT_mean,CC_AMT_DRAWINGS_CURRENT_sum,CC_AMT_DRAWINGS_CURRENT_var,CC_AMT_DRAWINGS_OTHER_CURRENT_sum,CC_AMT_DRAWINGS_POS_CURRENT_sum,CC_AMT_INST_MIN_REGULARITY_max,CC_AMT_INST_MIN_REGULARITY_mean,CC_AMT_INST_MIN_REGULARITY_sum,CC_AMT_INST_MIN_REGULARITY_var,CC_AMT_PAYMENT_CURRENT_sum,CC_AMT_PAYMENT_TOTAL_CURRENT_max,CC_AMT_PAYMENT_TOTAL_CURRENT_mean,CC_AMT_PAYMENT_TOTAL_CURRENT_sum,CC_AMT_PAYMENT_TOTAL_CURRENT_var,CC_AMT_RECEIVABLE_PRINCIPAL_max,CC_AMT_RECEIVABLE_PRINCIPAL_mean,CC_AMT_RECEIVABLE_PRINCIPAL_sum,CC_AMT_RECEIVABLE_PRINCIPAL_var,CC_AMT_RECIVABLE_max,CC_AMT_RECIVABLE_mean,CC_AMT_RECIVABLE_sum,CC_AMT_RECIVABLE_var,CC_AMT_TOTAL_RECEIVABLE_max,CC_AMT_TOTAL_RECEIVABLE_mean,CC_AMT_TOTAL_RECEIVABLE_sum,CC_AMT_TOTAL_RECEIVABLE_var,CC_CNT_DRAWINGS_ATM_CURRENT_sum,CC_CNT_DRAWINGS_CURRENT_max,CC_CNT_DRAWINGS_CURRENT_mean,CC_CNT_DRAWINGS_CURRENT_sum,CC_CNT_DRAWINGS_CURRENT_var,CC_CNT_DRAWINGS_OTHER_CURRENT_sum,CC_CNT_DRAWINGS_POS_CURRENT_sum,CC_CNT_INSTALMENT_MATURE_CUM_max,CC_CNT_INSTALMENT_MATURE_CUM_mean,CC_CNT_INSTALMENT_MATURE_CUM_sum,CC_CNT_INSTALMENT_MATURE_CUM_var,CC_SK_DPD_max,CC_SK_DPD_mean,CC_SK_DPD_sum,CC_SK_DPD_var,CC_SK_DPD_DEF_max,CC_SK_DPD_DEF_mean,CC_SK_DPD_DEF_sum,CC_SK_DPD_DEF_var,CC_NAME_CONTRACT_STATUS_Active_max,CC_NAME_CONTRACT_STATUS_Active_mean,CC_NAME_CONTRACT_STATUS_Active_sum,CC_NAME_CONTRACT_STATUS_Active_var,CC_NAME_CONTRACT_STATUS_Approved_max,CC_NAME_CONTRACT_STATUS_Approved_mean,CC_NAME_CONTRACT_STATUS_Approved_sum,CC_NAME_CONTRACT_STATUS_Approved_var,CC_NAME_CONTRACT_STATUS_Completed_max,CC_NAME_CONTRACT_STATUS_Completed_mean,CC_NAME_CONTRACT_STATUS_Completed_sum,CC_NAME_CONTRACT_STATUS_Completed_var,CC_NAME_CONTRACT_STATUS_Demand_max,CC_NAME_CONTRACT_STATUS_Demand_mean,CC_NAME_CONTRACT_STATUS_Demand_sum,CC_NAME_CONTRACT_STATUS_Demand_var,CC_NAME_CONTRACT_STATUS_Refused_max,CC_NAME_CONTRACT_STATUS_Refused_mean,CC_NAME_CONTRACT_STATUS_Refused_sum,CC_NAME_CONTRACT_STATUS_Refused_var,CC_NAME_CONTRACT_STATUS_Sent proposal_max,CC_NAME_CONTRACT_STATUS_Sent proposal_mean,CC_NAME_CONTRACT_STATUS_Sent proposal_sum,CC_NAME_CONTRACT_STATUS_Sent proposal_var,CC_NAME_CONTRACT_STATUS_Signed_max,CC_NAME_CONTRACT_STATUS_Signed_mean,CC_NAME_CONTRACT_STATUS_Signed_sum,CC_NAME_CONTRACT_STATUS_Signed_var,CC_NAME_CONTRACT_STATUS_nan_max,CC_NAME_CONTRACT_STATUS_nan_mean,CC_NAME_CONTRACT_STATUS_nan_sum,CC_NAME_CONTRACT_STATUS_nan_var,CC_dpddef_dpd_gap_max,CC_dpddef_dpd_gap_mean,CC_dpddef_dpd_gap_sum,CC_dpddef_dpd_gap_var,cc_count
AMT_ANNUITY,,0.770441,0.774736,0.119176,0.00133,0.003002,0.037009,0.008089,0.01239,0.012864,0.067652,0.064845,0.057441,0.036663,0.03456,0.028068,0.018328,0.073067,0.078035,0.050929,0.049126,0.043911,0.011858,0.052018,0.010611,0.059863,0.039867,0.022737,0.024293,0.090106,0.087505,0.081288,0.011404,0.009678,0.004326,0.111378,0.121299,0.030429,0.019996,0.106206,0.067872,0.104682,0.00026,0.143194,0.006987,0.012997,0.02491,0.12147,0.120544,0.11797,0.095862,0.094794,0.090449,0.051359,0.006253,0.00515,0.001656,0.009484,0.074348,0.071166,0.067811,0.060457,0.080847,0.078526,0.070724,0.0207,0.020077,0.012743,0.047042,0.044275,0.037681,0.011409,0.01126,0.096179,0.113299,0.126266,0.139013,0.004625,0.00298,0.042184,0.080115,0.004512,0.01204,0.081584,0.008403,0.007642,0.008185,0.034558,0.034108,0.031242,0.062599,0.000988,0.012513,0.011566,0.0449,0.013054,0.062335,0.002724,0.002983,0.242384,0.242384,0.007238,0.144618,0.00203,0.036364,0.129446,0.045493,0.139156,0.040513,0.070783,0.082395,0.001751,0.027291,0.004334,0.005719,0.009027,0.033998,0.023624,0.124739,0.002918,0.104714,0.032182,0.000762,0.003037,0.042005,0.011777,0.021869,0.002094,7.5e-05,0.006235,0.018932,0.02215,0.04768,0.033918,0.017419,0.006587,0.02863,0.010814,0.021299,0.010131,0.021864,0.021976,0.143394,0.015321,0.013502,0.007324,0.016336,0.004133,0.021834,0.011411,0.003707,0.015215,0.004373,0.012485,0.004723,0.065558,0.007239,0.028546,0.007791,0.000968,0.003928,0.003324,0.000584,0.004492,0.000797,0.007055,0.001239,0.002343,0.005157,0.003942,0.014586,0.000476,0.007571,0.001866,0.000671,0.004294,0.01244,0.008403,0.022935,0.012481,0.009621,0.024105,0.006797,0.010938,0.017341,0.01997,0.010952,0.001454,0.002619,0.00678,0.002561,0.012359,0.018941,0.010682,0.000671,0.001018,0.007171,0.008757,0.000267,0.000181,0.006334,0.012921,0.00034,0.001705,0.003547,0.021235,0.011374,0.01567,0.012192,0.033815,0.016099,0.048489,0.008954,0.006952,0.008885,0.00156,0.006412,0.007546,0.01229,0.003373,0.004563,0.057494,0.019258,0.054672,0.023178,0.000206,0.118009,0.393185,0.484556,0.402869,0.085833,0.060085,0.147493,0.176902,0.590863,0.663993,0.121068,0.003817,0.122011,0.650613,0.156016,0.156016,0.117984,0.120175,0.109749,0.007532,0.119791,0.02112,0.066339,0.017022,0.006174,0.025474,0.002204,0.014402,0.012565,0.14295,0.11759,0.05844,0.090759,0.004848,0.003396,0.042713,0.045706,0.016912,0.024008,0.022286,0.020471,0.046602,0.018899,0.072254,0.118258,0.037229,0.010171,0.037236,0.001928,0.037229,0.000122,,0.048467,0.047368,0.009987,0.004098,,0.008844,0.09808,0.003317,0.068585,0.031113,,0.009039,,0.005435,0.006761,0.022736,0.004499,0.030227,0.001799,0.000309,,0.052872,0.018894,0.012824,0.003006,0.0024,0.000696,0.040881,0.015999,,0.00173,0.063271,0.012889,0.020486,0.008501,0.008874,0.043161,0.031719,0.129459,0.137275,0.093371,0.104857,0.003454,0.003508,0.062672,0.058078,0.047312,0.014773,0.050386,0.003302,0.078072,0.121546,,0.014976,0.022339,0.04625,0.004313,0.030226,0.009891,0.008639,0.013476,0.012193,0.149896,0.079281,0.01439,0.020372,0.000483,0.000433,0.003753,0.003709,0.009852,0.016835,0.013157,0.018166,0.039441,0.031306,0.062667,0.113568,,0.043006,0.261271,0.288495,0.174512,0.208444,0.164848,0.199531,0.08591,0.08607,0.174934,0.207176,0.076649,0.07343,0.039362,0.037285,0.030693,0.045986,0.001476,0.002838,0.028568,0.031236,0.012801,0.003373,0.006907,0.015219,0.016231,0.008308,0.013082,0.005842,,0.00697,0.001281,0.002351,0.014016,0.000486,0.00708,0.002517,,0.009265,0.009265,,0.006908,0.01232,0.002704,0.00479,0.004458,0.008523,0.004338,0.005642,0.006082,0.000922,0.00158,0.007107,0.006135,0.011138,0.012805,0.002712,0.002168,0.003739,0.001922,0.000655,0.007731,0.023516,0.002765,0.016231,0.01891,,0.000761,0.011629,0.012374,0.001183,,0.011941,0.000429,0.012687,0.00965,,0.001183,0.010157,0.008413,0.001175,0.013365,0.00479,0.020885,0.01216,0.002103,,0.015977,0.018002,0.003212,0.00308,0.001205,0.030876,0.000335,0.022506,0.030966,0.01321,0.022267,0.004265,,0.003439,0.002921,0.010365,0.001397,0.027798,0.011084,0.01234,0.010529,0.000931,0.000591,0.003124,0.02098,0.001776,0.005511,,0.00358,0.017139,0.005651,0.00602,0.037983,0.000186,0.001045,0.002485,0.000206,0.014523,0.003508,0.000551,0.009277,,0.007563,0.008834,0.012891,0.008587,0.003438,,0.007649,0.000755,0.009571,,0.056163,0.00837,0.004174,0.02291,0.009276,0.037211,0.000944,0.040685,,0.003302,0.028043,0.053694,0.002423,0.005654,0.0212,0.006009,0.017936,0.004364,0.007006,0.023428,,0.001644,0.058145,0.035502,0.031549,0.007146,,0.018389,0.003861,0.010955,0.025616,0.033334,0.028734,0.004638,0.023874,0.014332,0.003516,0.018643,0.0171,0.035742,0.047359,0.012732,0.000464,0.010131,0.005842,0.260984,0.282843,0.1741,0.206175,0.163356,0.196765,0.087374,0.084343,0.174495,0.207962,0.078167,0.077569,0.038539,0.037753,0.043394,0.04811,0.008377,0.011525,0.031194,0.030399,0.013184,0.003397,0.00564,0.014716,0.235225,0.240155,0.170888,0.171227,0.16627,0.167798,0.17737,0.180017,0.060563,0.062043,0.055261,0.061717,0.028378,0.031092,0.017318,0.017548,0.012194,0.007722,0.004208,0.00827,0.032376,0.03772,0.001288,0.003982,0.006742,0.004743,0.00321,0.043254,0.001568,0.004831,0.002441,0.056799,0.004725,0.000809,0.0106,,,0.001288,0.059478,0.143801,0.168748,0.163608,0.145607,0.059856,0.144498,0.166741,0.164334,0.146779,0.031959,0.046827,0.045128,0.018073,0.003687,0.003554,0.005249,0.00354,0.060389,0.045194,0.034877,0.079324,0.03923,0.044601,0.000999,0.006485,0.000499,0.00439,0.015955,0.001072,0.01343,0.017258,0.001513,0.007662,0.033388,0.033388,0.091229,0.087132,0.086958,0.025373,0.021092,0.017322,0.02419,0.04661,0.018522,0.082864,0.061915,0.037931,0.015398,0.04632,0.016088,0.066463,0.027774,0.084381,0.044771,0.000196,0.082114,0.029506,0.011619,0.029604,0.022748,0.104002,0.073548,0.058034,0.103277,0.046508,0.026793,0.02023,0.017792,0.024828,0.025943,0.020624,0.017534,0.02437,0.025938,0.020623,0.017532,0.024373,0.01375,0.012595,0.025785,0.005043,0.018993,0.018086,0.010241,0.020523,0.035327,0.04365,0.006691,0.00889,0.007616,0.008116,0.007764,0.006329,0.005324,0.004965,0.004949,0.018538,0.0201,0.086504,0.024861,0.012636,0.012636,0.012636,0.012689,0.026811,0.027003,0.040001,0.031465,0.003689,0.0031,0.003118,0.002335,0.008923,0.009123,0.008923,0.009165,0.001518,0.002311,0.001518,0.002344,0.006214,0.019362,0.002383,0.018834,,,,,,0.009651,0.010223,0.009554,0.089274
AMT_CREDIT,,,0.987071,0.097036,0.001869,0.006794,0.054124,0.015246,0.005158,0.047797,0.054041,0.051809,0.04677,0.032313,0.030163,0.025408,0.00349,0.063735,0.023086,0.046795,0.044842,0.040707,0.052395,0.088988,0.006423,0.071121,0.010001,0.024531,0.027902,0.07163,0.069324,0.065416,0.013998,0.012412,0.008701,0.157017,0.127869,0.044563,0.023644,0.09703,0.014012,0.065536,0.002509,0.118005,0.04368,0.029061,0.02226,0.094181,0.093457,0.091218,0.070827,0.070309,0.067401,0.054452,0.005262,0.004822,0.002788,0.000343,0.052902,0.053966,0.051417,0.046061,0.064248,0.06209,0.055812,0.014393,0.013394,0.00955,0.038895,0.036931,0.03253,0.001327,0.001348,0.096681,0.094645,0.101444,0.109807,0.02312,0.015991,0.023251,0.052014,0.001339,0.029744,0.065604,0.001372,0.000754,9.3e-05,0.031092,0.030769,0.02826,0.053887,0.001238,0.014738,0.011658,0.0355,0.011913,0.054085,0.003764,0.00173,0.222169,0.222169,0.004412,0.126211,0.015244,0.031014,0.106321,0.048376,0.145604,0.031823,0.094023,0.065187,0.001174,0.046781,0.00389,0.006913,0.021228,0.055614,0.0081,0.097862,0.00165,0.06561,0.048195,0.002133,0.000673,0.057206,0.000646,0.026407,0.001059,0.003495,0.010051,0.021912,0.032698,0.046634,0.026608,0.018752,0.019314,0.003494,0.007595,0.025488,0.006733,0.031842,0.030477,0.11861,0.003454,0.005564,0.00169,0.02568,0.002484,0.017357,0.018021,0.003222,0.010311,0.000338,0.011443,0.000119,0.036481,0.007454,0.014087,0.008201,0.004807,7.4e-05,0.008644,0.000337,0.000747,0.000979,0.004053,0.000864,0.004641,0.004464,0.004168,0.00997,0.006728,0.006795,0.004316,0.001389,0.004845,0.009081,0.013183,0.007182,0.010162,0.007889,0.017597,0.001952,0.009251,0.017899,0.013263,0.007153,0.002287,0.01034,0.008775,0.003352,0.012359,0.008739,0.001027,0.002008,0.001784,0.002377,0.007883,0.004766,0.002273,0.001766,0.003213,0.000237,0.000588,0.009576,0.011949,0.012739,0.016838,0.007023,0.02463,0.013531,0.038949,0.011627,0.006644,0.007629,0.005877,0.005825,0.003411,0.006357,0.005123,0.008704,0.097377,0.057366,0.123361,0.038838,0.000113,0.659836,0.652039,0.376499,0.650445,0.561191,0.01835,0.115543,0.146235,0.776054,0.869904,0.126155,0.010565,0.094299,0.84833,0.148842,0.148842,0.138221,0.140192,0.145554,0.004728,0.150795,0.050256,0.084041,0.046768,0.009446,0.036342,0.001068,0.009042,0.007858,0.122431,0.112716,0.05507,0.094889,0.004903,0.004471,0.038704,0.05358,0.016007,0.023445,0.009843,0.024102,0.087042,0.016417,0.071947,0.029114,0.021255,0.014691,0.020986,0.003257,0.021255,0.00229,,0.036448,0.035494,0.007055,0.007174,,0.007475,0.087155,0.004825,0.062122,0.030714,,0.011066,,0.009986,0.002644,0.033675,0.002467,0.028366,0.001492,0.001487,,0.045663,0.043878,0.008646,0.008525,0.006119,0.00214,0.028008,0.026936,,0.030401,0.071328,0.025573,0.007062,0.014401,0.00412,0.030382,0.024421,0.113861,0.131495,0.083005,0.100264,0.003308,0.004677,0.051123,0.058088,0.020578,0.015015,0.073263,0.004243,0.081996,0.029738,,0.001038,0.036596,0.080209,0.02824,0.019243,0.034041,0.006594,0.008135,0.007365,0.123998,0.070159,0.017688,0.024242,0.001504,0.001564,0.006746,0.009128,0.010601,0.017203,0.005019,0.020719,0.07953,0.007571,0.060642,0.020827,,0.058528,0.207756,0.224774,0.185668,0.210306,0.178863,0.206655,0.06712,0.067136,0.186269,0.207572,0.064105,0.059669,0.041139,0.037855,0.04221,0.084078,0.058474,0.031413,0.027938,0.013462,0.005474,0.030786,0.032311,0.052309,0.010249,0.002547,0.013712,0.005653,,0.005836,0.002149,0.006798,0.010653,0.000848,0.006512,0.001945,,0.006887,0.006887,,0.004802,0.002274,0.000737,0.005756,0.005829,0.006258,0.001047,0.001053,0.0076,0.007053,0.003077,0.00556,0.005791,0.000722,0.012013,0.003335,0.00739,0.002131,0.002205,0.001272,0.001606,0.030284,0.004504,0.010249,0.018319,,0.03914,0.001352,0.052804,0.004068,,0.019165,0.000917,0.007583,0.017948,,0.004068,0.035928,0.026949,0.010238,0.047403,0.004511,0.012952,0.051498,0.000654,,0.002635,0.032383,0.00494,0.00895,0.003119,0.037751,0.011544,0.029377,0.048602,0.021645,0.03445,0.007388,,0.001053,0.003903,0.009205,0.006408,0.024693,0.000792,0.008256,0.009769,0.004653,0.004588,0.002221,0.022982,0.002045,0.002194,,0.003682,0.020704,0.008416,0.0112,0.038741,0.005948,0.007675,0.000854,0.001595,0.012547,0.006755,0.003054,0.004088,,0.000529,0.009718,0.017742,0.001115,0.020841,,0.015491,0.018446,0.032166,,0.052717,0.009265,0.020334,0.023714,0.001295,0.024772,0.000763,0.019934,,0.014797,0.02362,0.053901,0.00118,0.015701,0.022885,0.007968,0.02343,0.006246,0.005557,0.015112,,0.017442,0.053752,0.041798,0.044112,8.1e-05,,0.0263,0.014615,0.007115,0.031264,0.03796,0.021302,0.017474,0.049784,0.006001,0.001576,0.027333,0.019181,0.032615,0.042868,0.00475,0.004015,0.0114,0.005653,0.212812,0.220613,0.190616,0.204155,0.183791,0.200957,0.071623,0.066277,0.191089,0.209586,0.069225,0.059588,0.04222,0.035698,0.056745,0.085314,0.050555,0.041047,0.032628,0.01099,0.003232,0.035874,0.028027,0.056511,0.189552,0.201323,0.186025,0.19337,0.183741,0.193452,0.192365,0.20065,0.041862,0.052657,0.113325,0.11711,0.087098,0.062121,0.000308,0.001139,0.025599,0.024239,0.04645,0.04467,0.044089,0.072686,0.030095,0.004001,0.005563,0.005192,0.003952,0.030335,0.002835,0.002409,0.000617,0.044017,6e-05,0.006912,0.01439,,,0.030095,0.065562,0.174729,0.151022,0.166787,0.167364,0.043814,0.175207,0.154342,0.172769,0.168311,0.036051,0.081904,0.085191,0.054951,0.007073,0.006816,0.010546,0.006891,0.079943,0.065896,0.063177,0.086355,0.029337,0.042433,0.002364,0.006785,0.00589,0.003474,0.039926,0.00323,0.026077,0.012706,0.041115,0.013618,0.06796,0.028389,0.126936,0.125524,0.126386,0.032573,0.016738,0.039971,0.02934,0.042878,0.022025,0.101969,0.049451,0.046079,0.004043,0.055294,0.01782,0.060858,0.024485,0.075527,0.041397,0.000711,0.058355,0.034041,0.007421,0.056057,0.026803,0.102107,0.06977,0.04475,0.099718,0.044606,0.033699,0.016024,0.040348,0.029845,0.033293,0.016272,0.040281,0.029483,0.033311,0.016263,0.040295,0.029491,0.008779,0.028754,0.035629,0.00678,0.030331,0.002767,0.010066,0.058946,0.075768,0.086302,0.048101,0.018258,0.014137,0.014141,0.013231,0.003701,0.004824,0.004545,0.004537,0.017379,0.013385,0.124627,0.003048,0.011474,0.011474,0.011474,0.011525,0.004281,0.010702,0.026625,0.000621,0.000992,2.5e-05,0.000285,0.000985,0.005706,0.006018,0.005706,0.006036,0.00552,0.004836,0.00552,0.004913,0.003072,0.011344,0.013782,0.010947,,,,,,0.016327,0.016435,0.015131,0.125014
AMT_GOODS_PRICE,,,,0.0985,0.001993,0.005811,0.056174,0.015942,0.004635,0.050591,0.058788,0.056674,0.051719,0.036392,0.034239,0.029443,0.000206,0.062454,0.023655,0.046637,0.044725,0.04057,0.050516,0.091081,0.009287,0.073733,0.011589,0.025003,0.028142,0.075027,0.072888,0.069324,0.017456,0.01604,0.012374,0.164262,0.135863,0.049204,0.020461,0.075156,0.014446,0.063411,0.002443,0.122362,0.050109,0.044347,0.000138,0.099829,0.099031,0.096789,0.073934,0.0734,0.07024,0.064612,0.012137,0.011735,0.009407,0.000973,0.053598,0.057531,0.054995,0.049212,0.069633,0.067617,0.061497,0.0154,0.014162,0.010069,0.04337,0.041556,0.037141,0.001793,0.001765,0.105115,0.098352,0.103889,0.111468,0.023411,0.017522,0.025067,0.053452,0.001237,0.039466,0.070642,0.002455,0.001818,0.001259,0.036459,0.036068,0.033368,0.058451,0.002125,0.013483,0.01297,0.034254,0.010346,0.058297,0.003322,0.002475,0.186497,0.186497,0.004946,0.139416,0.014252,0.033702,0.1186,0.05187,0.150261,0.033422,0.095338,0.066726,0.00025,0.049938,0.00939,0.006695,0.022261,0.055042,0.009976,0.096971,0.002313,0.063472,0.047613,0.002172,0.000899,0.057853,0.002284,0.02714,0.000351,0.004323,0.011446,0.019732,0.033541,0.050853,0.029205,0.02133,0.021769,0.001712,0.007861,0.027538,0.008322,0.03828,0.032829,0.125692,0.001215,0.005718,0.001147,0.026277,0.002821,0.020923,0.017201,0.003643,0.0114,0.004847,0.010427,0.000154,0.036742,0.008043,0.014462,0.008482,0.004996,0.000555,0.006853,0.000248,0.001165,0.001196,0.004053,0.000863,0.004035,0.002952,0.004611,0.01161,0.006823,0.005676,0.004509,0.001968,0.005036,0.011166,0.015413,0.009562,0.011533,0.006206,0.017076,0.000871,0.009498,0.018654,0.014802,0.008404,0.002214,0.011147,0.007607,0.005124,0.013101,0.010144,0.001093,0.001901,0.001569,0.003843,0.00706,0.003976,0.002491,0.002171,0.003999,7.8e-05,0.000528,0.009739,0.011826,0.012604,0.016627,0.009237,0.02615,0.013771,0.041838,0.014356,0.008222,0.008113,0.006124,0.00678,0.001488,0.006761,0.004385,0.009419,0.090672,0.056795,0.120252,0.036465,0.000256,0.633224,0.631882,0.370443,0.655221,0.564238,0.114473,0.117715,0.149561,0.764105,0.860999,0.128881,0.013994,0.095506,0.833595,0.156606,0.156606,0.146517,0.149331,0.154767,0.006999,0.159569,0.054196,0.085832,0.045424,0.010125,0.037646,0.001365,0.008259,0.007116,0.127078,0.117411,0.056263,0.097692,0.005276,0.004834,0.041075,0.055498,0.015854,0.022043,0.009733,0.024376,0.09026,0.016177,0.074222,0.030323,0.026696,0.011131,0.02652,0.0028,0.026696,0.001563,,0.037613,0.036584,0.007474,0.007438,,0.007341,0.090763,0.004666,0.0634,0.029744,,0.010941,,0.00949,0.002998,0.033924,0.003248,0.031725,0.002406,0.002054,,0.050324,0.047363,0.01036,0.009203,0.00637,0.001681,0.032025,0.028275,,0.030133,0.073682,0.026049,0.007967,0.016904,0.003379,0.031129,0.024806,0.118774,0.136763,0.086371,0.10399,0.00388,0.005105,0.054374,0.06066,0.02056,0.014867,0.075324,0.003498,0.083896,0.029589,,0.000882,0.041797,0.077781,0.027854,0.022327,0.03134,0.00583,0.00693,0.006524,0.128148,0.073308,0.016022,0.022984,0.001033,0.00109,0.006741,0.008899,0.010025,0.01582,0.004872,0.02145,0.079923,0.010134,0.059545,0.022018,,0.060727,0.212434,0.229743,0.18938,0.215181,0.18076,0.20902,0.07037,0.068574,0.189895,0.210613,0.072706,0.068737,0.044498,0.038094,0.037806,0.081883,0.057847,0.031366,0.032034,0.02414,0.001883,0.026086,0.030769,0.051069,0.007698,0.004189,0.022784,0.005085,,0.005264,0.002609,0.006745,0.011659,0.000493,0.007193,0.002639,,0.006048,0.006048,,0.005604,0.002039,0.000323,0.005986,0.005536,0.008554,0.000214,0.001113,0.007496,0.007299,0.003277,0.005486,0.004887,0.000876,0.013227,0.00353,0.007716,0.002576,0.002563,0.001365,0.001307,0.030987,0.004951,0.007698,0.01579,,0.040473,0.003542,0.0534,0.001655,,0.02696,4.5e-05,0.007995,0.02569,,0.001655,0.03698,0.02662,0.009131,0.049142,0.004197,0.01335,0.051211,0.001101,,0.001231,0.03643,0.005802,0.009892,0.003711,0.038201,0.011619,0.031788,0.049253,0.025169,0.032997,0.007789,,0.000558,0.003868,0.01045,0.005201,0.03025,8.8e-05,0.007254,0.010338,0.003519,0.004924,0.003518,0.027603,0.001632,0.004594,,0.002902,0.019938,0.010444,0.011464,0.039579,0.00667,0.006526,0.002264,0.001615,0.014262,0.008167,0.001914,0.002473,,0.009771,0.009393,0.015709,0.005075,0.022359,,0.009043,0.020444,0.026089,,0.052504,0.009065,0.025916,0.024367,0.002834,0.018139,0.000519,0.015822,,0.013938,0.028973,0.055191,0.003206,0.01621,0.028084,0.009591,0.023052,0.003789,0.007334,0.009861,,0.024152,0.060383,0.047849,0.05121,0.001756,,0.03211,0.006854,0.008824,0.033728,0.041688,0.020224,0.020682,0.051614,0.008616,0.000743,0.031537,0.025334,0.036734,0.044797,0.000619,0.001805,0.011394,0.005085,0.217582,0.225814,0.194298,0.208429,0.185668,0.202697,0.074818,0.067757,0.194622,0.212896,0.077862,0.068781,0.045219,0.036052,0.051684,0.082471,0.05147,0.042325,0.03689,0.021217,0.00021,0.031182,0.026533,0.055399,0.191384,0.20168,0.188181,0.19443,0.184073,0.192561,0.193887,0.200946,0.05045,0.061122,0.115709,0.120556,0.082059,0.060427,0.006418,0.00657,0.020726,0.020282,0.044397,0.043554,0.040337,0.071791,0.030474,0.004081,0.005637,0.005436,0.004307,0.032556,0.003018,0.002868,0.000785,0.046504,0.00081,0.007312,0.013825,,,0.030474,0.066353,0.177198,0.156172,0.166214,0.171139,0.047789,0.177696,0.159835,0.172829,0.172166,0.035274,0.082497,0.082232,0.056519,0.00715,0.007054,0.010342,0.006971,0.082297,0.069328,0.066485,0.089079,0.032617,0.044938,0.00173,0.007643,0.003924,0.004036,0.042546,0.007209,0.026853,0.009903,0.038878,0.014491,0.06251,0.033244,0.130727,0.129425,0.130216,0.023307,0.028205,0.030944,0.022931,0.037574,0.015518,0.097919,0.051059,0.038958,0.013796,0.047864,0.014262,0.056478,0.020015,0.072942,0.040225,0.000472,0.06243,0.025582,0.01842,0.047761,0.020259,0.101366,0.070829,0.044964,0.099314,0.046614,0.024601,0.027391,0.031344,0.023585,0.024084,0.027689,0.031291,0.02313,0.024106,0.027678,0.031312,0.02314,0.000286,0.030363,0.036872,0.006644,0.030252,0.003437,0.006946,0.05321,0.072387,0.084676,0.042344,0.017869,0.013923,0.013649,0.01291,0.003943,0.004865,0.00453,0.004424,0.016409,0.004775,0.127617,0.00621,0.013688,0.013688,0.013688,0.013747,0.014573,0.001707,0.032518,0.009224,0.001169,0.000488,0.000699,7.8e-05,0.005637,0.00589,0.005637,0.005907,0.007402,0.006902,0.007402,0.006982,0.002627,0.011253,0.012617,0.010809,,,,,,0.016115,0.015911,0.014762,0.12865


In [18]:
threshold = 0.90

to_drop = [column for column in upper.columns if any(upper[column] > threshold)]
print('There are %d columns to remove.' % (len(to_drop)))

There are 183 columns to remove.


In [19]:
to_drop

['AMT_GOODS_PRICE',
 'APARTMENTS_MEDI',
 'APARTMENTS_MODE',
 'BASEMENTAREA_MEDI',
 'BASEMENTAREA_MODE',
 'COMMONAREA_MEDI',
 'COMMONAREA_MODE',
 'ELEVATORS_MEDI',
 'ELEVATORS_MODE',
 'ENTRANCES_MEDI',
 'ENTRANCES_MODE',
 'FLOORSMAX_MEDI',
 'FLOORSMAX_MODE',
 'FLOORSMIN_MEDI',
 'FLOORSMIN_MODE',
 'LANDAREA_MEDI',
 'LANDAREA_MODE',
 'LIVINGAPARTMENTS_AVG',
 'LIVINGAPARTMENTS_MEDI',
 'LIVINGAPARTMENTS_MODE',
 'LIVINGAREA_AVG',
 'LIVINGAREA_MEDI',
 'LIVINGAREA_MODE',
 'NONLIVINGAPARTMENTS_MEDI',
 'NONLIVINGAPARTMENTS_MODE',
 'NONLIVINGAREA_MEDI',
 'NONLIVINGAREA_MODE',
 'OBS_60_CNT_SOCIAL_CIRCLE',
 'REGION_RATING_CLIENT_W_CITY',
 'TOTALAREA_MODE',
 'YEARS_BEGINEXPLUATATION_MEDI',
 'YEARS_BEGINEXPLUATATION_MODE',
 'YEARS_BUILD_MEDI',
 'YEARS_BUILD_MODE',
 'HOUSETYPE_MODE_block of flats',
 'NAME_CONTRACT_TYPE_Revolving loans',
 'NAME_INCOME_TYPE_Pensioner',
 'birth_car_age_gap',
 'birth_last_phone_gap',
 'GOODS_PRICE_INCOME_PERC',
 'INCOME_PER_PERSON',
 'INCOME_PER_CHILD',
 'child_to_non_chi

In [20]:
train.drop(to_drop, axis=1, inplace=True)
test.drop(to_drop, axis=1, inplace=True)
del mini_train
gc.collect()
print(train.shape, test.shape)

(307507, 554) (48744, 553)


In [21]:
train = train.append(test).reset_index(drop=True)
train.to_csv(os.path.join(PATH_TO_DATA, 'df_all_files_with_fs.csv'), index=False)

del train, test, train_missing, test_missing
gc.collect()

14