In [1]:
import pandas as pd 
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', 200)
import numpy as np
import numpy_financial as npf
import matplotlib.pyplot as plt 
%matplotlib inline
import seaborn as sns # for making plots with seaborn
color = sns.color_palette()
import random
import re

## Contents

**[1. Instalments Payments](#1.-Instalments-Payments)**
    
**[2. Credit Card Balance](#2.-Credit-Card-Balance)**
   
**[3. Bureau & Bureau Balance](#3.-Bureau-&-Bureau-Balance)**

**[4. POS CASH](#4.-POS-CASH)**
    
**[5. Previous Applications](#5.-Previous-Applications)**
   
**[6. Combining everything into train and test set](#6.-Combining-everything-into-train-and-test-set)**
- [6.1. Merging past & bureau data into train_1 and test_1](#6.1.-Merging-past-&-bureau-data-into-train_1-and-test_1)
- [6.2. Merging bureau data into train_2 and test_2](#6.2.-Merging-bureau-data-into-train_2-and-test_2)
- [6.3. Merging past data into train_3 and test_3](#6.3.-Merging-past-data-into-train_3-and-test_3)
- [6.4. Preparing data for train_4 and test_4](#6.4.-Preparing-data-for-train_4-and-test_4)

Looking at other datasets, generate new features:


In [2]:
bureau_bal = pd.read_csv('../datasets/bureau_balance.csv')
bureau = pd.read_csv('../datasets/bureau.csv')
pre_app = pd.read_csv('../datasets/previous_application.csv')
install_pay = pd.read_csv('../datasets/installments_payments.csv')
cc = pd.read_csv('../datasets/credit_card_balance.csv')
pos = pd.read_csv('../datasets/pos_cash_balance.csv')

In [3]:
# reuse our missing data function from EDA noteboook
def missing_data(df):
    total_num_missing = df.isnull().sum()
    total_percent_missing = df.isnull().sum()/len(df)*100
    total_missing_df = pd.concat([total_num_missing, total_percent_missing], axis=1, keys=['Total', '% of Missing Values'])
    total_missing_df = total_missing_df[
        total_missing_df.iloc[:,1] != 0].sort_values('% of Missing Values', ascending=False).round(1)
    print('The dataframe has ' + str(df.shape[1]) + ' columns.\n' 
         'There are ' +str(total_missing_df.shape[0]) + ' columns that have missing values.')
    return total_missing_df

In [4]:
# define function to sum up the columns we want
def do_sum(df, groupby_cols, counted, agg_name):
    gp = df[groupby_cols + [counted]].groupby(groupby_cols)[counted].sum().reset_index().rename(columns={counted: agg_name})
    df = df.merge(gp, on=groupby_cols, how='left')
    return df

In [5]:
# define function to aggregate the df 
def group(df_to_agg, prefix, aggregations, aggregate_by= 'SK_ID_CURR'):
    agg_df = df_to_agg.groupby(aggregate_by).agg(aggregations)
    agg_df.columns = pd.Index(['{}{}_{}'.format(prefix, e[0], e[1].upper())
                               for e in agg_df.columns.tolist()])
    return agg_df.reset_index()

In [6]:
# def function to group and merge to a dataframe
def group_and_merge(df_to_agg, df_to_merge, prefix, aggregations, aggregate_by= 'SK_ID_CURR'):
    agg_df = group(df_to_agg, prefix, aggregations, aggregate_by= aggregate_by)
    return df_to_merge.merge(agg_df, how='left', on= aggregate_by)

## 1. Instalments Payments
[top](#Contents)

In [7]:
missing_data(install_pay)

The dataframe has 8 columns.
There are 2 columns that have missing values.


Unnamed: 0,Total,% of Missing Values
DAYS_ENTRY_PAYMENT,2905,0.0
AMT_PAYMENT,2905,0.0


This dataset gives the history of payments in previous contracts that the current applicant has taken out. We would like to aggregate and engineer some features based on applicant's past payment behavior, specifically, we would like to determine:
- was monthly instalment amount fully paid
- ratio of payment amount and instalment amount, i.e did applicant paid more and hence, aim to end the contract earlier, or was payment less
- was payment on time, early, or late
- if late, was it 30-days or 60-days past due
- recent payment behavior

However, before aggregating the data, we have to appreciate some nuances in applicant's payment behavior. In our example below of a sample contract, we see that payment was made twice for instalment number 3, 10, 11. For these instalment number, the applicant has split the payment twice to meet the instalment amount. However, if we were to do row-wise aggregation, some rows will be flagged as the applicant has underpaid, making him look like a bad customer which is certainly not the case!

In [8]:
# example
install_pay.loc[install_pay['SK_ID_PREV'] == 2069908].sort_values('NUM_INSTALMENT_NUMBER')

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,NUM_INSTALMENT_VERSION,NUM_INSTALMENT_NUMBER,DAYS_INSTALMENT,DAYS_ENTRY_PAYMENT,AMT_INSTALMENT,AMT_PAYMENT
2498001,2069908,166397,1.0,1,-1010.0,-1025.0,27982.575,27982.575
2822705,2069908,166397,1.0,2,-980.0,-997.0,27982.575,27982.575
3557451,2069908,166397,1.0,3,-950.0,-968.0,27982.575,27982.035
1251429,2069908,166397,1.0,3,-950.0,-937.0,27982.575,0.54
95318,2069908,166397,1.0,4,-920.0,-937.0,27982.575,27982.575
2283016,2069908,166397,1.0,5,-890.0,-906.0,27982.575,27982.575
2578653,2069908,166397,1.0,6,-860.0,-877.0,27982.575,27982.575
3770650,2069908,166397,1.0,7,-830.0,-843.0,27982.575,27982.575
1224304,2069908,166397,1.0,8,-800.0,-806.0,27982.575,27982.575
1159113,2069908,166397,1.0,9,-770.0,-772.0,27982.575,27982.575


In [9]:
install_pay = do_sum(install_pay, ['SK_ID_PREV', 'NUM_INSTALMENT_NUMBER'], 'AMT_PAYMENT', 'AMT_PAYMENT_GROUPED')

In [10]:
# check
install_pay.loc[install_pay['SK_ID_PREV'] == 2069908].sort_values('NUM_INSTALMENT_NUMBER')


Unnamed: 0,SK_ID_PREV,SK_ID_CURR,NUM_INSTALMENT_VERSION,NUM_INSTALMENT_NUMBER,DAYS_INSTALMENT,DAYS_ENTRY_PAYMENT,AMT_INSTALMENT,AMT_PAYMENT,AMT_PAYMENT_GROUPED
2498001,2069908,166397,1.0,1,-1010.0,-1025.0,27982.575,27982.575,27982.575
2822705,2069908,166397,1.0,2,-980.0,-997.0,27982.575,27982.575,27982.575
3557451,2069908,166397,1.0,3,-950.0,-968.0,27982.575,27982.035,27982.575
1251429,2069908,166397,1.0,3,-950.0,-937.0,27982.575,0.54,27982.575
95318,2069908,166397,1.0,4,-920.0,-937.0,27982.575,27982.575,27982.575
2283016,2069908,166397,1.0,5,-890.0,-906.0,27982.575,27982.575,27982.575
2578653,2069908,166397,1.0,6,-860.0,-877.0,27982.575,27982.575,27982.575
3770650,2069908,166397,1.0,7,-830.0,-843.0,27982.575,27982.575,27982.575
1224304,2069908,166397,1.0,8,-800.0,-806.0,27982.575,27982.575,27982.575
1159113,2069908,166397,1.0,9,-770.0,-772.0,27982.575,27982.575,27982.575


In [11]:
# create features that calculate number of days payment was early or late
install_pay['DAYS_BEFORE_DUE'] = install_pay['DAYS_INSTALMENT'] - install_pay['DAYS_ENTRY_PAYMENT']
install_pay['DAYS_BEFORE_DUE'] = install_pay['DAYS_BEFORE_DUE'].apply(lambda x: 0 if x<=0 else x)
install_pay['DAYS_PAST_DUE'] =  install_pay['DAYS_ENTRY_PAYMENT'] - install_pay['DAYS_INSTALMENT'] 
install_pay['DAYS_PAST_DUE'] = install_pay['DAYS_PAST_DUE'].apply(lambda x: 0 if x<=0 else x)

# flag late payments
install_pay['FLAG_LATE_PAY'] = install_pay['DAYS_PAST_DUE'].apply(lambda x: 1 if x>0 else 0)

# % of payments that were late
install_pay['INSTALL_PAY_RATIO'] = install_pay['AMT_PAYMENT'] / install_pay['AMT_INSTALMENT']
install_pay['LATE_PAY_RATIO'] = install_pay.apply(lambda x: x['INSTALL_PAY_RATIO'] if x['FLAG_LATE_PAY']==1 else 0, axis=1)

# Flag late payments that have a significant amount > 20%
install_pay['SIGNIFICANT_LATE_PAY'] = install_pay['LATE_PAY_RATIO'].apply(lambda x: 1 if x > 0.20 else 0)

# create feature FLAG_30DAYS_DUE where 1 = payment was late by 30 days
install_pay['FLAG_15DAYS_DUE'] = install_pay['DAYS_PAST_DUE'].apply(lambda x: 1 if x >= 15 else 0)

# create feature FLAG_30DAYS_DUE where 1 = payment was late by 30 days
install_pay['FLAG_30DAYS_DUE'] = install_pay['DAYS_PAST_DUE'].apply(lambda x: 1 if x >= 30 else 0)

# create feature FLAG_60DAYS_DUE where 1 = payment was late by 60 days
install_pay['FLAG_60DAYS_DUE'] = install_pay['DAYS_PAST_DUE'].apply(lambda x: 1 if x >= 60 else 0)

# create feature PAYMENT_RATIO which is payment amt / instalment amt
install_pay['PAYMENT_RATIO'] = install_pay['AMT_PAYMENT_GROUPED'] / install_pay['AMT_INSTALMENT']

# create feature FLAG_PAYMENT_OVER which indicates that payment was more than the instalment amount
install_pay['PAYMENT_OVER'] = install_pay['AMT_PAYMENT'] - install_pay['AMT_INSTALMENT']
install_pay['FLAG_PAYMENT_OVER'] = install_pay['PAYMENT_OVER'].apply(lambda x: 1 if x>0 else 0)


In [12]:
# for overall instalment history
instalments_agg = {'SK_ID_PREV': ['nunique'],
                    'DAYS_ENTRY_PAYMENT': ['mean', 'min', 'max'], 
                    'AMT_INSTALMENT': ['mean', 'min', 'max', 'std'], 
                    'AMT_PAYMENT': ['mean', 'min', 'max', 'std'],
                    'DAYS_BEFORE_DUE': ['mean', 'max', 'std'],
                    'DAYS_PAST_DUE': ['mean', 'max', 'std'],
                    'FLAG_LATE_PAY': ['mean', 'sum'],
                    'INSTALL_PAY_RATIO': ['mean', 'std'],
                    'LATE_PAY_RATIO': ['mean', 'std'],
                    'SIGNIFICANT_LATE_PAY': ['mean', 'sum'], 
                    'FLAG_15DAYS_DUE': ['mean'], 
                    'FLAG_30DAYS_DUE': ['mean'],
                    'FLAG_60DAYS_DUE': ['mean'],
                    'PAYMENT_RATIO': ['mean'],
                    'FLAG_PAYMENT_OVER': ['mean']
                    }

# for recent instalment history
instalments_time_agg = {'SK_ID_PREV': ['size'],
                        'DAYS_ENTRY_PAYMENT': ['mean', 'min', 'max'], 
                        'AMT_INSTALMENT': ['mean', 'min', 'max', 'std'], 
                        'AMT_PAYMENT': ['mean', 'min', 'max', 'std'],
                        'DAYS_BEFORE_DUE': ['mean', 'max', 'std'],
                        'DAYS_PAST_DUE': ['mean', 'max', 'std'],
                        'FLAG_LATE_PAY': ['mean', 'sum'],
                        'INSTALL_PAY_RATIO': ['mean', 'std'],
                        'LATE_PAY_RATIO': ['mean', 'std'],
                        'SIGNIFICANT_LATE_PAY': ['mean', 'sum'], 
                        'FLAG_15DAYS_DUE': ['mean'], 
                        'FLAG_30DAYS_DUE': ['mean'],
                        'FLAG_60DAYS_DUE': ['mean'],
                        'PAYMENT_RATIO': ['mean'],
                        'FLAG_PAYMENT_OVER': ['mean']
                        }

In [13]:
# aggregate df
install_pay_agg = group(install_pay, 'INS_', instalments_agg)

In [14]:
install_pay_agg.head(3)

Unnamed: 0,SK_ID_CURR,INS_SK_ID_PREV_NUNIQUE,INS_DAYS_ENTRY_PAYMENT_MEAN,INS_DAYS_ENTRY_PAYMENT_MIN,INS_DAYS_ENTRY_PAYMENT_MAX,INS_AMT_INSTALMENT_MEAN,INS_AMT_INSTALMENT_MIN,INS_AMT_INSTALMENT_MAX,INS_AMT_INSTALMENT_STD,INS_AMT_PAYMENT_MEAN,INS_AMT_PAYMENT_MIN,INS_AMT_PAYMENT_MAX,INS_AMT_PAYMENT_STD,INS_DAYS_BEFORE_DUE_MEAN,INS_DAYS_BEFORE_DUE_MAX,INS_DAYS_BEFORE_DUE_STD,INS_DAYS_PAST_DUE_MEAN,INS_DAYS_PAST_DUE_MAX,INS_DAYS_PAST_DUE_STD,INS_FLAG_LATE_PAY_MEAN,INS_FLAG_LATE_PAY_SUM,INS_INSTALL_PAY_RATIO_MEAN,INS_INSTALL_PAY_RATIO_STD,INS_LATE_PAY_RATIO_MEAN,INS_LATE_PAY_RATIO_STD,INS_SIGNIFICANT_LATE_PAY_MEAN,INS_SIGNIFICANT_LATE_PAY_SUM,INS_FLAG_15DAYS_DUE_MEAN,INS_FLAG_30DAYS_DUE_MEAN,INS_FLAG_60DAYS_DUE_MEAN,INS_PAYMENT_RATIO_MEAN,INS_FLAG_PAYMENT_OVER_MEAN
0,100001,2,-2195.000000,-2916.0,-1628.0,5885.132143,3951.000,17397.900,5076.676624,5885.132143,3951.000,17397.900,5076.676624,8.857143,36.0,12.811825,1.571429,11.0,4.157609,0.142857,1,1.000000,0.000000,0.142857,0.377964,0.142857,1,0.0,0.0,0.0,1.000000,0.000000
1,100002,1,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000
2,100003,3,-1385.320000,-2324.0,-544.0,64754.586000,6662.970,560835.360,110542.592300,64754.586000,6662.970,560835.360,110542.592300,7.160000,14.0,3.726929,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000
3,100004,1,-761.666667,-795.0,-727.0,7096.155000,5357.250,10573.965,3011.871810,7096.155000,5357.250,10573.965,3011.871810,7.666667,11.0,4.163332,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000
4,100005,1,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1,1.000000,0.000000,0.111111,0.333333,0.111111,1,0.0,0.0,0.0,1.000000,0.000000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
339582,456251,1,-156.285714,-237.0,-38.0,7492.924286,6605.910,12815.010,2346.819209,7492.924286,6605.910,12815.010,2346.819209,36.285714,46.0,14.079705,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000
339583,456252,1,-2393.833333,-2470.0,-2327.0,10069.867500,10046.880,10074.465,11.261529,10069.867500,10046.880,10074.465,11.261529,3.333333,11.0,4.082483,0.500000,3.0,1.224745,0.166667,1,1.000000,0.000000,0.166667,0.408248,0.166667,1,0.0,0.0,0.0,1.000000,0.000000
339584,456253,3,-2387.428571,-2915.0,-1738.0,4399.707857,2754.450,5575.185,1145.446623,4115.915357,27.270,5575.185,1638.228743,15.142857,51.0,15.629642,0.642857,9.0,2.405351,0.071429,1,0.928571,0.265292,0.070938,0.265427,0.071429,1,0.0,0.0,0.0,1.000000,0.000000
339585,456254,2,-161.263158,-317.0,-18.0,10239.832895,2296.440,19065.825,8602.512994,10239.832895,2296.440,19065.825,8602.512994,19.000000,31.0,8.198916,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000


In [15]:
# looking at data in recent 2, and 4 years
for months in [24, 48]:
    recent_id_prev = install_pay[install_pay['DAYS_INSTALMENT'] >= -30*months]['SK_ID_PREV'].unique()
    pay_recent = install_pay[install_pay['SK_ID_PREV'].isin(recent_id_prev)]
    prefix = f'INS_{months}M_'
    install_pay_agg = group_and_merge(pay_recent, install_pay_agg, prefix, instalments_time_agg)

In [16]:
# check
install_pay_agg.head(3)

Unnamed: 0,SK_ID_CURR,INS_SK_ID_PREV_NUNIQUE,INS_DAYS_ENTRY_PAYMENT_MEAN,INS_DAYS_ENTRY_PAYMENT_MIN,INS_DAYS_ENTRY_PAYMENT_MAX,INS_AMT_INSTALMENT_MEAN,INS_AMT_INSTALMENT_MIN,INS_AMT_INSTALMENT_MAX,INS_AMT_INSTALMENT_STD,INS_AMT_PAYMENT_MEAN,INS_AMT_PAYMENT_MIN,INS_AMT_PAYMENT_MAX,INS_AMT_PAYMENT_STD,INS_DAYS_BEFORE_DUE_MEAN,INS_DAYS_BEFORE_DUE_MAX,INS_DAYS_BEFORE_DUE_STD,INS_DAYS_PAST_DUE_MEAN,INS_DAYS_PAST_DUE_MAX,INS_DAYS_PAST_DUE_STD,INS_FLAG_LATE_PAY_MEAN,INS_FLAG_LATE_PAY_SUM,INS_INSTALL_PAY_RATIO_MEAN,INS_INSTALL_PAY_RATIO_STD,INS_LATE_PAY_RATIO_MEAN,INS_LATE_PAY_RATIO_STD,INS_SIGNIFICANT_LATE_PAY_MEAN,INS_SIGNIFICANT_LATE_PAY_SUM,INS_FLAG_15DAYS_DUE_MEAN,INS_FLAG_30DAYS_DUE_MEAN,INS_FLAG_60DAYS_DUE_MEAN,INS_PAYMENT_RATIO_MEAN,INS_FLAG_PAYMENT_OVER_MEAN,INS_24M_SK_ID_PREV_SIZE,INS_24M_DAYS_ENTRY_PAYMENT_MEAN,INS_24M_DAYS_ENTRY_PAYMENT_MIN,INS_24M_DAYS_ENTRY_PAYMENT_MAX,INS_24M_AMT_INSTALMENT_MEAN,INS_24M_AMT_INSTALMENT_MIN,INS_24M_AMT_INSTALMENT_MAX,INS_24M_AMT_INSTALMENT_STD,INS_24M_AMT_PAYMENT_MEAN,INS_24M_AMT_PAYMENT_MIN,INS_24M_AMT_PAYMENT_MAX,INS_24M_AMT_PAYMENT_STD,INS_24M_DAYS_BEFORE_DUE_MEAN,INS_24M_DAYS_BEFORE_DUE_MAX,INS_24M_DAYS_BEFORE_DUE_STD,INS_24M_DAYS_PAST_DUE_MEAN,INS_24M_DAYS_PAST_DUE_MAX,INS_24M_DAYS_PAST_DUE_STD,INS_24M_FLAG_LATE_PAY_MEAN,INS_24M_FLAG_LATE_PAY_SUM,INS_24M_INSTALL_PAY_RATIO_MEAN,INS_24M_INSTALL_PAY_RATIO_STD,INS_24M_LATE_PAY_RATIO_MEAN,INS_24M_LATE_PAY_RATIO_STD,INS_24M_SIGNIFICANT_LATE_PAY_MEAN,INS_24M_SIGNIFICANT_LATE_PAY_SUM,INS_24M_FLAG_15DAYS_DUE_MEAN,INS_24M_FLAG_30DAYS_DUE_MEAN,INS_24M_FLAG_60DAYS_DUE_MEAN,INS_24M_PAYMENT_RATIO_MEAN,INS_24M_FLAG_PAYMENT_OVER_MEAN,INS_48M_SK_ID_PREV_SIZE,INS_48M_DAYS_ENTRY_PAYMENT_MEAN,INS_48M_DAYS_ENTRY_PAYMENT_MIN,INS_48M_DAYS_ENTRY_PAYMENT_MAX,INS_48M_AMT_INSTALMENT_MEAN,INS_48M_AMT_INSTALMENT_MIN,INS_48M_AMT_INSTALMENT_MAX,INS_48M_AMT_INSTALMENT_STD,INS_48M_AMT_PAYMENT_MEAN,INS_48M_AMT_PAYMENT_MIN,INS_48M_AMT_PAYMENT_MAX,INS_48M_AMT_PAYMENT_STD,INS_48M_DAYS_BEFORE_DUE_MEAN,INS_48M_DAYS_BEFORE_DUE_MAX,INS_48M_DAYS_BEFORE_DUE_STD,INS_48M_DAYS_PAST_DUE_MEAN,INS_48M_DAYS_PAST_DUE_MAX,INS_48M_DAYS_PAST_DUE_STD,INS_48M_FLAG_LATE_PAY_MEAN,INS_48M_FLAG_LATE_PAY_SUM,INS_48M_INSTALL_PAY_RATIO_MEAN,INS_48M_INSTALL_PAY_RATIO_STD,INS_48M_LATE_PAY_RATIO_MEAN,INS_48M_LATE_PAY_RATIO_STD,INS_48M_SIGNIFICANT_LATE_PAY_MEAN,INS_48M_SIGNIFICANT_LATE_PAY_SUM,INS_48M_FLAG_15DAYS_DUE_MEAN,INS_48M_FLAG_30DAYS_DUE_MEAN,INS_48M_FLAG_60DAYS_DUE_MEAN,INS_48M_PAYMENT_RATIO_MEAN,INS_48M_FLAG_PAYMENT_OVER_MEAN
0,100001,2,-2195.000000,-2916.0,-1628.0,5885.132143,3951.000,17397.900,5076.676624,5885.132143,3951.000,17397.900,5076.676624,8.857143,36.0,12.811825,1.571429,11.0,4.157609,0.142857,1,1.000000,0.000000,0.142857,0.377964,0.142857,1,0.0,0.0,0.0,1.000000,0.000000,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,100002,1,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000,19.0,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000,19.0,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000
2,100003,3,-1385.320000,-2324.0,-544.0,64754.586000,6662.970,560835.360,110542.592300,64754.586000,6662.970,560835.360,110542.592300,7.160000,14.0,3.726929,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000,13.0,-677.846154,-806.0,-544.0,118314.713077,64275.615,560835.360,134033.060606,118314.713077,64275.615,560835.360,134033.060606,7.538462,14.0,3.950008,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000,13.0,-677.846154,-806.0,-544.0,118314.713077,64275.615,560835.360,134033.060606,118314.713077,64275.615,560835.360,134033.060606,7.538462,14.0,3.950008,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000
3,100004,1,-761.666667,-795.0,-727.0,7096.155000,5357.250,10573.965,3011.871810,7096.155000,5357.250,10573.965,3011.871810,7.666667,11.0,4.163332,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3.0,-761.666667,-795.0,-727.0,7096.155000,5357.250,10573.965,3011.871810,7096.155000,5357.250,10573.965,3011.871810,7.666667,11.0,4.163332,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000
4,100005,1,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1,1.000000,0.000000,0.111111,0.333333,0.111111,1,0.0,0.0,0.0,1.000000,0.000000,9.0,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1.0,1.000000,0.000000,0.111111,0.333333,0.111111,1.0,0.0,0.0,0.0,1.000000,0.000000,9.0,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1.0,1.000000,0.000000,0.111111,0.333333,0.111111,1.0,0.0,0.0,0.0,1.000000,0.000000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
339582,456251,1,-156.285714,-237.0,-38.0,7492.924286,6605.910,12815.010,2346.819209,7492.924286,6605.910,12815.010,2346.819209,36.285714,46.0,14.079705,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000,7.0,-156.285714,-237.0,-38.0,7492.924286,6605.910,12815.010,2346.819209,7492.924286,6605.910,12815.010,2346.819209,36.285714,46.0,14.079705,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000,7.0,-156.285714,-237.0,-38.0,7492.924286,6605.910,12815.010,2346.819209,7492.924286,6605.910,12815.010,2346.819209,36.285714,46.0,14.079705,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000
339583,456252,1,-2393.833333,-2470.0,-2327.0,10069.867500,10046.880,10074.465,11.261529,10069.867500,10046.880,10074.465,11.261529,3.333333,11.0,4.082483,0.500000,3.0,1.224745,0.166667,1,1.000000,0.000000,0.166667,0.408248,0.166667,1,0.0,0.0,0.0,1.000000,0.000000,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
339584,456253,3,-2387.428571,-2915.0,-1738.0,4399.707857,2754.450,5575.185,1145.446623,4115.915357,27.270,5575.185,1638.228743,15.142857,51.0,15.629642,0.642857,9.0,2.405351,0.071429,1,0.928571,0.265292,0.070938,0.265427,0.071429,1,0.0,0.0,0.0,1.000000,0.000000,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
339585,456254,2,-161.263158,-317.0,-18.0,10239.832895,2296.440,19065.825,8602.512994,10239.832895,2296.440,19065.825,8602.512994,19.000000,31.0,8.198916,0.000000,0.0,0.000000,0.000000,0,1.000000,0.000000,0.000000,0.000000,0.000000,0,0.0,0.0,0.0,1.000000,0.000000,19.0,-161.263158,-317.0,-18.0,10239.832895,2296.440,19065.825,8602.512994,10239.832895,2296.440,19065.825,8602.512994,19.000000,31.0,8.198916,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000,19.0,-161.263158,-317.0,-18.0,10239.832895,2296.440,19065.825,8602.512994,10239.832895,2296.440,19065.825,8602.512994,19.000000,31.0,8.198916,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,1.000000,0.000000


## 2. Credit Card Balance
[top](#Contents)

In [17]:
missing_data(cc)

The dataframe has 23 columns.
There are 9 columns that have missing values.


Unnamed: 0,Total,% of Missing Values
AMT_PAYMENT_CURRENT,767988,20.0
AMT_DRAWINGS_ATM_CURRENT,749816,19.5
AMT_DRAWINGS_OTHER_CURRENT,749816,19.5
AMT_DRAWINGS_POS_CURRENT,749816,19.5
CNT_DRAWINGS_ATM_CURRENT,749816,19.5
CNT_DRAWINGS_OTHER_CURRENT,749816,19.5
CNT_DRAWINGS_POS_CURRENT,749816,19.5
AMT_INST_MIN_REGULARITY,305236,7.9
CNT_INSTALMENT_MATURE_CUM,305236,7.9


In [18]:
# sort df by SK_ID_PREV and Months Balance to order the data
cc = cc.sort_values(by=['SK_ID_PREV', 'MONTHS_BALANCE'])

In [19]:
# example of a previous credit card account
cc.loc[cc['SK_ID_PREV']==1000096]

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,MONTHS_BALANCE,AMT_BALANCE,AMT_CREDIT_LIMIT_ACTUAL,AMT_DRAWINGS_ATM_CURRENT,AMT_DRAWINGS_CURRENT,AMT_DRAWINGS_OTHER_CURRENT,AMT_DRAWINGS_POS_CURRENT,AMT_INST_MIN_REGULARITY,AMT_PAYMENT_CURRENT,AMT_PAYMENT_TOTAL_CURRENT,AMT_RECEIVABLE_PRINCIPAL,AMT_RECIVABLE,AMT_TOTAL_RECEIVABLE,CNT_DRAWINGS_ATM_CURRENT,CNT_DRAWINGS_CURRENT,CNT_DRAWINGS_OTHER_CURRENT,CNT_DRAWINGS_POS_CURRENT,CNT_INSTALMENT_MATURE_CUM,NAME_CONTRACT_STATUS,SK_DPD,SK_DPD_DEF
1514052,1000096,306118,-96,177072.57,180000,13500.0,13500.0,0.0,0.0,9000.0,9000.0,9000.0,171077.805,177072.57,177072.57,1.0,1,0.0,0.0,7.0,Active,0,0
96202,1000096,306118,-95,178592.94,180000,4500.0,4500.0,0.0,0.0,9000.0,9000.0,9000.0,172572.57,178592.94,178592.94,1.0,1,0.0,0.0,8.0,Active,0,0
2250768,1000096,306118,-94,180242.37,180000,0.0,5098.5,0.0,5098.5,9000.0,9000.0,9000.0,174691.44,180242.37,180242.37,0.0,1,0.0,1.0,9.0,Active,0,0
734483,1000096,306118,-93,176652.495,180000,0.0,0.0,0.0,0.0,9000.0,9000.0,9000.0,171242.37,176652.495,176652.495,0.0,0,0.0,0.0,10.0,Active,0,0
2117399,1000096,306118,-92,31753.71,180000,0.0,0.0,0.0,0.0,9000.0,148500.0,148500.0,28152.495,31753.71,31753.71,0.0,0,0.0,0.0,11.0,Active,0,0
1899634,1000096,306118,-91,25857.45,180000,0.0,0.0,0.0,0.0,9000.0,9000.0,9000.0,22753.71,25857.45,25857.45,0.0,0,0.0,0.0,12.0,Active,0,0
911548,1000096,306118,-90,19906.65,180000,0.0,0.0,0.0,0.0,9000.0,9000.0,9000.0,16857.45,19906.65,19906.65,0.0,0,0.0,0.0,13.0,Active,0,0
1342104,1000096,306118,-89,21766.41,180000,6750.0,7200.0,0.0,450.0,9000.0,9000.0,9000.0,18106.65,21766.41,21766.41,1.0,2,0.0,1.0,14.0,Active,0,0
1033852,1000096,306118,-88,79502.985,180000,0.0,63027.0,0.0,63027.0,9000.0,9000.0,9000.0,75793.41,79502.985,79502.985,0.0,1,0.0,1.0,15.0,Active,0,0
1906048,1000096,306118,-87,119878.74,180000,45000.0,45000.0,0.0,0.0,9000.0,9000.0,9000.0,115502.985,119878.74,119878.74,2.0,2,0.0,0.0,16.0,Active,0,0


In [20]:
cc.shape

(3840312, 23)

In [21]:
# set marker column to identify the row with contract status == 'Completed'
cc['marker'] = cc['NAME_CONTRACT_STATUS'].apply(lambda x: -99 if x=='Completed' else random.uniform(0,100))

#drop duplicates based on subsets
cc.drop_duplicates(subset=['SK_ID_PREV', 'NAME_CONTRACT_STATUS', 'marker'], keep='first', inplace=True)


In [22]:
# check
# example of a previous credit card account
cc.loc[cc['SK_ID_PREV']==1000096]

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,MONTHS_BALANCE,AMT_BALANCE,AMT_CREDIT_LIMIT_ACTUAL,AMT_DRAWINGS_ATM_CURRENT,AMT_DRAWINGS_CURRENT,AMT_DRAWINGS_OTHER_CURRENT,AMT_DRAWINGS_POS_CURRENT,AMT_INST_MIN_REGULARITY,AMT_PAYMENT_CURRENT,AMT_PAYMENT_TOTAL_CURRENT,AMT_RECEIVABLE_PRINCIPAL,AMT_RECIVABLE,AMT_TOTAL_RECEIVABLE,CNT_DRAWINGS_ATM_CURRENT,CNT_DRAWINGS_CURRENT,CNT_DRAWINGS_OTHER_CURRENT,CNT_DRAWINGS_POS_CURRENT,CNT_INSTALMENT_MATURE_CUM,NAME_CONTRACT_STATUS,SK_DPD,SK_DPD_DEF,marker
1514052,1000096,306118,-96,177072.57,180000,13500.0,13500.0,0.0,0.0,9000.0,9000.0,9000.0,171077.805,177072.57,177072.57,1.0,1,0.0,0.0,7.0,Active,0,0,80.153613
96202,1000096,306118,-95,178592.94,180000,4500.0,4500.0,0.0,0.0,9000.0,9000.0,9000.0,172572.57,178592.94,178592.94,1.0,1,0.0,0.0,8.0,Active,0,0,40.130008
2250768,1000096,306118,-94,180242.37,180000,0.0,5098.5,0.0,5098.5,9000.0,9000.0,9000.0,174691.44,180242.37,180242.37,0.0,1,0.0,1.0,9.0,Active,0,0,45.350077
734483,1000096,306118,-93,176652.495,180000,0.0,0.0,0.0,0.0,9000.0,9000.0,9000.0,171242.37,176652.495,176652.495,0.0,0,0.0,0.0,10.0,Active,0,0,31.532693
2117399,1000096,306118,-92,31753.71,180000,0.0,0.0,0.0,0.0,9000.0,148500.0,148500.0,28152.495,31753.71,31753.71,0.0,0,0.0,0.0,11.0,Active,0,0,90.145127
1899634,1000096,306118,-91,25857.45,180000,0.0,0.0,0.0,0.0,9000.0,9000.0,9000.0,22753.71,25857.45,25857.45,0.0,0,0.0,0.0,12.0,Active,0,0,24.191556
911548,1000096,306118,-90,19906.65,180000,0.0,0.0,0.0,0.0,9000.0,9000.0,9000.0,16857.45,19906.65,19906.65,0.0,0,0.0,0.0,13.0,Active,0,0,99.571806
1342104,1000096,306118,-89,21766.41,180000,6750.0,7200.0,0.0,450.0,9000.0,9000.0,9000.0,18106.65,21766.41,21766.41,1.0,2,0.0,1.0,14.0,Active,0,0,40.230359
1033852,1000096,306118,-88,79502.985,180000,0.0,63027.0,0.0,63027.0,9000.0,9000.0,9000.0,75793.41,79502.985,79502.985,0.0,1,0.0,1.0,15.0,Active,0,0,42.544986
1906048,1000096,306118,-87,119878.74,180000,45000.0,45000.0,0.0,0.0,9000.0,9000.0,9000.0,115502.985,119878.74,119878.74,2.0,2,0.0,0.0,16.0,Active,0,0,68.513159


In [23]:
# create feature to look at usage to credit limit
cc['USAGE_RATIO'] = cc['AMT_BALANCE'] / cc['AMT_CREDIT_LIMIT_ACTUAL']

# feature to look at payment rate on min payment
cc['PAYMENT_RATE'] = cc['AMT_PAYMENT_CURRENT']/cc['AMT_INST_MIN_REGULARITY']

# feature to look at drawing limit rate
cc['DRAWING_LIMIT_RATE'] = cc['AMT_DRAWINGS_ATM_CURRENT'] / cc['AMT_CREDIT_LIMIT_ACTUAL']

# create feature FLAG_30DAYS_DUE where 1 = payment was late by 15 days
cc['FLAG_15DAYS_DUE'] = cc['SK_DPD'].apply(lambda x: 1 if x >= 15 else 0)

# create feature FLAG_30DAYS_DUE where 1 = payment was late by 30 days
cc['FLAG_30DAYS_DUE'] = cc['SK_DPD'].apply(lambda x: 1 if x >= 30 else 0)

# create feature FLAG_60DAYS_DUE where 1 = payment was late by 60 days
cc['FLAG_60DAYS_DUE'] = cc['SK_DPD'].apply(lambda x: 1 if x >= 60 else 0)

In [24]:
# for overall credit card features

credit_card_agg = {'MONTHS_BALANCE': ['min'],
                   'AMT_BALANCE': ['max', 'mean'],
                   'AMT_CREDIT_LIMIT_ACTUAL': ['max'],
                   'AMT_DRAWINGS_ATM_CURRENT': ['max', 'sum'],
                   'AMT_DRAWINGS_CURRENT': ['max', 'sum'],
                   'AMT_DRAWINGS_POS_CURRENT': ['max', 'sum'],
                   'AMT_INST_MIN_REGULARITY': ['max', 'mean'],
                   'AMT_PAYMENT_TOTAL_CURRENT': ['max', 'mean', 'sum', 'std'],
                   'AMT_TOTAL_RECEIVABLE': ['max', 'mean'],
                   'CNT_DRAWINGS_ATM_CURRENT': ['max', 'mean', 'sum'],
                   'CNT_DRAWINGS_CURRENT': ['max', 'mean', 'sum'],
                   'CNT_DRAWINGS_POS_CURRENT': ['max', 'mean', 'sum'],
                   'SK_DPD': ['max', 'mean', 'sum'],
                   'SK_DPD_DEF': ['max', 'sum'],
                   'USAGE_RATIO': ['max', 'mean'],
                   'PAYMENT_RATE': ['min', 'mean'],
                   'DRAWING_LIMIT_RATE': ['max', 'mean'],
                   'FLAG_15DAYS_DUE': ['sum'],
                   'FLAG_30DAYS_DUE': ['sum'],
                   'FLAG_60DAYS_DUE': ['sum'],
                  }

# for credit card features based on last 12, 24 and 36 months

credit_card_time_agg = {'AMT_BALANCE': ['max', 'mean'],
                        'SK_DPD': ['max', 'mean', 'sum'],
                        'USAGE_RATIO': ['max', 'mean'],
                        'FLAG_15DAYS_DUE': ['sum'],
                        'FLAG_30DAYS_DUE': ['sum'],
                        'FLAG_60DAYS_DUE': ['sum'],   
                       }

In [25]:
cc_agg = group(cc, 'CC_', credit_card_agg)

In [26]:
# looking at data in recent 1, 2 and 3 years
for months in [12, 24, 36]:
    cc_prev_id = cc[cc['MONTHS_BALANCE'] >= -months]['SK_ID_PREV'].unique()
    cc_time = cc[cc['SK_ID_PREV'].isin(cc_prev_id)]
    prefix = f'INS_{months}M_'
    cc_agg = group_and_merge(cc_time, cc_agg, prefix, credit_card_time_agg)

In [27]:
# check
cc_agg.head(3)

Unnamed: 0,SK_ID_CURR,CC_MONTHS_BALANCE_MIN,CC_AMT_BALANCE_MAX,CC_AMT_BALANCE_MEAN,CC_AMT_CREDIT_LIMIT_ACTUAL_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_SUM,CC_AMT_DRAWINGS_CURRENT_MAX,CC_AMT_DRAWINGS_CURRENT_SUM,CC_AMT_DRAWINGS_POS_CURRENT_MAX,CC_AMT_DRAWINGS_POS_CURRENT_SUM,CC_AMT_INST_MIN_REGULARITY_MAX,CC_AMT_INST_MIN_REGULARITY_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_MAX,CC_AMT_PAYMENT_TOTAL_CURRENT_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_SUM,CC_AMT_PAYMENT_TOTAL_CURRENT_STD,CC_AMT_TOTAL_RECEIVABLE_MAX,CC_AMT_TOTAL_RECEIVABLE_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_MAX,CC_CNT_DRAWINGS_ATM_CURRENT_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_SUM,CC_CNT_DRAWINGS_CURRENT_MAX,CC_CNT_DRAWINGS_CURRENT_MEAN,CC_CNT_DRAWINGS_CURRENT_SUM,CC_CNT_DRAWINGS_POS_CURRENT_MAX,CC_CNT_DRAWINGS_POS_CURRENT_MEAN,CC_CNT_DRAWINGS_POS_CURRENT_SUM,CC_SK_DPD_MAX,CC_SK_DPD_MEAN,CC_SK_DPD_SUM,CC_SK_DPD_DEF_MAX,CC_SK_DPD_DEF_SUM,CC_USAGE_RATIO_MAX,CC_USAGE_RATIO_MEAN,CC_PAYMENT_RATE_MIN,CC_PAYMENT_RATE_MEAN,CC_DRAWING_LIMIT_RATE_MAX,CC_DRAWING_LIMIT_RATE_MEAN,CC_FLAG_15DAYS_DUE_SUM,CC_FLAG_30DAYS_DUE_SUM,CC_FLAG_60DAYS_DUE_SUM,INS_12M_AMT_BALANCE_MAX,INS_12M_AMT_BALANCE_MEAN,INS_12M_SK_DPD_MAX,INS_12M_SK_DPD_MEAN,INS_12M_SK_DPD_SUM,INS_12M_USAGE_RATIO_MAX,INS_12M_USAGE_RATIO_MEAN,INS_12M_FLAG_15DAYS_DUE_SUM,INS_12M_FLAG_30DAYS_DUE_SUM,INS_12M_FLAG_60DAYS_DUE_SUM,INS_24M_AMT_BALANCE_MAX,INS_24M_AMT_BALANCE_MEAN,INS_24M_SK_DPD_MAX,INS_24M_SK_DPD_MEAN,INS_24M_SK_DPD_SUM,INS_24M_USAGE_RATIO_MAX,INS_24M_USAGE_RATIO_MEAN,INS_24M_FLAG_15DAYS_DUE_SUM,INS_24M_FLAG_30DAYS_DUE_SUM,INS_24M_FLAG_60DAYS_DUE_SUM,INS_36M_AMT_BALANCE_MAX,INS_36M_AMT_BALANCE_MEAN,INS_36M_SK_DPD_MAX,INS_36M_SK_DPD_MEAN,INS_36M_SK_DPD_SUM,INS_36M_USAGE_RATIO_MAX,INS_36M_USAGE_RATIO_MEAN,INS_36M_FLAG_15DAYS_DUE_SUM,INS_36M_FLAG_30DAYS_DUE_SUM,INS_36M_FLAG_60DAYS_DUE_SUM
0,100006,-6,0.000,0.000000,270000,,0.0,0.00,0.000,,0.000,0.000,0.000000,0.00,0.000000,0.000,0.000000,0.000,0.000000,,,0.0,0,0.000000,0,,,0.0,0,0.000000,0,0,0,0.000000,0.000000,,,,,0,0,0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0
1,100011,-75,189000.000,54482.111149,180000,180000.0,180000.0,180000.00,180000.000,0.000,0.000,9000.000,3956.221849,55485.00,4520.067568,334485.000,7473.872687,189000.000,54433.179122,4.0,0.054054,4.0,4,0.054054,4,0.0,0.000000,0.0,0,0.000000,0,0,0,1.050000,0.302678,1.000000,inf,1.0000,0.013514,0,0,0,189000.000,54482.111149,0.0,0.000000,0.0,1.050000,0.302678,0.0,0.0,0.0,189000.000,54482.111149,0.0,0.000000,0.0,1.050000,0.302678,0.0,0.0,0.0,189000.000,54482.111149,0.0,0.000000,0.0,1.050000,0.302678,0.0,0.0,0.0
2,100013,-96,161420.220,18159.919219,157500,157500.0,571500.0,157500.00,571500.000,0.000,0.000,7875.000,1454.539551,153675.00,6817.172344,654448.545,21730.655260,161420.220,18101.079844,7.0,0.255556,23.0,7,0.239583,23,0.0,0.000000,0.0,1,0.010417,1,1,1,1.024890,0.115301,0.000000,inf,1.0000,0.040317,0,0,0,161420.220,18159.919219,1.0,0.010417,1.0,1.024890,0.115301,0.0,0.0,0.0,161420.220,18159.919219,1.0,0.010417,1.0,1.024890,0.115301,0.0,0.0,0.0,161420.220,18159.919219,1.0,0.010417,1.0,1.024890,0.115301,0.0,0.0,0.0
3,100021,-18,0.000,0.000000,675000,,0.0,0.00,0.000,,0.000,0.000,0.000000,0.00,0.000000,0.000,0.000000,0.000,0.000000,,,0.0,0,0.000000,0,,,0.0,0,0.000000,0,0,0,0.000000,0.000000,,,,,0,0,0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0
4,100023,-11,0.000,0.000000,225000,,0.0,0.00,0.000,,0.000,0.000,0.000000,0.00,0.000000,0.000,0.000000,0.000,0.000000,,,0.0,0,0.000000,0,,,0.0,0,0.000000,0,0,0,0.000000,0.000000,,,,,0,0,0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
103553,456244,-41,453627.675,146087.134054,450000,279000.0,1003500.0,307953.45,1100537.910,30911.850,96883.650,23343.165,7238.000000,482329.62,36257.901081,1341542.340,100382.518298,453627.675,144904.040270,6.0,1.162162,43.0,8,1.513514,56,4.0,0.351351,13.0,0,0.000000,0,0,0,1.008061,0.444874,1.029728,inf,0.6200,0.082593,0,0,0,453627.675,146087.134054,0.0,0.000000,0.0,1.008061,0.444874,0.0,0.0,0.0,453627.675,146087.134054,0.0,0.000000,0.0,1.008061,0.444874,0.0,0.0,0.0,453627.675,146087.134054,0.0,0.000000,0.0,1.008061,0.444874,0.0,0.0,0.0
103554,456246,-9,43490.115,13136.731875,135000,0.0,0.0,48929.85,121594.050,48929.850,121594.050,2250.000,1439.150625,41419.71,15554.340000,124434.720,17012.766963,43490.115,12897.894375,0.0,0.000000,0.0,8,2.500000,20,8.0,2.500000,20.0,0,0.000000,0,0,0,0.322149,0.097309,0.000000,9.481342,0.0000,0.000000,0,0,0,43490.115,13136.731875,0.0,0.000000,0.0,0.322149,0.097309,0.0,0.0,0.0,43490.115,13136.731875,0.0,0.000000,0.0,0.322149,0.097309,0.0,0.0,0.0,43490.115,13136.731875,0.0,0.000000,0.0,0.322149,0.097309,0.0,0.0,0.0
103555,456247,-96,190202.130,23216.396211,180000,96750.0,202950.0,96750.00,204203.115,1253.115,1253.115,9000.000,1414.704789,99990.00,4115.878105,391008.420,16973.145046,190202.130,23128.243105,4.0,0.115789,11.0,4,0.147368,14,3.0,0.031579,3.0,1,0.031579,3,1,2,1.056679,0.161225,0.000000,inf,0.5375,0.014836,0,0,0,190202.130,23216.396211,1.0,0.031579,3.0,1.056679,0.161225,0.0,0.0,0.0,190202.130,23216.396211,1.0,0.031579,3.0,1.056679,0.161225,0.0,0.0,0.0,190202.130,23216.396211,1.0,0.031579,3.0,1.056679,0.161225,0.0,0.0,0.0
103556,456248,-24,0.000,0.000000,900000,,0.0,0.00,0.000,,0.000,0.000,0.000000,0.00,0.000000,0.000,0.000000,0.000,0.000000,,,0.0,0,0.000000,0,,,0.0,0,0.000000,0,0,0,0.000000,0.000000,,,,,0,0,0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0


## 3. Bureau & Bureau Balance
[top](#Contents)

In [28]:
missing_data(bureau_bal)

The dataframe has 3 columns.
There are 0 columns that have missing values.


Unnamed: 0,Total,% of Missing Values


In [29]:
missing_data(bureau)

The dataframe has 17 columns.
There are 7 columns that have missing values.


Unnamed: 0,Total,% of Missing Values
AMT_ANNUITY,1226791,71.5
AMT_CREDIT_MAX_OVERDUE,1124488,65.5
DAYS_ENDDATE_FACT,633653,36.9
AMT_CREDIT_SUM_LIMIT,591780,34.5
AMT_CREDIT_SUM_DEBT,257669,15.0
DAYS_CREDIT_ENDDATE,105553,6.1
AMT_CREDIT_SUM,13,0.0


In [30]:
bureau_bal

Unnamed: 0,SK_ID_BUREAU,MONTHS_BALANCE,STATUS
0,5715448,0,C
1,5715448,-1,C
2,5715448,-2,C
3,5715448,-3,C
4,5715448,-4,C
...,...,...,...
27299920,5041336,-47,X
27299921,5041336,-48,X
27299922,5041336,-49,X
27299923,5041336,-50,X


In [31]:
# set marker column to identify the row with status C
bureau_bal['marker'] = bureau_bal['STATUS'].apply(lambda x: -99 if x=='C' else random.uniform(0,100))

# drop duplicates based on subsets
bureau_bal.drop_duplicates(subset=['SK_ID_BUREAU', 'STATUS', 'marker'], keep='last', inplace=True)

# drop marker
bureau_bal.drop('marker', axis=1, inplace=True)

In [32]:
# get dummies for status column
bureau_bal = pd.get_dummies(bureau_bal, columns=['STATUS'])

In [33]:
# create feature to flag late payment for the month
bureau_bal['FLAG_DPD'] = bureau_bal.iloc[:, 3:8].sum(axis=1)

In [34]:
# check
bureau_bal.head(3)

Unnamed: 0,SK_ID_BUREAU,MONTHS_BALANCE,STATUS_0,STATUS_1,STATUS_2,STATUS_3,STATUS_4,STATUS_5,STATUS_C,STATUS_X,FLAG_DPD
8,5715448,-8,0,0,0,0,0,0,1,0,0
9,5715448,-9,1,0,0,0,0,0,0,0,0
10,5715448,-10,1,0,0,0,0,0,0,0,0
11,5715448,-11,0,0,0,0,0,0,0,1,0
12,5715448,-12,0,0,0,0,0,0,0,1,0
...,...,...,...,...,...,...,...,...,...,...,...
27299920,5041336,-47,0,0,0,0,0,0,0,1,0
27299921,5041336,-48,0,0,0,0,0,0,0,1,0
27299922,5041336,-49,0,0,0,0,0,0,0,1,0
27299923,5041336,-50,0,0,0,0,0,0,0,1,0


In [35]:
# for bureau_bal features
bureau_bal_agg = {'MONTHS_BALANCE': ['min', 'max', 'mean', 'size'],
                  'STATUS_0': ['mean'],
                  'STATUS_C': ['sum'],
                  'STATUS_X': ['mean'],
                  'FLAG_DPD': ['mean']
                  }

In [36]:
# merge to bureau df
bb_bal_agg = group_and_merge(bureau_bal, bureau, 'BB_BAL_', bureau_bal_agg, aggregate_by='SK_ID_BUREAU')

In [37]:
bb_bal_agg = pd.get_dummies(bb_bal_agg,  columns=['CREDIT_ACTIVE', 'CREDIT_TYPE'])

In [38]:
# check
bb_bal_agg.head(3)

Unnamed: 0,SK_ID_CURR,SK_ID_BUREAU,CREDIT_CURRENCY,DAYS_CREDIT,CREDIT_DAY_OVERDUE,DAYS_CREDIT_ENDDATE,DAYS_ENDDATE_FACT,AMT_CREDIT_MAX_OVERDUE,CNT_CREDIT_PROLONG,AMT_CREDIT_SUM,AMT_CREDIT_SUM_DEBT,AMT_CREDIT_SUM_LIMIT,AMT_CREDIT_SUM_OVERDUE,DAYS_CREDIT_UPDATE,AMT_ANNUITY,BB_BAL_MONTHS_BALANCE_MIN,BB_BAL_MONTHS_BALANCE_MAX,BB_BAL_MONTHS_BALANCE_MEAN,BB_BAL_MONTHS_BALANCE_SIZE,BB_BAL_STATUS_0_MEAN,BB_BAL_STATUS_C_SUM,BB_BAL_STATUS_X_MEAN,BB_BAL_FLAG_DPD_MEAN,CREDIT_ACTIVE_Active,CREDIT_ACTIVE_Bad debt,CREDIT_ACTIVE_Closed,CREDIT_ACTIVE_Sold,CREDIT_TYPE_Another type of loan,CREDIT_TYPE_Car loan,CREDIT_TYPE_Cash loan (non-earmarked),CREDIT_TYPE_Consumer credit,CREDIT_TYPE_Credit card,CREDIT_TYPE_Interbank credit,CREDIT_TYPE_Loan for business development,CREDIT_TYPE_Loan for purchase of shares (margin lending),CREDIT_TYPE_Loan for the purchase of equipment,CREDIT_TYPE_Loan for working capital replenishment,CREDIT_TYPE_Microloan,CREDIT_TYPE_Mobile operator loan,CREDIT_TYPE_Mortgage,CREDIT_TYPE_Real estate loan,CREDIT_TYPE_Unknown type of loan
0,215354,5714462,currency 1,-497,0,-153.0,-153.0,,0,91323.00,0.0,,0.0,-131,,,,,,,,,,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0
1,215354,5714463,currency 1,-208,0,1075.0,,,0,225000.00,171342.0,,0.0,-20,,,,,,,,,,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0
2,215354,5714464,currency 1,-203,0,528.0,,,0,464323.50,,,0.0,-16,,,,,,,,,,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0
3,215354,5714465,currency 1,-203,0,,,,0,90000.00,,,0.0,-16,,,,,,,,,,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0
4,215354,5714466,currency 1,-629,0,1197.0,,77674.5,0,2700000.00,,,0.0,-21,,,,,,,,,,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1716423,259355,5057750,currency 1,-44,0,-30.0,,0.0,0,11250.00,11250.0,0.0,0.0,-19,,,,,,,,,,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0
1716424,100044,5057754,currency 1,-2648,0,-2433.0,-2493.0,5476.5,0,38130.84,0.0,0.0,0.0,-2493,,,,,,,,,,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0
1716425,100044,5057762,currency 1,-1809,0,-1628.0,-970.0,,0,15570.00,,,0.0,-967,,,,,,,,,,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0
1716426,246829,5057770,currency 1,-1878,0,-1513.0,-1513.0,,0,36000.00,0.0,0.0,0.0,-1508,,,,,,,,,,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0


In [39]:
# for DAYS_ENDDATE_FACT, this is the date (wrt credit application) the the loan ended
# null values are mainly for current active loans
# fill this with the DAYS_CREDIT_ENDDATE num if DAYS_ENDDATE_FACT is empty
bb_bal_agg['DAYS_ENDDATE_FACT'].fillna(bb_bal_agg.DAYS_CREDIT_ENDDATE, inplace=True)

# there are also rows where DAYS_CREDIT_ENDDATE is empty but DAYS_ENDDATE_FACT is not
# assumed these were closed on time at the FACT date
bb_bal_agg['DAYS_CREDIT_ENDDATE'].fillna(bb_bal_agg.DAYS_ENDDATE_FACT, inplace=True)

In [40]:
# create feature credit duration to look at length of credit
bb_bal_agg['CREDIT_DURATION'] = -bb_bal_agg['DAYS_CREDIT'] + bb_bal_agg['DAYS_CREDIT_ENDDATE']

# create feature to look at contractual end date and actual end date (indication of early payment)
bb_bal_agg['END_DATE_DIFF'] = bb_bal_agg['DAYS_CREDIT_ENDDATE'] - bb_bal_agg['DAYS_ENDDATE_FACT']

# create feature to look at debt ratio and difference
bb_bal_agg['DEBT_PERCENTAGE'] = bb_bal_agg['AMT_CREDIT_SUM'] / bb_bal_agg['AMT_CREDIT_SUM_DEBT']
bb_bal_agg['DEBT_CREDIT_DIFF'] = bb_bal_agg['AMT_CREDIT_SUM'] - bb_bal_agg['AMT_CREDIT_SUM_DEBT']
bb_bal_agg['CREDIT_TO_ANNUITY_RATIO'] = bb_bal_agg['AMT_CREDIT_SUM'] / bb_bal_agg['AMT_ANNUITY']

In [41]:
bb_bal_agg.head(2)

Unnamed: 0,SK_ID_CURR,SK_ID_BUREAU,CREDIT_CURRENCY,DAYS_CREDIT,CREDIT_DAY_OVERDUE,DAYS_CREDIT_ENDDATE,DAYS_ENDDATE_FACT,AMT_CREDIT_MAX_OVERDUE,CNT_CREDIT_PROLONG,AMT_CREDIT_SUM,AMT_CREDIT_SUM_DEBT,AMT_CREDIT_SUM_LIMIT,AMT_CREDIT_SUM_OVERDUE,DAYS_CREDIT_UPDATE,AMT_ANNUITY,BB_BAL_MONTHS_BALANCE_MIN,BB_BAL_MONTHS_BALANCE_MAX,BB_BAL_MONTHS_BALANCE_MEAN,BB_BAL_MONTHS_BALANCE_SIZE,BB_BAL_STATUS_0_MEAN,BB_BAL_STATUS_C_SUM,BB_BAL_STATUS_X_MEAN,BB_BAL_FLAG_DPD_MEAN,CREDIT_ACTIVE_Active,CREDIT_ACTIVE_Bad debt,CREDIT_ACTIVE_Closed,CREDIT_ACTIVE_Sold,CREDIT_TYPE_Another type of loan,CREDIT_TYPE_Car loan,CREDIT_TYPE_Cash loan (non-earmarked),CREDIT_TYPE_Consumer credit,CREDIT_TYPE_Credit card,CREDIT_TYPE_Interbank credit,CREDIT_TYPE_Loan for business development,CREDIT_TYPE_Loan for purchase of shares (margin lending),CREDIT_TYPE_Loan for the purchase of equipment,CREDIT_TYPE_Loan for working capital replenishment,CREDIT_TYPE_Microloan,CREDIT_TYPE_Mobile operator loan,CREDIT_TYPE_Mortgage,CREDIT_TYPE_Real estate loan,CREDIT_TYPE_Unknown type of loan,CREDIT_DURATION,END_DATE_DIFF,DEBT_PERCENTAGE,DEBT_CREDIT_DIFF,CREDIT_TO_ANNUITY_RATIO
0,215354,5714462,currency 1,-497,0,-153.0,-153.0,,0,91323.0,0.0,,0.0,-131,,,,,,,,,,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,344.0,0.0,inf,91323.0,
1,215354,5714463,currency 1,-208,0,1075.0,1075.0,,0,225000.0,171342.0,,0.0,-20,,,,,,,,,,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1283.0,0.0,1.313163,53658.0,


In [42]:
# general bureau aggregation
bureau_aggregation = {'SK_ID_BUREAU': ['nunique'],
                      'DAYS_CREDIT': ['min', 'max', 'mean'],
                      'DAYS_CREDIT_ENDDATE': ['min', 'max'],
                      'AMT_CREDIT_MAX_OVERDUE': ['max', 'mean'],
                      'AMT_CREDIT_SUM': ['max', 'mean', 'sum'],
                      'AMT_CREDIT_SUM_DEBT': ['max', 'mean', 'sum'],
                      'AMT_CREDIT_SUM_OVERDUE': ['max', 'mean', 'sum'],
                      'AMT_ANNUITY': ['mean'],
                      'DEBT_CREDIT_DIFF': ['mean', 'sum'],
                      'BB_BAL_MONTHS_BALANCE_MEAN': ['mean', 'std'],
                      'BB_BAL_MONTHS_BALANCE_SIZE': ['mean', 'sum'],
                      # Categorical
                      'BB_BAL_STATUS_0_MEAN': ['mean'],
                      'BB_BAL_FLAG_DPD_MEAN': ['mean'],
                      'BB_BAL_STATUS_C_SUM': ['mean'],
                      'BB_BAL_STATUS_X_MEAN': ['mean'],
                      'CREDIT_ACTIVE_Active': ['mean'],
                      'CREDIT_ACTIVE_Closed': ['mean'],
                      'CREDIT_ACTIVE_Sold': ['mean'],
                      'CREDIT_ACTIVE_Bad debt': ['mean'],
                      'CREDIT_TYPE_Consumer credit': ['mean'],
                      'CREDIT_TYPE_Credit card': ['mean'],
                      'CREDIT_TYPE_Car loan': ['mean'],
                      'CREDIT_TYPE_Mortgage': ['mean'],
                      'CREDIT_TYPE_Microloan': ['mean'],
                     }

# recent time aggregation
bureau_time_aggregation = {'AMT_CREDIT_MAX_OVERDUE': ['max', 'mean'],
                           'AMT_CREDIT_SUM_OVERDUE': ['mean'],
                           'AMT_CREDIT_SUM': ['max', 'sum'],
                           'AMT_CREDIT_SUM_DEBT': ['mean', 'sum'],
                           'DEBT_PERCENTAGE': ['mean'],
                           'DEBT_CREDIT_DIFF': ['mean'],
                           'BB_BAL_STATUS_0_MEAN': ['mean'],
                           'BB_BAL_FLAG_DPD_MEAN': ['mean'],
                          }

# active loans aggregation
bureau_active_aggregations = {'DAYS_CREDIT': ['max', 'mean'],
                              'DAYS_CREDIT_ENDDATE': ['min', 'max'],
                              'AMT_CREDIT_MAX_OVERDUE': ['max', 'mean'],
                              'AMT_CREDIT_SUM': ['max', 'sum'],
                              'AMT_CREDIT_SUM_DEBT': ['mean', 'sum'],
                              'AMT_CREDIT_SUM_OVERDUE': ['max', 'mean'],
                              'DAYS_CREDIT_UPDATE': ['min', 'mean'],
                              'DEBT_PERCENTAGE': ['mean'],
                              'DEBT_CREDIT_DIFF': ['mean'],
                              'CREDIT_TO_ANNUITY_RATIO': ['mean'],
                              'BB_BAL_MONTHS_BALANCE_MEAN': ['mean', 'std'],
                              'BB_BAL_MONTHS_BALANCE_SIZE': ['mean', 'sum'],
                             }

In [43]:
# aggregate the bureau aggregation
agg_bureau = group(bb_bal_agg, 'BUREAU_', bureau_aggregation)

In [44]:
# active loan aggregation
active = bb_bal_agg.loc[bb_bal_agg['CREDIT_ACTIVE_Active']==1]
agg_bureau = group_and_merge(active, agg_bureau, 'BUREAU_ACTIVE_', bureau_active_aggregations)

In [45]:
# time aggregations
for month in [12, 24]:
    prefix = f'BUREAU_LAST{month}M_'
    time_frame_df = bb_bal_agg[bb_bal_agg['DAYS_CREDIT'] >= -30*month]
    agg_bureau = group_and_merge(time_frame_df, agg_bureau, prefix, bureau_time_aggregation)

In [46]:
# check
agg_bureau.head(3)

Unnamed: 0,SK_ID_CURR,BUREAU_SK_ID_BUREAU_NUNIQUE,BUREAU_DAYS_CREDIT_MIN,BUREAU_DAYS_CREDIT_MAX,BUREAU_DAYS_CREDIT_MEAN,BUREAU_DAYS_CREDIT_ENDDATE_MIN,BUREAU_DAYS_CREDIT_ENDDATE_MAX,BUREAU_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_MAX,BUREAU_AMT_CREDIT_SUM_MEAN,BUREAU_AMT_CREDIT_SUM_SUM,BUREAU_AMT_CREDIT_SUM_DEBT_MAX,BUREAU_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_AMT_CREDIT_SUM_OVERDUE_MAX,BUREAU_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_OVERDUE_SUM,BUREAU_AMT_ANNUITY_MEAN,BUREAU_DEBT_CREDIT_DIFF_MEAN,BUREAU_DEBT_CREDIT_DIFF_SUM,BUREAU_BB_BAL_MONTHS_BALANCE_MEAN_MEAN,BUREAU_BB_BAL_MONTHS_BALANCE_MEAN_STD,BUREAU_BB_BAL_MONTHS_BALANCE_SIZE_MEAN,BUREAU_BB_BAL_MONTHS_BALANCE_SIZE_SUM,BUREAU_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_BB_BAL_FLAG_DPD_MEAN_MEAN,BUREAU_BB_BAL_STATUS_C_SUM_MEAN,BUREAU_BB_BAL_STATUS_X_MEAN_MEAN,BUREAU_CREDIT_ACTIVE_Active_MEAN,BUREAU_CREDIT_ACTIVE_Closed_MEAN,BUREAU_CREDIT_ACTIVE_Sold_MEAN,BUREAU_CREDIT_ACTIVE_Bad debt_MEAN,BUREAU_CREDIT_TYPE_Consumer credit_MEAN,BUREAU_CREDIT_TYPE_Credit card_MEAN,BUREAU_CREDIT_TYPE_Car loan_MEAN,BUREAU_CREDIT_TYPE_Mortgage_MEAN,BUREAU_CREDIT_TYPE_Microloan_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_MAX,BUREAU_ACTIVE_DAYS_CREDIT_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_ENDDATE_MIN,BUREAU_ACTIVE_DAYS_CREDIT_ENDDATE_MAX,BUREAU_ACTIVE_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_ACTIVE_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_ACTIVE_AMT_CREDIT_SUM_MAX,BUREAU_ACTIVE_AMT_CREDIT_SUM_SUM,BUREAU_ACTIVE_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_ACTIVE_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_ACTIVE_AMT_CREDIT_SUM_OVERDUE_MAX,BUREAU_ACTIVE_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_UPDATE_MIN,BUREAU_ACTIVE_DAYS_CREDIT_UPDATE_MEAN,BUREAU_ACTIVE_DEBT_PERCENTAGE_MEAN,BUREAU_ACTIVE_DEBT_CREDIT_DIFF_MEAN,BUREAU_ACTIVE_CREDIT_TO_ANNUITY_RATIO_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_MEAN_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_MEAN_STD,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_SIZE_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_SIZE_SUM,BUREAU_LAST12M_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_LAST12M_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_MAX,BUREAU_LAST12M_AMT_CREDIT_SUM_SUM,BUREAU_LAST12M_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_LAST12M_DEBT_PERCENTAGE_MEAN,BUREAU_LAST12M_DEBT_CREDIT_DIFF_MEAN,BUREAU_LAST12M_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_LAST12M_BB_BAL_FLAG_DPD_MEAN_MEAN,BUREAU_LAST24M_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_LAST24M_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_MAX,BUREAU_LAST24M_AMT_CREDIT_SUM_SUM,BUREAU_LAST24M_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_LAST24M_DEBT_PERCENTAGE_MEAN,BUREAU_LAST24M_DEBT_CREDIT_DIFF_MEAN,BUREAU_LAST24M_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_LAST24M_BB_BAL_FLAG_DPD_MEAN_MEAN
0,100001,7,-1572,-49,-735.000000,-1329.0,1778.0,,,378000.00,2.076236e+05,1453365.000,373239.00,85240.928571,596686.500,0.0,0.0,0.0,3545.357143,122382.642857,856678.500,-19.357143,16.020077,9.428571,66.0,0.454583,0.007519,0.571429,0.425704,0.428571,0.571429,0.0,0.0,1.000000,0.000000,0.0,0.0,0.0,-49.0,-309.333333,411.0,1778.0,,,378000.00,884025.000,1.988955e+05,596686.500,0.0,0.0,-16.0,-10.666667,1.841065,95779.5000,41.943113,-4.833333,4.252450,10.666667,32.0,,,0.0,378000.000,546345.000,241760.25,483520.5,1.269629,31412.250,0.750000,0.0,,,0.0,378000.0,884025.000,1.988955e+05,596686.50,1.841065,95779.5000,0.710526,0.017544
1,100002,8,-1437,-103,-874.000000,-1072.0,780.0,5043.645,1681.029,450000.00,1.081319e+05,865055.565,245781.00,49156.200000,245781.000,0.0,0.0,0.0,0.000000,98388.513000,491942.565,-22.937500,11.530821,11.625000,93.0,0.492560,0.268452,0.750000,0.168452,0.250000,0.750000,0.0,0.0,0.500000,0.500000,0.0,0.0,0.0,-103.0,-572.500000,780.0,780.0,40.500,40.5000,450000.00,481988.565,1.228905e+05,245781.000,0.0,0.0,-24.0,-15.500000,inf,118103.7825,inf,-14.250000,18.031223,9.500000,19.0,40.5,40.5,0.0,31988.565,31988.565,0.00,0.0,inf,31988.565,0.500000,0.0,5043.645,2542.0725,0.0,120735.0,152723.565,0.000000e+00,0.00,inf,50907.8550,0.583333,0.166667
2,100003,4,-2586,-606,-1400.750000,-2434.0,1216.0,0.000,0.000,810000.00,2.543501e+05,1017400.500,0.00,0.000000,0.000,0.0,0.0,0.0,,254350.125000,1017400.500,,,,0.0,,,,,0.250000,0.750000,0.0,0.0,0.500000,0.500000,0.0,0.0,0.0,-606.0,-606.000000,1216.0,1216.0,0.000,0.0000,810000.00,810000.000,0.000000e+00,0.000,0.0,0.0,-43.0,-43.000000,inf,810000.0000,,,,,0.0,,,,,,,,,,,,0.000,0.0000,0.0,810000.0,810000.000,0.000000e+00,0.00,inf,810000.0000,,
3,100004,2,-1326,-408,-867.000000,-595.0,-382.0,0.000,0.000,94537.80,9.451890e+04,189037.800,0.00,0.000000,0.000,0.0,0.0,0.0,,94518.900000,189037.800,,,,0.0,,,,,0.000000,1.000000,0.0,0.0,1.000000,0.000000,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.000,0.0000,0.0,94537.8,94537.800,0.000000e+00,0.00,inf,94537.8000,,
4,100005,3,-373,-62,-190.666667,-128.0,1324.0,0.000,0.000,568800.00,2.190420e+05,657126.000,543087.00,189469.500000,568408.500,0.0,0.0,0.0,1420.500000,29572.500000,88717.500,-3.666667,3.785939,5.666667,17.0,0.814815,0.000000,0.333333,0.148148,0.666667,0.333333,0.0,0.0,0.666667,0.333333,0.0,0.0,0.0,-62.0,-99.500000,122.0,1324.0,0.000,0.0000,568800.00,598626.000,2.842042e+05,568408.500,0.0,0.0,-31.0,-21.000000,1.112619,15108.7500,inf,-1.500000,0.707107,4.000000,8.0,0.0,0.0,0.0,568800.000,598626.000,284204.25,568408.5,1.112619,15108.750,0.833333,0.0,0.000,0.0000,0.0,568800.0,657126.000,1.894695e+05,568408.50,inf,29572.5000,0.814815,0.000000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
305806,456249,13,-2713,-483,-1667.076923,-2499.0,1363.0,18945.000,6147.000,765000.00,2.841430e+05,3693858.660,163071.00,16307.100000,163071.000,0.0,0.0,0.0,,209078.766000,2090787.660,,,,0.0,,,,,0.153846,0.846154,0.0,0.0,0.692308,0.230769,0.0,0.0,0.0,-483.0,-1547.500000,-1497.0,1363.0,0.000,0.0000,225000.00,405000.000,8.153550e+04,163071.000,0.0,0.0,-1213.0,-612.500000,inf,120964.5000,,,,,0.0,,,,,,,,,,,,,,0.0,180000.0,180000.000,1.630710e+05,163071.00,1.103814,16929.0000,,
305807,456250,3,-1002,-760,-862.000000,-272.0,2340.0,0.000,0.000,2153110.05,1.028820e+06,3086459.550,1840308.48,744013.365000,2232040.095,0.0,0.0,0.0,154567.965000,284806.485000,854419.455,-18.000000,8.674676,21.000000,63.0,0.345747,0.000000,0.333333,0.617216,0.666667,0.333333,0.0,0.0,0.666667,0.333333,0.0,0.0,0.0,-760.0,-792.000000,1797.0,2340.0,0.000,0.0000,2153110.05,2603110.050,1.116020e+06,2232040.095,0.0,0.0,-31.0,-27.000000,1.159359,185534.9775,28.889064,-13.000000,0.707107,27.000000,54.0,,,,,,,,,,,,,,,,,,,,,,
305808,456253,4,-919,-713,-867.500000,-189.0,1113.0,,,2250000.00,9.900000e+05,3960000.000,1624797.00,448958.250000,1795833.000,0.0,0.0,0.0,58369.500000,541041.750000,2164167.000,-20.875000,6.250000,15.750000,63.0,0.806891,0.000000,0.750000,0.135417,0.500000,0.500000,0.0,0.0,0.750000,0.250000,0.0,0.0,0.0,-713.0,-816.000000,387.0,1113.0,,,2250000.00,2610000.000,8.979165e+05,1795833.000,0.0,0.0,-179.0,-92.000000,1.744804,407083.5000,6.167605,-17.750000,8.838835,18.500000,37.0,,,,,,,,,,,,,,0.0,2250000.0,2250000.000,1.624797e+06,1624797.00,1.384788,625203.0000,0.458333,0.000000
305809,456254,1,-1104,-1104,-1104.000000,-859.0,-859.0,,,45000.00,4.500000e+04,45000.000,0.00,0.000000,0.000,0.0,0.0,0.0,0.000000,45000.000000,45000.000,-32.000000,,9.000000,9.0,0.888889,0.000000,1.000000,0.000000,0.000000,1.000000,0.0,0.0,1.000000,0.000000,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


## 4. POS CASH
[top](#Contents)

In [47]:
missing_data(pos)

The dataframe has 8 columns.
There are 2 columns that have missing values.


Unnamed: 0,Total,% of Missing Values
CNT_INSTALMENT,1898,0.2
CNT_INSTALMENT_FUTURE,1898,0.2


In [48]:
pos.head(3)

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,MONTHS_BALANCE,CNT_INSTALMENT,CNT_INSTALMENT_FUTURE,NAME_CONTRACT_STATUS,SK_DPD,SK_DPD_DEF
0,1803195,182943,-31,48.0,45.0,Active,0,0
1,1715348,367990,-33,36.0,35.0,Active,0,0
2,1784872,397406,-32,12.0,9.0,Active,0,0
3,1903291,269225,-35,48.0,42.0,Active,0,0
4,2341044,334279,-35,36.0,35.0,Active,0,0


In [49]:
pos.loc[pos['SK_ID_PREV']==2116637]

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,MONTHS_BALANCE,CNT_INSTALMENT,CNT_INSTALMENT_FUTURE,NAME_CONTRACT_STATUS,SK_DPD,SK_DPD_DEF
431,2116637,337030,-41,10.0,0.0,Completed,0,0
267833,2116637,337030,-43,24.0,2.0,Active,0,0


In [50]:
pos = pd.get_dummies(pos, columns=['NAME_CONTRACT_STATUS'])

In [51]:
# flag months with late payments
pos['FLAG_LATE_PAYMENT'] = pos['SK_DPD'].apply(lambda x: 1 if x > 0 else 0)

In [52]:
# check
pos.head(3)

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,MONTHS_BALANCE,CNT_INSTALMENT,CNT_INSTALMENT_FUTURE,SK_DPD,SK_DPD_DEF,NAME_CONTRACT_STATUS_Active,NAME_CONTRACT_STATUS_Approved,NAME_CONTRACT_STATUS_Canceled,NAME_CONTRACT_STATUS_Completed,NAME_CONTRACT_STATUS_Demand,NAME_CONTRACT_STATUS_Returned to the store,NAME_CONTRACT_STATUS_Signed,FLAG_LATE_PAYMENT
0,1803195,182943,-31,48.0,45.0,0,0,1,0,0,0,0,0,0,0
1,1715348,367990,-33,36.0,35.0,0,0,1,0,0,0,0,0,0,0
2,1784872,397406,-32,12.0,9.0,0,0,1,0,0,0,0,0,0,0
3,1903291,269225,-35,48.0,42.0,0,0,1,0,0,0,0,0,0,0
4,2341044,334279,-35,36.0,35.0,0,0,1,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1048570,2674109,363927,-2,48.0,39.0,0,0,1,0,0,0,0,0,0,0
1048571,1359930,438122,-4,20.0,0.0,0,0,0,0,0,1,0,0,0,0
1048572,2820160,147643,-9,24.0,15.0,0,0,1,0,0,0,0,0,0,0
1048573,1945170,307924,-11,12.0,7.0,0,0,1,0,0,0,0,0,0,0


In [53]:
pos_cash_aggregation = {'SK_ID_PREV': ['nunique'],
                        'MONTHS_BALANCE': ['min', 'max', 'size'],
                        'SK_DPD': ['max', 'mean', 'sum', 'std'],
                        'SK_DPD_DEF': ['max', 'mean', 'sum'],
                        'FLAG_LATE_PAYMENT': ['mean'],
                        'NAME_CONTRACT_STATUS_Active': ['mean'],
                        'NAME_CONTRACT_STATUS_Approved': ['mean'],
                        'NAME_CONTRACT_STATUS_Canceled': ['mean'],
                        'NAME_CONTRACT_STATUS_Completed': ['mean'],
                        'NAME_CONTRACT_STATUS_Demand': ['mean'],
                        'NAME_CONTRACT_STATUS_Returned to the store': ['mean'],
                        'NAME_CONTRACT_STATUS_Signed': ['mean'],
                       }


In [54]:
# Aggregate by SK_ID_CURR
pos_agg = group(pos, 'POS_', pos_cash_aggregation)

In [55]:
# check
pos_agg.head(3)

Unnamed: 0,SK_ID_CURR,POS_SK_ID_PREV_NUNIQUE,POS_MONTHS_BALANCE_MIN,POS_MONTHS_BALANCE_MAX,POS_MONTHS_BALANCE_SIZE,POS_SK_DPD_MAX,POS_SK_DPD_MEAN,POS_SK_DPD_SUM,POS_SK_DPD_STD,POS_SK_DPD_DEF_MAX,POS_SK_DPD_DEF_MEAN,POS_SK_DPD_DEF_SUM,POS_FLAG_LATE_PAYMENT_MEAN,POS_NAME_CONTRACT_STATUS_Active_MEAN,POS_NAME_CONTRACT_STATUS_Approved_MEAN,POS_NAME_CONTRACT_STATUS_Canceled_MEAN,POS_NAME_CONTRACT_STATUS_Completed_MEAN,POS_NAME_CONTRACT_STATUS_Demand_MEAN,POS_NAME_CONTRACT_STATUS_Returned to the store_MEAN,POS_NAME_CONTRACT_STATUS_Signed_MEAN
0,100002,1,-13,-13,1,0,0.0,0,,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
1,100003,2,-66,-23,2,0,0.0,0,0.0,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
2,100005,1,-21,-21,1,0,0.0,0,,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
3,100007,4,-73,-3,6,0,0.0,0,0.0,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
4,100008,1,-19,-13,3,0,0.0,0,0.0,0,0.0,0,0.0,0.666667,0.0,0.0,0.333333,0.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
262087,456248,2,-27,-4,8,0,0.0,0,0.0,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
262088,456249,1,-41,-40,2,0,0.0,0,0.0,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
262089,456250,2,-19,-2,5,0,0.0,0,0.0,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0
262090,456253,1,-59,-59,1,0,0.0,0,,0,0.0,0,0.0,1.000000,0.0,0.0,0.000000,0.0,0.0,0.0


In [56]:
sort_pos = pos.sort_values(by=['SK_ID_PREV', 'MONTHS_BALANCE'])
gp = sort_pos.groupby('SK_ID_PREV')

In [57]:
# create empty dataframe which we will populate
df = pd.DataFrame()
df['SK_ID_CURR'] = gp['SK_ID_CURR'].first()
df['MONTHS_BALANCE_MAX'] = gp['MONTHS_BALANCE'].max()

# Percentage of previous loans completed 
# and completed before initial term
df['POS_LOAN_COMPLETED_MEAN'] = gp['NAME_CONTRACT_STATUS_Completed'].mean()
df['POS_COMPLETED_BEFORE_MEAN'] = gp['CNT_INSTALMENT'].first() - gp['CNT_INSTALMENT'].last()
df['POS_COMPLETED_BEFORE_MEAN'] = df.apply(lambda x: 1 if x['POS_COMPLETED_BEFORE_MEAN'] > 0
                                                and x['POS_LOAN_COMPLETED_MEAN'] > 0 else 0, axis=1)

# Number of remaining installments (future installments) and percentage from total
df['POS_REMAINING_INSTALMENTS'] = gp['CNT_INSTALMENT_FUTURE'].last()
df['POS_REMAINING_INSTALMENTS_RATIO'] = gp['CNT_INSTALMENT_FUTURE'].last()/gp['CNT_INSTALMENT'].last()
# Group by SK_ID_CURR and merge
df_gp = df.groupby('SK_ID_CURR').sum().reset_index()
df_gp.drop(['MONTHS_BALANCE_MAX'], axis=1, inplace= True)

pos_agg = pd.merge(pos_agg, df_gp, on= 'SK_ID_CURR', how= 'left')

In [58]:
pos_agg.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 262092 entries, 0 to 262091
Data columns (total 24 columns):
 #   Column                                               Non-Null Count   Dtype  
---  ------                                               --------------   -----  
 0   SK_ID_CURR                                           262092 non-null  int64  
 1   POS_SK_ID_PREV_NUNIQUE                               262092 non-null  int64  
 2   POS_MONTHS_BALANCE_MIN                               262092 non-null  int64  
 3   POS_MONTHS_BALANCE_MAX                               262092 non-null  int64  
 4   POS_MONTHS_BALANCE_SIZE                              262092 non-null  int64  
 5   POS_SK_DPD_MAX                                       262092 non-null  int64  
 6   POS_SK_DPD_MEAN                                      262092 non-null  float64
 7   POS_SK_DPD_SUM                                       262092 non-null  int64  
 8   POS_SK_DPD_STD                                       1

## 5. Previous Applications
[top](#Contents)

In [59]:
missing_data(pre_app)

The dataframe has 37 columns.
There are 16 columns that have missing values.


Unnamed: 0,Total,% of Missing Values
RATE_INTEREST_PRIMARY,1664263,99.6
RATE_INTEREST_PRIVILEGED,1664263,99.6
AMT_DOWN_PAYMENT,895844,53.6
RATE_DOWN_PAYMENT,895844,53.6
NAME_TYPE_SUITE,820405,49.1
DAYS_FIRST_DRAWING,673065,40.3
DAYS_FIRST_DUE,673065,40.3
DAYS_LAST_DUE_1ST_VERSION,673065,40.3
DAYS_LAST_DUE,673065,40.3
DAYS_TERMINATION,673065,40.3


In [60]:
# as there are duplicates based on repeat application, we filter these out
pre_app = pre_app.loc[pre_app['FLAG_LAST_APPL_PER_CONTRACT']=='Y']
pre_app = pre_app.loc[pre_app['NFLAG_LAST_APPL_IN_DAY']==1]

In [61]:
pre_app.head(3)

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,NAME_CONTRACT_TYPE,AMT_ANNUITY,AMT_APPLICATION,AMT_CREDIT,AMT_DOWN_PAYMENT,AMT_GOODS_PRICE,WEEKDAY_APPR_PROCESS_START,HOUR_APPR_PROCESS_START,FLAG_LAST_APPL_PER_CONTRACT,NFLAG_LAST_APPL_IN_DAY,RATE_DOWN_PAYMENT,RATE_INTEREST_PRIMARY,RATE_INTEREST_PRIVILEGED,NAME_CASH_LOAN_PURPOSE,NAME_CONTRACT_STATUS,DAYS_DECISION,NAME_PAYMENT_TYPE,CODE_REJECT_REASON,NAME_TYPE_SUITE,NAME_CLIENT_TYPE,NAME_GOODS_CATEGORY,NAME_PORTFOLIO,NAME_PRODUCT_TYPE,CHANNEL_TYPE,SELLERPLACE_AREA,NAME_SELLER_INDUSTRY,CNT_PAYMENT,NAME_YIELD_GROUP,PRODUCT_COMBINATION,DAYS_FIRST_DRAWING,DAYS_FIRST_DUE,DAYS_LAST_DUE_1ST_VERSION,DAYS_LAST_DUE,DAYS_TERMINATION,NFLAG_INSURED_ON_APPROVAL
0,2030495,271877,Consumer loans,1730.43,17145.0,17145.0,0.0,17145.0,SATURDAY,15,Y,1,0.0,0.182832,0.867336,XAP,Approved,-73,Cash through the bank,XAP,,Repeater,Mobile,POS,XNA,Country-wide,35,Connectivity,12.0,middle,POS mobile with interest,365243.0,-42.0,300.0,-42.0,-37.0,0.0
1,2802425,108129,Cash loans,25188.615,607500.0,679671.0,,607500.0,THURSDAY,11,Y,1,,,,XNA,Approved,-164,XNA,XAP,Unaccompanied,Repeater,XNA,Cash,x-sell,Contact center,-1,XNA,36.0,low_action,Cash X-Sell: low,365243.0,-134.0,916.0,365243.0,365243.0,1.0
2,2523466,122040,Cash loans,15060.735,112500.0,136444.5,,112500.0,TUESDAY,11,Y,1,,,,XNA,Approved,-301,Cash through the bank,XAP,"Spouse, partner",Repeater,XNA,Cash,x-sell,Credit and cash offices,-1,XNA,12.0,high,Cash X-Sell: high,365243.0,-271.0,59.0,365243.0,365243.0,1.0


In [62]:
# create feature that aligns with what we did for the train set
# changing the process start hours to morning, afternoon or dusk
pre_app['HOUR_APPR_PROCESS_START'] = pre_app['HOUR_APPR_PROCESS_START'].apply(lambda x: 'morning' if (x>=7 and x<=12) else 'afternoon' if (x>=13 and x<=20) else 'dusk')

In [63]:
pre_app = pd.get_dummies(pre_app, columns=['NAME_CONTRACT_TYPE', 'NAME_CONTRACT_STATUS',
                                           'WEEKDAY_APPR_PROCESS_START', 'NAME_TYPE_SUITE', 
                                           'NAME_CLIENT_TYPE', 'NAME_PRODUCT_TYPE',
                                           'CHANNEL_TYPE', 'NAME_YIELD_GROUP', 
                                           'PRODUCT_COMBINATION', 'HOUR_APPR_PROCESS_START'])

In [64]:
# Feature engineering: ratios and difference
pre_app['APPLICATION_CREDIT_DIFF'] = pre_app['AMT_APPLICATION'] - pre_app['AMT_CREDIT']
pre_app['APPLICATION_CREDIT_RATIO'] = pre_app['AMT_APPLICATION'] / pre_app['AMT_CREDIT']
pre_app['CREDIT_TO_ANNUITY_RATIO'] = pre_app['AMT_CREDIT'] / pre_app['AMT_ANNUITY']
pre_app['DOWN_PAYMENT_TO_CREDIT'] = pre_app['AMT_DOWN_PAYMENT'] / pre_app['AMT_CREDIT']

In [65]:
# Interest ratio on previous application (simplified)
total_payment = pre_app['AMT_ANNUITY'] * pre_app['CNT_PAYMENT']
pre_app['SIMPLE_INTERESTS'] = (total_payment/pre_app['AMT_CREDIT'] - 1)/pre_app['CNT_PAYMENT']

In [66]:
# Active loans - approved and not complete yet (last_due 365243)
approved = pre_app.loc[pre_app['NAME_CONTRACT_STATUS_Approved'] == 1]
active_df = approved[approved['DAYS_LAST_DUE'] == 365243]
    
# Find how much was already payed in active loans (using installments payment df)
active_pay = install_pay.loc[install_pay['SK_ID_PREV'].isin(active_df['SK_ID_PREV'])]
active_pay_agg = active_pay.groupby('SK_ID_PREV')[['AMT_INSTALMENT', 'AMT_PAYMENT']].sum()
active_pay_agg.reset_index(inplace= True)
    
# Active loans: difference of what was payed and installments
active_pay_agg['INSTALMENT_PAYMENT_DIFF'] = active_pay_agg['AMT_INSTALMENT'] - active_pay_agg['AMT_PAYMENT']

In [67]:
# Merge with active_df and calculate remaining debt amount and ratio
active_df = active_df.merge(active_pay_agg, on= 'SK_ID_PREV', how= 'left')
active_df['REMAINING_DEBT'] = active_df['AMT_CREDIT'] - active_df['AMT_PAYMENT']
active_df['REPAYMENT_RATIO'] = active_df['AMT_PAYMENT'] / active_df['AMT_CREDIT']

In [68]:
pre_active_agg = {'SK_ID_PREV': ['nunique'],
                  'SIMPLE_INTERESTS': ['mean'],
                  'AMT_ANNUITY': ['max', 'sum'],
                  'AMT_APPLICATION': ['max', 'mean'],
                  'AMT_CREDIT': ['sum'],
                  'AMT_DOWN_PAYMENT': ['max', 'mean'],
                  'DAYS_DECISION': ['min', 'mean'],
                  'CNT_PAYMENT': ['mean', 'sum'],
                  'DAYS_LAST_DUE_1ST_VERSION': ['min', 'max', 'mean'],
                  'AMT_PAYMENT': ['sum'],
                  'INSTALMENT_PAYMENT_DIFF': ['mean', 'max'],
                  'REMAINING_DEBT': ['max', 'mean', 'sum'],
                  'REPAYMENT_RATIO': ['mean'],
                 }

In [69]:
# Perform aggregations for active applications
active_agg_df = group(active_df, 'PREV_ACTIVE_', pre_active_agg)
active_agg_df['TOTAL_REPAYMENT_RATIO'] = active_agg_df['PREV_ACTIVE_AMT_PAYMENT_SUM']/active_agg_df['PREV_ACTIVE_AMT_CREDIT_SUM']

In [70]:
# Change 365243 values to nan (missing)
pre_app['DAYS_FIRST_DRAWING'].replace(365243, np.nan, inplace= True)
pre_app['DAYS_FIRST_DUE'].replace(365243, np.nan, inplace= True)
pre_app['DAYS_LAST_DUE_1ST_VERSION'].replace(365243, np.nan, inplace= True)
pre_app['DAYS_LAST_DUE'].replace(365243, np.nan, inplace= True)
pre_app['DAYS_TERMINATION'].replace(365243, np.nan, inplace= True)

# Days last due difference (scheduled x done)
pre_app['DAYS_LAST_DUE_DIFF'] = pre_app['DAYS_LAST_DUE_1ST_VERSION'] - pre_app['DAYS_LAST_DUE']

# calculate for approved loans only too
approved['DAYS_LAST_DUE_DIFF'] = approved['DAYS_LAST_DUE_1ST_VERSION'] - approved['DAYS_LAST_DUE']

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  approved['DAYS_LAST_DUE_DIFF'] = approved['DAYS_LAST_DUE_1ST_VERSION'] - approved['DAYS_LAST_DUE']


In [71]:
pre_app.head(2)

Unnamed: 0,SK_ID_PREV,SK_ID_CURR,AMT_ANNUITY,AMT_APPLICATION,AMT_CREDIT,AMT_DOWN_PAYMENT,AMT_GOODS_PRICE,FLAG_LAST_APPL_PER_CONTRACT,NFLAG_LAST_APPL_IN_DAY,RATE_DOWN_PAYMENT,RATE_INTEREST_PRIMARY,RATE_INTEREST_PRIVILEGED,NAME_CASH_LOAN_PURPOSE,DAYS_DECISION,NAME_PAYMENT_TYPE,CODE_REJECT_REASON,NAME_GOODS_CATEGORY,NAME_PORTFOLIO,SELLERPLACE_AREA,NAME_SELLER_INDUSTRY,CNT_PAYMENT,DAYS_FIRST_DRAWING,DAYS_FIRST_DUE,DAYS_LAST_DUE_1ST_VERSION,DAYS_LAST_DUE,DAYS_TERMINATION,NFLAG_INSURED_ON_APPROVAL,NAME_CONTRACT_TYPE_Cash loans,NAME_CONTRACT_TYPE_Consumer loans,NAME_CONTRACT_TYPE_Revolving loans,NAME_CONTRACT_TYPE_XNA,NAME_CONTRACT_STATUS_Approved,NAME_CONTRACT_STATUS_Canceled,NAME_CONTRACT_STATUS_Refused,NAME_CONTRACT_STATUS_Unused offer,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group of people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse, partner",NAME_TYPE_SUITE_Unaccompanied,NAME_CLIENT_TYPE_New,NAME_CLIENT_TYPE_Refreshed,NAME_CLIENT_TYPE_Repeater,NAME_CLIENT_TYPE_XNA,NAME_PRODUCT_TYPE_XNA,NAME_PRODUCT_TYPE_walk-in,NAME_PRODUCT_TYPE_x-sell,CHANNEL_TYPE_AP+ (Cash loan),CHANNEL_TYPE_Car dealer,CHANNEL_TYPE_Channel of corporate sales,CHANNEL_TYPE_Contact center,CHANNEL_TYPE_Country-wide,CHANNEL_TYPE_Credit and cash offices,CHANNEL_TYPE_Regional / Local,CHANNEL_TYPE_Stone,NAME_YIELD_GROUP_XNA,NAME_YIELD_GROUP_high,NAME_YIELD_GROUP_low_action,NAME_YIELD_GROUP_low_normal,NAME_YIELD_GROUP_middle,PRODUCT_COMBINATION_Card Street,PRODUCT_COMBINATION_Card X-Sell,PRODUCT_COMBINATION_Cash,PRODUCT_COMBINATION_Cash Street: high,PRODUCT_COMBINATION_Cash Street: low,PRODUCT_COMBINATION_Cash Street: middle,PRODUCT_COMBINATION_Cash X-Sell: high,PRODUCT_COMBINATION_Cash X-Sell: low,PRODUCT_COMBINATION_Cash X-Sell: middle,PRODUCT_COMBINATION_POS household with interest,PRODUCT_COMBINATION_POS household without interest,PRODUCT_COMBINATION_POS industry with interest,PRODUCT_COMBINATION_POS industry without interest,PRODUCT_COMBINATION_POS mobile with interest,PRODUCT_COMBINATION_POS mobile without interest,PRODUCT_COMBINATION_POS other with interest,PRODUCT_COMBINATION_POS others without interest,HOUR_APPR_PROCESS_START_afternoon,HOUR_APPR_PROCESS_START_dusk,HOUR_APPR_PROCESS_START_morning,APPLICATION_CREDIT_DIFF,APPLICATION_CREDIT_RATIO,CREDIT_TO_ANNUITY_RATIO,DOWN_PAYMENT_TO_CREDIT,SIMPLE_INTERESTS,DAYS_LAST_DUE_DIFF
0,2030495,271877,1730.43,17145.0,17145.0,0.0,17145.0,Y,1,0.0,0.182832,0.867336,XAP,-73,Cash through the bank,XAP,Mobile,POS,35,Connectivity,12.0,,-42.0,300.0,-42.0,-37.0,0.0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0.0,1.0,9.907942,0.0,0.017596,342.0
1,2802425,108129,25188.615,607500.0,679671.0,,607500.0,Y,1,,,,XNA,-164,XNA,XAP,XNA,Cash,-1,XNA,36.0,,-134.0,916.0,,,1.0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,-72171.0,0.893815,26.983262,,0.009282,


In [72]:
previous_agg = {'SK_ID_PREV': ['nunique'],
                'AMT_ANNUITY': ['min', 'max', 'mean'],
                'AMT_DOWN_PAYMENT': ['max', 'mean'],
                'RATE_DOWN_PAYMENT': ['max', 'mean'],
                'DAYS_DECISION': ['min', 'max', 'mean'],
                'CNT_PAYMENT': ['max', 'mean'],
                'DAYS_TERMINATION': ['max'],
                'CREDIT_TO_ANNUITY_RATIO': ['mean', 'max'],
                'APPLICATION_CREDIT_DIFF': ['min', 'max', 'mean'],
                'APPLICATION_CREDIT_RATIO': ['min', 'max', 'mean', 'std'],
                'DOWN_PAYMENT_TO_CREDIT': ['mean'],
                'NAME_CONTRACT_TYPE_Cash loans': ['mean'],
                'NAME_CONTRACT_TYPE_Consumer loans': ['mean'],
                'NAME_CONTRACT_TYPE_Revolving loans': ['mean'],
                'NAME_CONTRACT_TYPE_XNA': ['mean'],
                'NAME_CONTRACT_TYPE_Cash loans': ['mean'],
                'NAME_CONTRACT_STATUS_Approved': ['mean'],
                'NAME_CONTRACT_STATUS_Canceled': ['mean'],
                'NAME_CONTRACT_STATUS_Refused': ['mean'],
                'NAME_CONTRACT_STATUS_Unused offer': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_MONDAY': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_TUESDAY': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_WEDNESDAY': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_THURSDAY': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_FRIDAY': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_SATURDAY': ['mean'],
                'WEEKDAY_APPR_PROCESS_START_SUNDAY': ['mean'],
                'NAME_TYPE_SUITE_Children': ['mean'], 
                'NAME_TYPE_SUITE_Family': ['mean'], 
                'NAME_TYPE_SUITE_Group of people': ['mean'], 
                'NAME_TYPE_SUITE_Other_A': ['mean'], 
                'NAME_TYPE_SUITE_Other_B': ['mean'], 
                'NAME_TYPE_SUITE_Spouse, partner': ['mean'], 
                'NAME_TYPE_SUITE_Unaccompanied': ['mean'], 
                'NAME_CLIENT_TYPE_New': ['mean'], 
                'NAME_CLIENT_TYPE_Refreshed': ['mean'], 
                'NAME_CLIENT_TYPE_Repeater': ['mean'], 
                'NAME_CLIENT_TYPE_XNA': ['mean'],  
                'NAME_PRODUCT_TYPE_walk-in': ['mean'],
                'NAME_PRODUCT_TYPE_x-sell': ['mean'],
                'CHANNEL_TYPE_AP+ (Cash loan)': ['mean'],
                'CHANNEL_TYPE_Car dealer': ['mean'],
                'CHANNEL_TYPE_Channel of corporate sales': ['mean'],
                'CHANNEL_TYPE_Contact center': ['mean'],
                'CHANNEL_TYPE_Credit and cash offices': ['mean'],
                'CHANNEL_TYPE_Regional / Local': ['mean'],
                'CHANNEL_TYPE_Stone': ['mean'],
                'NAME_YIELD_GROUP_XNA': ['mean'], 
                'NAME_YIELD_GROUP_high': ['mean'], 
                'NAME_YIELD_GROUP_low_action': ['mean'], 
                'NAME_YIELD_GROUP_low_normal': ['mean'], 
                'NAME_YIELD_GROUP_middle': ['mean'], 
                'PRODUCT_COMBINATION_Card Street': ['mean'],
                'PRODUCT_COMBINATION_Card X-Sell': ['mean'],
                'PRODUCT_COMBINATION_Cash': ['mean'],
                'PRODUCT_COMBINATION_Cash Street: high': ['mean'],
                'PRODUCT_COMBINATION_Cash Street: low': ['mean'],
                'PRODUCT_COMBINATION_Cash Street: middle': ['mean'],
                'PRODUCT_COMBINATION_Cash X-Sell: high': ['mean'],
                'PRODUCT_COMBINATION_Cash X-Sell: low': ['mean'],
                'PRODUCT_COMBINATION_Cash X-Sell: middle': ['mean'],
                'PRODUCT_COMBINATION_POS household with interest': ['mean'],
                'PRODUCT_COMBINATION_POS household without interest': ['mean'],
                'PRODUCT_COMBINATION_POS industry with interest': ['mean'],
                'PRODUCT_COMBINATION_POS industry without interest': ['mean'],
                'PRODUCT_COMBINATION_POS mobile with interest': ['mean'],
                'PRODUCT_COMBINATION_POS mobile without interest': ['mean'],
                'PRODUCT_COMBINATION_POS other with interest': ['mean'],
                'PRODUCT_COMBINATION_POS others without interest': ['mean'],
                'HOUR_APPR_PROCESS_START_afternoon': ['mean'],
                'HOUR_APPR_PROCESS_START_dusk': ['mean'],
                'HOUR_APPR_PROCESS_START_morning': ['mean'],
               }

In [73]:
# Perform general aggregations
agg_prev = group(pre_app, 'PREV_', previous_agg)

# Merge active loans dataframe on agg_prev
agg_prev = agg_prev.merge(active_agg_df, how='left', on='SK_ID_CURR')

In [74]:
previous_approved_agg = {'SK_ID_PREV': ['nunique'],
                         'AMT_ANNUITY': ['min', 'max', 'mean'],
                         'AMT_CREDIT': ['min', 'max', 'mean'],
                         'AMT_DOWN_PAYMENT': ['max'],
                         'AMT_GOODS_PRICE': ['max'],
                         'DAYS_DECISION': ['min', 'mean'],
                         'CNT_PAYMENT': ['max', 'mean'],
                         'DAYS_TERMINATION': ['mean'],
                         # Engineered features
                         'CREDIT_TO_ANNUITY_RATIO': ['mean', 'max'],
                         'APPLICATION_CREDIT_DIFF': ['max'],
                         'APPLICATION_CREDIT_RATIO': ['min', 'max', 'mean'],
                         # only applicable for approved applications
                         'DAYS_FIRST_DRAWING': ['max', 'mean'],
                         'DAYS_FIRST_DUE': ['min', 'mean'],
                         'DAYS_LAST_DUE_1ST_VERSION': ['min', 'max', 'mean'],
                         'DAYS_LAST_DUE': ['max', 'mean'],
                         'DAYS_LAST_DUE_DIFF': ['min', 'max', 'mean'],
                         'SIMPLE_INTERESTS': ['min', 'max', 'mean', 'std'],
                        }

previous_refused_agg = {'AMT_APPLICATION': ['max', 'mean'],
                        'AMT_CREDIT': ['min', 'max'],
                        'DAYS_DECISION': ['min', 'max', 'mean'],
                        'CNT_PAYMENT': ['max', 'mean'],
                        # Engineered features
                        'APPLICATION_CREDIT_DIFF': ['min', 'max', 'mean', 'std'],
                        'APPLICATION_CREDIT_RATIO': ['min', 'mean'],
                        'NAME_CONTRACT_TYPE_Consumer loans': ['mean'],
                        'NAME_CONTRACT_TYPE_Cash loans': ['mean'],
                        'NAME_CONTRACT_TYPE_Revolving loans': ['mean'],
                       }

In [75]:
# Aggregations for approved and refused loans
agg_prev = group_and_merge(approved, agg_prev, 'APPROVED_', previous_approved_agg)
refused = pre_app.loc[pre_app['NAME_CONTRACT_STATUS_Refused'] == 1]
agg_prev = group_and_merge(refused, agg_prev, 'REFUSED_', previous_refused_agg)

In [76]:
previous_time_agg = {'AMT_CREDIT': ['sum'],
                     'AMT_ANNUITY': ['mean', 'max'],
                     'SIMPLE_INTERESTS': ['mean', 'max', 'std'],
                     'DAYS_DECISION': ['min', 'mean'],
                     'DAYS_LAST_DUE_1ST_VERSION': ['min', 'max', 'mean'],
                     # Engineered features
                     'APPLICATION_CREDIT_DIFF': ['min'],
                     'APPLICATION_CREDIT_RATIO': ['min', 'max', 'mean'],
                     'NAME_CONTRACT_TYPE_Consumer loans': ['mean'],
                     'NAME_CONTRACT_TYPE_Cash loans': ['mean'],
                     'NAME_CONTRACT_TYPE_Revolving loans': ['mean'],
                    }

In [77]:
# look at history for past 2  years
for time_frame in [12, 24]:
    time_frame_df = pre_app.loc[pre_app['DAYS_DECISION'] >= -30*time_frame]
    prefix = 'PREV_LAST{}M_'.format(time_frame)
    agg_prev = group_and_merge(time_frame_df, agg_prev, prefix, previous_time_agg)

## 6. Combining everything into train and test set
[top](#Contents)

In [78]:
# reading train and test datasets
train_1 = pd.read_csv('../datasets/train_1_eda.csv')
train_2 = pd.read_csv('../datasets/train_2_eda.csv')
train_3 = pd.read_csv('../datasets/train_3_eda.csv')
train_4 = pd.read_csv('../datasets/train_4_eda.csv')

test_1 = pd.read_csv('../datasets/test_1_eda.csv')
test_2 = pd.read_csv('../datasets/test_2_eda.csv')
test_3 = pd.read_csv('../datasets/test_3_eda.csv')
test_4 = pd.read_csv('../datasets/test_4_eda.csv')

train_set = [train_1, train_2, train_3, train_4]
test_set = [test_1, test_2, test_3, test_4]

In [79]:
# install_pay = install_pay_agg
# credit_card = cc_agg
# bureau = agg_bureau
# POS CASH = pos_agg
# previous_app = agg_prev

In [80]:
# create new feature that is the combination of marital status of the applicant and 
# who accomanied the applicant for the loan
for df_train in train_set:
    df_train['TYPE_SUITE_FAMILY_STATUS'] = df_train['NAME_TYPE_SUITE'] + '_' + df_train['NAME_FAMILY_STATUS']
    
for df_test in test_set:
    df_test['TYPE_SUITE_FAMILY_STATUS'] = df_test['NAME_TYPE_SUITE'] + '_' + df_test['NAME_FAMILY_STATUS']    

### 6.1. Merging past & bureau data into train_1 and test_1
`Repeat customer with bureau report`<br>
[top](#Contents)

In [81]:
print(train_1.shape)
print(test_1.shape)

(248631, 51)
(41430, 50)


In [82]:
train_1 = pd.merge(train_1, install_pay_agg, on='SK_ID_CURR', how='left')
train_1 = pd.merge(train_1, cc_agg, on='SK_ID_CURR', how='left')
train_1 = pd.merge(train_1, agg_bureau, on='SK_ID_CURR', how='left')
train_1 = pd.merge(train_1, pos_agg, on='SK_ID_CURR', how='left')
train_1 = pd.merge(train_1, agg_prev, on='SK_ID_CURR', how='left')

test_1 = pd.merge(test_1, install_pay_agg, on='SK_ID_CURR', how='left')
test_1 = pd.merge(test_1, cc_agg, on='SK_ID_CURR', how='left')
test_1 = pd.merge(test_1, agg_bureau, on='SK_ID_CURR', how='left')
test_1 = pd.merge(test_1, pos_agg, on='SK_ID_CURR', how='left')
test_1 = pd.merge(test_1, agg_prev, on='SK_ID_CURR', how='left')

In [83]:
print(train_1.shape)
print(test_1.shape)

(248631, 516)
(41430, 515)


In [84]:
# get dummies for categorical columns
train_1 = pd.get_dummies(train_1, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

test_1 = pd.get_dummies(test_1, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

In [85]:
# check
test_1.head(3)

Unnamed: 0,SK_ID_CURR,NAME_CONTRACT_TYPE,CODE_GENDER,FLAG_OWN_CAR,FLAG_OWN_REALTY,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,NAME_INCOME_TYPE,NAME_EDUCATION_TYPE,REGION_POPULATION_RELATIVE,DAYS_REGISTRATION,DAYS_ID_PUBLISH,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,REGION_RATING_CLIENT_W_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_3,FLAG_DOCUMENT_6,FLAG_DOCUMENT_8,FLAG_DOCUMENT_16,FLAG_DOCUMENT_18,NAME_HOUSING_TYPE_CONVERT,AGE,DAYS_EMPLOYED_PENSION,YRS_EMPLOYED,HAVE_CHILDREN,LOAN_INCOME_RATIO,ANNUITY_INCOME_RATIO,CAR_BINS,FAM_MEMBERS_BIN,AVG_EXT_SOURCE,AVG_OBS_CNT_SOCIAL_CIRCLE,AVG_DEF_CNT_SOCIAL_CIRCLE,RATIO_DEF_OBS_SOCIAL_CIRCLE,INS_SK_ID_PREV_NUNIQUE,INS_DAYS_ENTRY_PAYMENT_MEAN,INS_DAYS_ENTRY_PAYMENT_MIN,INS_DAYS_ENTRY_PAYMENT_MAX,INS_AMT_INSTALMENT_MEAN,INS_AMT_INSTALMENT_MIN,INS_AMT_INSTALMENT_MAX,INS_AMT_INSTALMENT_STD,INS_AMT_PAYMENT_MEAN,INS_AMT_PAYMENT_MIN,INS_AMT_PAYMENT_MAX,INS_AMT_PAYMENT_STD,INS_DAYS_BEFORE_DUE_MEAN,INS_DAYS_BEFORE_DUE_MAX,INS_DAYS_BEFORE_DUE_STD,INS_DAYS_PAST_DUE_MEAN,INS_DAYS_PAST_DUE_MAX,INS_DAYS_PAST_DUE_STD,INS_FLAG_LATE_PAY_MEAN,INS_FLAG_LATE_PAY_SUM,INS_INSTALL_PAY_RATIO_MEAN,INS_INSTALL_PAY_RATIO_STD,INS_LATE_PAY_RATIO_MEAN,INS_LATE_PAY_RATIO_STD,INS_SIGNIFICANT_LATE_PAY_MEAN,INS_SIGNIFICANT_LATE_PAY_SUM,INS_FLAG_15DAYS_DUE_MEAN,INS_FLAG_30DAYS_DUE_MEAN,INS_FLAG_60DAYS_DUE_MEAN,INS_PAYMENT_RATIO_MEAN,INS_FLAG_PAYMENT_OVER_MEAN,INS_24M_SK_ID_PREV_SIZE,INS_24M_DAYS_ENTRY_PAYMENT_MEAN,INS_24M_DAYS_ENTRY_PAYMENT_MIN,INS_24M_DAYS_ENTRY_PAYMENT_MAX,INS_24M_AMT_INSTALMENT_MEAN,INS_24M_AMT_INSTALMENT_MIN,INS_24M_AMT_INSTALMENT_MAX,INS_24M_AMT_INSTALMENT_STD,INS_24M_AMT_PAYMENT_MEAN,INS_24M_AMT_PAYMENT_MIN,INS_24M_AMT_PAYMENT_MAX,INS_24M_AMT_PAYMENT_STD,INS_24M_DAYS_BEFORE_DUE_MEAN,INS_24M_DAYS_BEFORE_DUE_MAX,INS_24M_DAYS_BEFORE_DUE_STD,INS_24M_DAYS_PAST_DUE_MEAN,INS_24M_DAYS_PAST_DUE_MAX,INS_24M_DAYS_PAST_DUE_STD,INS_24M_FLAG_LATE_PAY_MEAN,INS_24M_FLAG_LATE_PAY_SUM,INS_24M_INSTALL_PAY_RATIO_MEAN,INS_24M_INSTALL_PAY_RATIO_STD,INS_24M_LATE_PAY_RATIO_MEAN,INS_24M_LATE_PAY_RATIO_STD,INS_24M_SIGNIFICANT_LATE_PAY_MEAN,INS_24M_SIGNIFICANT_LATE_PAY_SUM,INS_24M_FLAG_15DAYS_DUE_MEAN,INS_24M_FLAG_30DAYS_DUE_MEAN,INS_24M_FLAG_60DAYS_DUE_MEAN,INS_24M_PAYMENT_RATIO_MEAN,INS_24M_FLAG_PAYMENT_OVER_MEAN,INS_48M_SK_ID_PREV_SIZE,INS_48M_DAYS_ENTRY_PAYMENT_MEAN,INS_48M_DAYS_ENTRY_PAYMENT_MIN,INS_48M_DAYS_ENTRY_PAYMENT_MAX,INS_48M_AMT_INSTALMENT_MEAN,INS_48M_AMT_INSTALMENT_MIN,INS_48M_AMT_INSTALMENT_MAX,INS_48M_AMT_INSTALMENT_STD,INS_48M_AMT_PAYMENT_MEAN,INS_48M_AMT_PAYMENT_MIN,INS_48M_AMT_PAYMENT_MAX,INS_48M_AMT_PAYMENT_STD,INS_48M_DAYS_BEFORE_DUE_MEAN,INS_48M_DAYS_BEFORE_DUE_MAX,INS_48M_DAYS_BEFORE_DUE_STD,INS_48M_DAYS_PAST_DUE_MEAN,INS_48M_DAYS_PAST_DUE_MAX,INS_48M_DAYS_PAST_DUE_STD,INS_48M_FLAG_LATE_PAY_MEAN,INS_48M_FLAG_LATE_PAY_SUM,INS_48M_INSTALL_PAY_RATIO_MEAN,INS_48M_INSTALL_PAY_RATIO_STD,INS_48M_LATE_PAY_RATIO_MEAN,INS_48M_LATE_PAY_RATIO_STD,INS_48M_SIGNIFICANT_LATE_PAY_MEAN,INS_48M_SIGNIFICANT_LATE_PAY_SUM,INS_48M_FLAG_15DAYS_DUE_MEAN,INS_48M_FLAG_30DAYS_DUE_MEAN,INS_48M_FLAG_60DAYS_DUE_MEAN,INS_48M_PAYMENT_RATIO_MEAN,INS_48M_FLAG_PAYMENT_OVER_MEAN,CC_MONTHS_BALANCE_MIN,CC_AMT_BALANCE_MAX,CC_AMT_BALANCE_MEAN,CC_AMT_CREDIT_LIMIT_ACTUAL_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_SUM,CC_AMT_DRAWINGS_CURRENT_MAX,CC_AMT_DRAWINGS_CURRENT_SUM,CC_AMT_DRAWINGS_POS_CURRENT_MAX,CC_AMT_DRAWINGS_POS_CURRENT_SUM,CC_AMT_INST_MIN_REGULARITY_MAX,CC_AMT_INST_MIN_REGULARITY_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_MAX,CC_AMT_PAYMENT_TOTAL_CURRENT_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_SUM,CC_AMT_PAYMENT_TOTAL_CURRENT_STD,CC_AMT_TOTAL_RECEIVABLE_MAX,CC_AMT_TOTAL_RECEIVABLE_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_MAX,CC_CNT_DRAWINGS_ATM_CURRENT_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_SUM,CC_CNT_DRAWINGS_CURRENT_MAX,CC_CNT_DRAWINGS_CURRENT_MEAN,CC_CNT_DRAWINGS_CURRENT_SUM,CC_CNT_DRAWINGS_POS_CURRENT_MAX,CC_CNT_DRAWINGS_POS_CURRENT_MEAN,CC_CNT_DRAWINGS_POS_CURRENT_SUM,CC_SK_DPD_MAX,CC_SK_DPD_MEAN,CC_SK_DPD_SUM,CC_SK_DPD_DEF_MAX,CC_SK_DPD_DEF_SUM,CC_USAGE_RATIO_MAX,CC_USAGE_RATIO_MEAN,CC_PAYMENT_RATE_MIN,CC_PAYMENT_RATE_MEAN,CC_DRAWING_LIMIT_RATE_MAX,CC_DRAWING_LIMIT_RATE_MEAN,CC_FLAG_15DAYS_DUE_SUM,CC_FLAG_30DAYS_DUE_SUM,CC_FLAG_60DAYS_DUE_SUM,INS_12M_AMT_BALANCE_MAX,INS_12M_AMT_BALANCE_MEAN,INS_12M_SK_DPD_MAX,INS_12M_SK_DPD_MEAN,INS_12M_SK_DPD_SUM,INS_12M_USAGE_RATIO_MAX,INS_12M_USAGE_RATIO_MEAN,INS_12M_FLAG_15DAYS_DUE_SUM,INS_12M_FLAG_30DAYS_DUE_SUM,INS_12M_FLAG_60DAYS_DUE_SUM,INS_24M_AMT_BALANCE_MAX,INS_24M_AMT_BALANCE_MEAN,INS_24M_SK_DPD_MAX,INS_24M_SK_DPD_MEAN,INS_24M_SK_DPD_SUM,INS_24M_USAGE_RATIO_MAX,INS_24M_USAGE_RATIO_MEAN,INS_24M_FLAG_15DAYS_DUE_SUM,INS_24M_FLAG_30DAYS_DUE_SUM,INS_24M_FLAG_60DAYS_DUE_SUM,INS_36M_AMT_BALANCE_MAX,INS_36M_AMT_BALANCE_MEAN,INS_36M_SK_DPD_MAX,INS_36M_SK_DPD_MEAN,INS_36M_SK_DPD_SUM,INS_36M_USAGE_RATIO_MAX,INS_36M_USAGE_RATIO_MEAN,INS_36M_FLAG_15DAYS_DUE_SUM,INS_36M_FLAG_30DAYS_DUE_SUM,INS_36M_FLAG_60DAYS_DUE_SUM,BUREAU_SK_ID_BUREAU_NUNIQUE,BUREAU_DAYS_CREDIT_MIN,BUREAU_DAYS_CREDIT_MAX,BUREAU_DAYS_CREDIT_MEAN,BUREAU_DAYS_CREDIT_ENDDATE_MIN,BUREAU_DAYS_CREDIT_ENDDATE_MAX,BUREAU_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_MAX,BUREAU_AMT_CREDIT_SUM_MEAN,BUREAU_AMT_CREDIT_SUM_SUM,BUREAU_AMT_CREDIT_SUM_DEBT_MAX,BUREAU_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_AMT_CREDIT_SUM_OVERDUE_MAX,BUREAU_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_OVERDUE_SUM,BUREAU_AMT_ANNUITY_MEAN,BUREAU_DEBT_CREDIT_DIFF_MEAN,BUREAU_DEBT_CREDIT_DIFF_SUM,BUREAU_BB_BAL_MONTHS_BALANCE_MEAN_MEAN,BUREAU_BB_BAL_MONTHS_BALANCE_MEAN_STD,BUREAU_BB_BAL_MONTHS_BALANCE_SIZE_MEAN,BUREAU_BB_BAL_MONTHS_BALANCE_SIZE_SUM,BUREAU_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_BB_BAL_FLAG_DPD_MEAN_MEAN,BUREAU_BB_BAL_STATUS_C_SUM_MEAN,BUREAU_BB_BAL_STATUS_X_MEAN_MEAN,BUREAU_CREDIT_ACTIVE_Active_MEAN,BUREAU_CREDIT_ACTIVE_Closed_MEAN,BUREAU_CREDIT_ACTIVE_Sold_MEAN,BUREAU_CREDIT_ACTIVE_Bad debt_MEAN,BUREAU_CREDIT_TYPE_Consumer credit_MEAN,BUREAU_CREDIT_TYPE_Credit card_MEAN,BUREAU_CREDIT_TYPE_Car loan_MEAN,BUREAU_CREDIT_TYPE_Mortgage_MEAN,BUREAU_CREDIT_TYPE_Microloan_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_MAX,BUREAU_ACTIVE_DAYS_CREDIT_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_ENDDATE_MIN,BUREAU_ACTIVE_DAYS_CREDIT_ENDDATE_MAX,BUREAU_ACTIVE_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_ACTIVE_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_ACTIVE_AMT_CREDIT_SUM_MAX,BUREAU_ACTIVE_AMT_CREDIT_SUM_SUM,BUREAU_ACTIVE_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_ACTIVE_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_ACTIVE_AMT_CREDIT_SUM_OVERDUE_MAX,BUREAU_ACTIVE_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_UPDATE_MIN,BUREAU_ACTIVE_DAYS_CREDIT_UPDATE_MEAN,BUREAU_ACTIVE_DEBT_PERCENTAGE_MEAN,BUREAU_ACTIVE_DEBT_CREDIT_DIFF_MEAN,BUREAU_ACTIVE_CREDIT_TO_ANNUITY_RATIO_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_MEAN_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_MEAN_STD,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_SIZE_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_SIZE_SUM,BUREAU_LAST12M_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_LAST12M_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_MAX,BUREAU_LAST12M_AMT_CREDIT_SUM_SUM,BUREAU_LAST12M_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_LAST12M_DEBT_PERCENTAGE_MEAN,BUREAU_LAST12M_DEBT_CREDIT_DIFF_MEAN,BUREAU_LAST12M_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_LAST12M_BB_BAL_FLAG_DPD_MEAN_MEAN,BUREAU_LAST24M_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_LAST24M_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_MAX,BUREAU_LAST24M_AMT_CREDIT_SUM_SUM,BUREAU_LAST24M_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_LAST24M_DEBT_PERCENTAGE_MEAN,BUREAU_LAST24M_DEBT_CREDIT_DIFF_MEAN,BUREAU_LAST24M_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_LAST24M_BB_BAL_FLAG_DPD_MEAN_MEAN,POS_SK_ID_PREV_NUNIQUE,POS_MONTHS_BALANCE_MIN,POS_MONTHS_BALANCE_MAX,POS_MONTHS_BALANCE_SIZE,POS_SK_DPD_MAX,POS_SK_DPD_MEAN,POS_SK_DPD_SUM,POS_SK_DPD_STD,POS_SK_DPD_DEF_MAX,POS_SK_DPD_DEF_MEAN,POS_SK_DPD_DEF_SUM,POS_FLAG_LATE_PAYMENT_MEAN,POS_NAME_CONTRACT_STATUS_Active_MEAN,POS_NAME_CONTRACT_STATUS_Approved_MEAN,POS_NAME_CONTRACT_STATUS_Canceled_MEAN,POS_NAME_CONTRACT_STATUS_Completed_MEAN,POS_NAME_CONTRACT_STATUS_Demand_MEAN,POS_NAME_CONTRACT_STATUS_Returned to the store_MEAN,POS_NAME_CONTRACT_STATUS_Signed_MEAN,POS_LOAN_COMPLETED_MEAN,POS_COMPLETED_BEFORE_MEAN,POS_REMAINING_INSTALMENTS,POS_REMAINING_INSTALMENTS_RATIO,PREV_SK_ID_PREV_NUNIQUE,PREV_AMT_ANNUITY_MIN,PREV_AMT_ANNUITY_MAX,PREV_AMT_ANNUITY_MEAN,PREV_AMT_DOWN_PAYMENT_MAX,PREV_AMT_DOWN_PAYMENT_MEAN,PREV_RATE_DOWN_PAYMENT_MAX,PREV_RATE_DOWN_PAYMENT_MEAN,PREV_DAYS_DECISION_MIN,PREV_DAYS_DECISION_MAX,PREV_DAYS_DECISION_MEAN,PREV_CNT_PAYMENT_MAX,PREV_CNT_PAYMENT_MEAN,PREV_DAYS_TERMINATION_MAX,PREV_CREDIT_TO_ANNUITY_RATIO_MEAN,PREV_CREDIT_TO_ANNUITY_RATIO_MAX,PREV_APPLICATION_CREDIT_DIFF_MIN,PREV_APPLICATION_CREDIT_DIFF_MAX,PREV_APPLICATION_CREDIT_DIFF_MEAN,PREV_APPLICATION_CREDIT_RATIO_MIN,PREV_APPLICATION_CREDIT_RATIO_MAX,PREV_APPLICATION_CREDIT_RATIO_MEAN,PREV_APPLICATION_CREDIT_RATIO_STD,PREV_DOWN_PAYMENT_TO_CREDIT_MEAN,PREV_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_NAME_CONTRACT_TYPE_XNA_MEAN,PREV_NAME_CONTRACT_STATUS_Approved_MEAN,PREV_NAME_CONTRACT_STATUS_Canceled_MEAN,PREV_NAME_CONTRACT_STATUS_Refused_MEAN,PREV_NAME_CONTRACT_STATUS_Unused offer_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN,PREV_NAME_TYPE_SUITE_Children_MEAN,PREV_NAME_TYPE_SUITE_Family_MEAN,PREV_NAME_TYPE_SUITE_Group of people_MEAN,PREV_NAME_TYPE_SUITE_Other_A_MEAN,PREV_NAME_TYPE_SUITE_Other_B_MEAN,"PREV_NAME_TYPE_SUITE_Spouse, partner_MEAN",PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN,PREV_NAME_CLIENT_TYPE_New_MEAN,PREV_NAME_CLIENT_TYPE_Refreshed_MEAN,PREV_NAME_CLIENT_TYPE_Repeater_MEAN,PREV_NAME_CLIENT_TYPE_XNA_MEAN,PREV_NAME_PRODUCT_TYPE_walk-in_MEAN,PREV_NAME_PRODUCT_TYPE_x-sell_MEAN,PREV_CHANNEL_TYPE_AP+ (Cash loan)_MEAN,PREV_CHANNEL_TYPE_Car dealer_MEAN,PREV_CHANNEL_TYPE_Channel of corporate sales_MEAN,PREV_CHANNEL_TYPE_Contact center_MEAN,PREV_CHANNEL_TYPE_Credit and cash offices_MEAN,PREV_CHANNEL_TYPE_Regional / Local_MEAN,PREV_CHANNEL_TYPE_Stone_MEAN,PREV_NAME_YIELD_GROUP_XNA_MEAN,PREV_NAME_YIELD_GROUP_high_MEAN,PREV_NAME_YIELD_GROUP_low_action_MEAN,PREV_NAME_YIELD_GROUP_low_normal_MEAN,PREV_NAME_YIELD_GROUP_middle_MEAN,PREV_PRODUCT_COMBINATION_Card Street_MEAN,PREV_PRODUCT_COMBINATION_Card X-Sell_MEAN,PREV_PRODUCT_COMBINATION_Cash_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: high_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: low_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: middle_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: high_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: low_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: middle_MEAN,PREV_PRODUCT_COMBINATION_POS household with interest_MEAN,PREV_PRODUCT_COMBINATION_POS household without interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry with interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry without interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile with interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile without interest_MEAN,PREV_PRODUCT_COMBINATION_POS other with interest_MEAN,PREV_PRODUCT_COMBINATION_POS others without interest_MEAN,PREV_HOUR_APPR_PROCESS_START_afternoon_MEAN,PREV_HOUR_APPR_PROCESS_START_dusk_MEAN,PREV_HOUR_APPR_PROCESS_START_morning_MEAN,PREV_ACTIVE_SK_ID_PREV_NUNIQUE,PREV_ACTIVE_SIMPLE_INTERESTS_MEAN,PREV_ACTIVE_AMT_ANNUITY_MAX,PREV_ACTIVE_AMT_ANNUITY_SUM,PREV_ACTIVE_AMT_APPLICATION_MAX,PREV_ACTIVE_AMT_APPLICATION_MEAN,PREV_ACTIVE_AMT_CREDIT_SUM,PREV_ACTIVE_AMT_DOWN_PAYMENT_MAX,PREV_ACTIVE_AMT_DOWN_PAYMENT_MEAN,PREV_ACTIVE_DAYS_DECISION_MIN,PREV_ACTIVE_DAYS_DECISION_MEAN,PREV_ACTIVE_CNT_PAYMENT_MEAN,PREV_ACTIVE_CNT_PAYMENT_SUM,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_ACTIVE_AMT_PAYMENT_SUM,PREV_ACTIVE_INSTALMENT_PAYMENT_DIFF_MEAN,PREV_ACTIVE_INSTALMENT_PAYMENT_DIFF_MAX,PREV_ACTIVE_REMAINING_DEBT_MAX,PREV_ACTIVE_REMAINING_DEBT_MEAN,PREV_ACTIVE_REMAINING_DEBT_SUM,PREV_ACTIVE_REPAYMENT_RATIO_MEAN,TOTAL_REPAYMENT_RATIO,APPROVED_SK_ID_PREV_NUNIQUE,APPROVED_AMT_ANNUITY_MIN,APPROVED_AMT_ANNUITY_MAX,APPROVED_AMT_ANNUITY_MEAN,APPROVED_AMT_CREDIT_MIN,APPROVED_AMT_CREDIT_MAX,APPROVED_AMT_CREDIT_MEAN,APPROVED_AMT_DOWN_PAYMENT_MAX,APPROVED_AMT_GOODS_PRICE_MAX,APPROVED_DAYS_DECISION_MIN,APPROVED_DAYS_DECISION_MEAN,APPROVED_CNT_PAYMENT_MAX,APPROVED_CNT_PAYMENT_MEAN,APPROVED_DAYS_TERMINATION_MEAN,APPROVED_CREDIT_TO_ANNUITY_RATIO_MEAN,APPROVED_CREDIT_TO_ANNUITY_RATIO_MAX,APPROVED_APPLICATION_CREDIT_DIFF_MAX,APPROVED_APPLICATION_CREDIT_RATIO_MIN,APPROVED_APPLICATION_CREDIT_RATIO_MAX,APPROVED_APPLICATION_CREDIT_RATIO_MEAN,APPROVED_DAYS_FIRST_DRAWING_MAX,APPROVED_DAYS_FIRST_DRAWING_MEAN,APPROVED_DAYS_FIRST_DUE_MIN,APPROVED_DAYS_FIRST_DUE_MEAN,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MIN,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MAX,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MEAN,APPROVED_DAYS_LAST_DUE_MAX,APPROVED_DAYS_LAST_DUE_MEAN,APPROVED_DAYS_LAST_DUE_DIFF_MIN,APPROVED_DAYS_LAST_DUE_DIFF_MAX,APPROVED_DAYS_LAST_DUE_DIFF_MEAN,APPROVED_SIMPLE_INTERESTS_MIN,APPROVED_SIMPLE_INTERESTS_MAX,APPROVED_SIMPLE_INTERESTS_MEAN,APPROVED_SIMPLE_INTERESTS_STD,REFUSED_AMT_APPLICATION_MAX,REFUSED_AMT_APPLICATION_MEAN,REFUSED_AMT_CREDIT_MIN,REFUSED_AMT_CREDIT_MAX,REFUSED_DAYS_DECISION_MIN,REFUSED_DAYS_DECISION_MAX,REFUSED_DAYS_DECISION_MEAN,REFUSED_CNT_PAYMENT_MAX,REFUSED_CNT_PAYMENT_MEAN,REFUSED_APPLICATION_CREDIT_DIFF_MIN,REFUSED_APPLICATION_CREDIT_DIFF_MAX,REFUSED_APPLICATION_CREDIT_DIFF_MEAN,REFUSED_APPLICATION_CREDIT_DIFF_STD,REFUSED_APPLICATION_CREDIT_RATIO_MIN,REFUSED_APPLICATION_CREDIT_RATIO_MEAN,REFUSED_NAME_CONTRACT_TYPE_Consumer loans_MEAN,REFUSED_NAME_CONTRACT_TYPE_Cash loans_MEAN,REFUSED_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_LAST12M_AMT_CREDIT_SUM,PREV_LAST12M_AMT_ANNUITY_MEAN,PREV_LAST12M_AMT_ANNUITY_MAX,PREV_LAST12M_SIMPLE_INTERESTS_MEAN,PREV_LAST12M_SIMPLE_INTERESTS_MAX,PREV_LAST12M_SIMPLE_INTERESTS_STD,PREV_LAST12M_DAYS_DECISION_MIN,PREV_LAST12M_DAYS_DECISION_MEAN,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_LAST12M_APPLICATION_CREDIT_DIFF_MIN,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MIN,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MAX,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_LAST24M_AMT_CREDIT_SUM,PREV_LAST24M_AMT_ANNUITY_MEAN,PREV_LAST24M_AMT_ANNUITY_MAX,PREV_LAST24M_SIMPLE_INTERESTS_MEAN,PREV_LAST24M_SIMPLE_INTERESTS_MAX,PREV_LAST24M_SIMPLE_INTERESTS_STD,PREV_LAST24M_DAYS_DECISION_MIN,PREV_LAST24M_DAYS_DECISION_MEAN,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_LAST24M_APPLICATION_CREDIT_DIFF_MIN,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MIN,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MAX,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Revolving loans_MEAN,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group of people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse, partner",NAME_TYPE_SUITE_Unaccompanied,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,NAME_FAMILY_STATUS_Civil marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single / not married,NAME_FAMILY_STATUS_Widow,TYPE_SUITE_FAMILY_STATUS_Children_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Children_Married,TYPE_SUITE_FAMILY_STATUS_Children_Separated,TYPE_SUITE_FAMILY_STATUS_Children_Single / not married,TYPE_SUITE_FAMILY_STATUS_Children_Widow,TYPE_SUITE_FAMILY_STATUS_Family_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Family_Married,TYPE_SUITE_FAMILY_STATUS_Family_Separated,TYPE_SUITE_FAMILY_STATUS_Family_Single / not married,TYPE_SUITE_FAMILY_STATUS_Family_Widow,TYPE_SUITE_FAMILY_STATUS_Group of people_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Group of people_Married,TYPE_SUITE_FAMILY_STATUS_Group of people_Separated,TYPE_SUITE_FAMILY_STATUS_Group of people_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_A_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Other_A_Married,TYPE_SUITE_FAMILY_STATUS_Other_A_Separated,TYPE_SUITE_FAMILY_STATUS_Other_A_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_A_Widow,TYPE_SUITE_FAMILY_STATUS_Other_B_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Other_B_Married,TYPE_SUITE_FAMILY_STATUS_Other_B_Separated,TYPE_SUITE_FAMILY_STATUS_Other_B_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_B_Widow,"TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Civil marriage","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Married","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Separated","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Single / not married",TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single / not married,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow,PROCESS_START_PERIOD_afternoon,PROCESS_START_PERIOD_dusk,PROCESS_START_PERIOD_morning
0,100001,1,0,0,1,135000.0,568800.0,20560.5,4,4,0.018850,-5170.0,-812,1,0,1,0,2,0,0,0,0,0.0,0.0,0.0,0.0,-1740.0,1,0,0,0,0,1,52.715068,0,6.380822,0,4.213333,0.152300,0,2.0,0.567263,0.0,0.0,0.0,2.0,-2195.000000,-2916.0,-1628.0,5885.132143,3951.000,17397.900,5076.676624,5885.132143,3951.000,17397.900,5076.676624,8.857143,36.0,12.811825,1.571429,11.0,4.157609,0.142857,1.0,1.000000,0.000000,0.142857,0.377964,0.142857,1.0,0.000000,0.0,0.0,1.000000,0.00,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,7,-1572,-49,-735.000000,-1329.0,1778.0,,,378000.00,2.076236e+05,1453365.00,373239.000,85240.928571,596686.500,0.0,0.0,0.0,3545.357143,122382.642857,856678.500,-19.357143,16.020077,9.428571,66.0,0.454583,0.007519,0.571429,0.425704,0.428571,0.571429,0.0,0.0,1.000000,0.000000,0.0,0.0,0.0,-49.0,-309.333333,411.0,1778.0,,,378000.00,884025.00,1.988955e+05,596686.500,0.0,0.0,-16.0,-10.666667,1.841065,95779.500000,41.943113,-4.833333,4.252450,10.666667,32.0,,,0.0,378000.0,546345.00,241760.25,483520.5,1.269629,31412.25,0.750000,0.0,,,0.0,378000.0,884025.00,198895.50000,596686.500,1.841065,95779.50000,0.710526,0.017544,,,,,,,,,,,,,,,,,,,,,,,,1.0,3951.000,3951.000,3951.00000,2520.0,2520.000,0.104326,0.104326,-1740.0,-1740.0,-1740.000000,8.0,8.000000,-1612.0,6.020501,6.020501,1048.5,1048.5,1048.500,1.044079,1.044079,1.044079,,0.105940,0.000000,1.000000,0.000000,0.0,1.000000,0.000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,1.000000,0.00,0.0,0.0,1.000000,0.0,0.0,0.0,0.0,0.000000,0.000000,1.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.000000,1.000000,0.000000,0.000000,0.000000,0.000,0.000000,0.00,0.000000,0.000000,0.000000,0.000,0.000,0.000000,0.000,0.000000,0.000000,0.0,1.000000,0.0,0.000000,0.0,1.000000,0.00,0.000000,,,,,,,,,,,,,,,,,,,,,,,,,1.0,3951.000,3951.000,3951.0000,23787.000,23787.0,23787.0000,2520.0,24835.5,-1740.0,-1740.000000,8.0,8.000000,-1612.000000,6.020501,6.020501,1048.5,1.044079,1.044079,1.044079,365243.0,365243.000000,-1709.0,-1709.000000,-1499.0,-1499.0,-1499.000000,-1619.0,-1619.000000,120.0,120.0,120.000000,0.041099,0.041099,0.041099,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0
1,100005,1,1,0,1,99000.0,222768.0,17370.0,4,2,0.035792,-9118.0,-1623,1,0,1,0,2,0,0,0,0,0.0,0.0,0.0,0.0,0.0,1,0,0,0,0,1,49.490411,0,12.243836,0,2.250182,0.175455,0,2.0,0.429869,0.0,0.0,0.0,1.0,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1.0,1.000000,0.000000,0.111111,0.333333,0.111111,1.0,0.000000,0.0,0.0,1.000000,0.00,9.0,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1.0,1.000000,0.000000,0.111111,0.333333,0.111111,1.0,0.000000,0.0,0.0,1.000000,0.00,9.0,-609.555556,-736.0,-470.0,6240.205000,4813.200,17656.245,4281.015000,6240.205000,4813.200,17656.245,4281.015000,23.666667,37.0,13.285330,0.111111,1.0,0.333333,0.111111,1.0,1.000000,0.000000,0.111111,0.333333,0.111111,1.0,0.000000,0.0,0.0,1.000000,0.00,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3,-373,-62,-190.666667,-128.0,1324.0,0.0,0.000,568800.00,2.190420e+05,657126.00,543087.000,189469.500000,568408.500,0.0,0.0,0.0,1420.500000,29572.500000,88717.500,-3.666667,3.785939,5.666667,17.0,0.814815,0.000000,0.333333,0.148148,0.666667,0.333333,0.0,0.0,0.666667,0.333333,0.0,0.0,0.0,-62.0,-99.500000,122.0,1324.0,0.0,0.00,568800.00,598626.00,2.842042e+05,568408.500,0.0,0.0,-31.0,-21.000000,1.112619,15108.750000,inf,-1.500000,0.707107,4.000000,8.0,0.0,0.0,0.0,568800.0,598626.00,284204.25,568408.5,1.112619,15108.75,0.833333,0.0,0.0,0.00,0.0,568800.0,657126.00,189469.50000,568408.500,inf,29572.50000,0.814815,0.000000,1.0,-21.0,-21.0,1.0,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,1.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,9.0,0.750000,2.0,4813.200,4813.200,4813.20000,4464.0,4464.000,0.108964,0.108964,-757.0,-315.0,-536.000000,12.0,12.000000,-460.0,8.342371,8.342371,0.0,4464.0,2232.000,1.111173,1.111173,1.111173,,0.111173,0.500000,0.500000,0.000000,0.0,0.500000,0.500,0.000000,0.0,0.000000,0.000000,0.000000,0.500000,0.500000,0.00,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.000000,0.500000,0.0,0.500000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.500000,0.000000,0.000000,0.500000,0.500000,0.000000,0.000000,0.000000,0.000,0.000000,0.50,0.000000,0.000000,0.000000,0.000,0.000,0.000000,0.000,0.000000,0.000000,0.0,0.500000,0.0,0.000000,0.0,0.000000,0.00,1.000000,,,,,,,,,,,,,,,,,,,,,,,,,1.0,4813.200,4813.200,4813.2000,40153.500,40153.5,40153.5000,4464.0,44617.5,-757.0,-757.000000,12.0,12.000000,-460.000000,8.342371,8.342371,4464.0,1.111173,1.111173,1.111173,365243.0,365243.000000,-706.0,-706.000000,-376.0,-376.0,-376.000000,-466.0,-466.000000,90.0,90.0,90.000000,0.036537,0.036537,0.036537,,,,,,,,,,,,,,,,,,,,0.000,,,,,,-315.0,-315.0,,,,0.0,,,,0.0,1.0,0.0,0.000,,,,,,-315.0,-315.000000,,,,0.0,,,,0.000000,1.0,0.000000,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1
2,100013,1,1,1,1,202500.0,663264.0,69777.0,4,4,0.019101,-2175.0,-3503,1,0,1,0,2,0,0,0,0,0.0,0.0,0.0,0.0,-856.0,0,0,1,0,0,1,54.898630,0,12.213699,0,3.275378,0.344578,4,2.0,0.655389,0.0,0.0,0.0,4.0,-1358.109677,-2705.0,-14.0,10897.898516,67.500,357347.745,32242.521804,9740.235774,6.165,357347.745,32222.932746,5.722581,38.0,10.687130,0.541935,21.0,2.596798,0.070968,11.0,0.935484,0.241331,0.058287,0.234070,0.058065,9.0,0.012903,0.0,0.0,1.000000,0.00,146.0,-1327.184932,-2705.0,-14.0,11124.233630,67.500,357347.745,33211.179833,9895.208116,6.165,357347.745,33198.089331,4.178082,32.0,8.605279,0.575342,21.0,2.672557,0.075342,11.0,0.931507,0.248156,0.061880,0.240761,0.061644,9.0,0.013699,0.0,0.0,1.000000,0.00,146.0,-1327.184932,-2705.0,-14.0,11124.233630,67.500,357347.745,33211.179833,9895.208116,6.165,357347.745,33198.089331,4.178082,32.0,8.605279,0.575342,21.0,2.672557,0.075342,11.0,0.931507,0.248156,0.061880,0.240761,0.061644,9.0,0.013699,0.0,0.0,1.000000,0.00,-96.0,161420.220,18159.919219,157500.0,157500.0,571500.0,157500.00,571500.00,0.00,0.00,7875.000,1454.539551,153675.0,6817.172344,654448.545,21730.655260,161420.220,18101.079844,7.0,0.255556,23.0,7.0,0.239583,23.0,0.0,0.000000,0.0,1.0,0.010417,1.0,1.0,1.0,1.024890,0.115301,0.000000,inf,1.000,0.040317,0.0,0.0,0.0,161420.220,18159.919219,1.0,0.010417,1.0,1.024890,0.115301,0.0,0.0,0.0,161420.220,18159.919219,1.0,0.010417,1.0,1.024890,0.115301,0.0,0.0,0.0,161420.220,18159.919219,1.0,0.010417,1.0,1.024890,0.115301,0.0,0.0,0.0,4,-2070,-1210,-1737.500000,-1707.0,-567.0,19305.0,19305.000,1262250.00,5.180700e+05,2072280.06,0.000,0.000000,0.000,0.0,0.0,0.0,0.000000,26490.060000,26490.060,-40.750000,16.635805,32.500000,130.0,0.654344,0.063008,0.750000,0.256579,0.000000,1.000000,0.0,0.0,0.500000,0.000000,0.5,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,-66.0,-23.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.666667,0.0,0.0,0.0,0.0,0.0,0.333333,0.0,0.0,34.0,1.194444,4.0,4742.415,23153.985,11478.19500,6750.0,3375.000,0.134434,0.067217,-1999.0,-222.0,-837.500000,36.0,17.333333,-85.0,11.523312,22.128804,-62370.0,3096.0,-15262.875,0.878272,1.064589,0.956503,0.096680,0.070409,0.500000,0.500000,0.000000,0.0,0.750000,0.250,0.000000,0.0,0.250000,0.000000,0.250000,0.250000,0.000000,0.25,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.500000,0.000000,0.0,1.000000,0.0,0.000000,0.250000,0.0,0.0,0.0,0.000000,0.500000,0.250000,0.250000,0.250000,0.250000,0.000000,0.000000,0.500000,0.000,0.000000,0.25,0.000000,0.000000,0.000000,0.000,0.000,0.250000,0.250,0.000000,0.000000,0.0,0.250000,0.0,0.000000,0.0,0.500000,0.00,0.500000,,,,,,,,,,,,,,,,,,,,,,,,,3.0,4742.415,23153.985,11478.1950,24232.500,512370.0,194845.5000,6750.0,450000.0,-1999.0,-1042.666667,36.0,17.333333,-710.333333,11.523312,22.128804,3096.0,0.878272,1.064589,0.956503,365243.0,365243.000000,-1949.0,-1005.666667,-1679.0,224.0,-515.666667,-92.0,-715.666667,0.0,570.0,200.000000,0.017412,0.036400,0.027617,0.009573,,,,,,,,,,,,,,,,,,,24232.500,4742.415,4742.415,0.029038,0.029038,,-273.0,-247.5,-92.0,-92.0,-92.00,-1777.5,0.926648,0.926648,0.926648,0.5,0.5,0.0,24232.500,4742.4150,4742.415,0.029038,0.029038,,-273.0,-247.500000,-92.0,-92.0,-92.0,-1777.5,0.926648,0.926648,0.926648,0.500000,0.5,0.000000,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0
3,100028,1,0,0,1,315000.0,1575000.0,49018.5,4,2,0.026392,-2000.0,-4208,1,0,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-1805.0,1,0,0,0,0,1,38.290411,0,5.112329,1,5.000000,0.155614,0,4.0,0.549372,0.0,0.0,0.0,3.0,-858.548673,-1785.0,-29.0,4979.282257,1.170,38988.540,4943.202131,4356.731549,1.170,38988.540,4741.949982,3.265487,19.0,4.888064,0.265487,7.0,1.017856,0.106195,12.0,0.911504,0.213056,0.074572,0.241249,0.097345,11.0,0.000000,0.0,0.0,1.000000,0.00,89.0,-703.078652,-1302.0,-29.0,4730.878315,1.170,38988.540,5550.205455,3940.448764,1.170,38988.540,5271.875957,2.235955,19.0,4.666180,0.337079,7.0,1.137619,0.134831,12.0,0.887640,0.234650,0.094681,0.268605,0.123596,11.0,0.000000,0.0,0.0,1.000000,0.00,113.0,-858.548673,-1785.0,-29.0,4979.282257,1.170,38988.540,4943.202131,4356.731549,1.170,38988.540,4741.949982,3.265487,19.0,4.888064,0.265487,7.0,1.017856,0.106195,12.0,0.911504,0.213056,0.074572,0.241249,0.097345,11.0,0.000000,0.0,0.0,1.000000,0.00,-49.0,37335.915,8085.058163,225000.0,18000.0,27000.0,22823.55,301663.62,22823.55,274663.62,11250.000,6133.363929,15750.0,5606.152347,274701.465,4629.385588,36980.415,7968.609184,1.0,0.045455,2.0,12.0,2.387755,117.0,12.0,2.613636,115.0,0.0,0.000000,0.0,0.0,0.0,0.165937,0.035934,0.565555,inf,0.080,0.002727,0.0,0.0,0.0,37335.915,8085.058163,0.0,0.000000,0.0,0.165937,0.035934,0.0,0.0,0.0,37335.915,8085.058163,0.0,0.000000,0.0,0.165937,0.035934,0.0,0.0,0.0,37335.915,8085.058163,0.0,0.000000,0.0,0.165937,0.035934,0.0,0.0,0.0,12,-2105,-269,-1401.750000,-1862.0,30885.0,0.0,0.000,393750.00,1.267396e+05,1520875.08,151015.500,18630.450000,186304.500,0.0,0.0,0.0,3012.010714,75722.058000,757220.580,-33.541667,21.604354,25.250000,303.0,0.690276,0.000000,0.500000,0.273147,0.416667,0.583333,0.0,0.0,0.583333,0.416667,0.0,0.0,0.0,-269.0,-1050.400000,-1105.0,30885.0,0.0,0.00,393750.00,864721.08,4.657612e+04,186304.500,0.0,0.0,-913.0,-238.800000,8.957454,71166.645000,56.574381,-17.000000,12.504999,35.000000,175.0,0.0,0.0,0.0,180000.0,308971.08,89295.75,178591.5,2.934431,65189.79,0.727273,0.0,0.0,0.00,0.0,180000.0,308971.08,89295.75000,178591.500,2.934431,65189.79000,0.727273,0.000000,2.0,-49.0,-26.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,21.0,1.458333,5.0,6028.020,11250.000,8091.58500,11250.0,3750.000,0.173124,0.057708,-1805.0,-531.0,-1124.200000,24.0,11.333333,-614.0,16.733328,21.692944,-225000.0,6435.0,-43713.000,0.000000,1.108112,0.777028,0.520520,0.063002,0.200000,0.600000,0.200000,0.0,0.600000,0.200,0.000000,0.2,0.000000,0.000000,0.000000,0.800000,0.000000,0.20,0.0,0.0,0.000000,0.0,0.0,0.0,0.2,0.000000,0.200000,0.0,0.800000,0.0,0.000000,0.200000,0.0,0.0,0.0,0.200000,0.200000,0.000000,0.000000,0.600000,0.000000,0.200000,0.000000,0.200000,0.000,0.200000,0.20,0.000000,0.000000,0.000000,0.000,0.000,0.000000,0.200,0.200000,0.000000,0.0,0.200000,0.0,0.000000,0.0,0.200000,0.00,0.800000,1.0,-inf,11250.000,11250.000,0.000,0.000,225000.000,,,-1490.0,-1490.0,0.0,0.0,365243.0,365243.0,365243.0,283724.460,70348.2300,70348.230,-58724.460,-58724.4600,-58724.460,1.260998,1.260998,3.0,6028.020,11250.000,8091.5850,59521.500,225000.0,138429.0000,11250.0,130765.5,-1805.0,-1364.000000,24.0,11.333333,121182.666667,16.733328,21.692944,6435.0,0.000000,1.108112,0.702704,365243.0,243054.333333,-1773.0,-1271.000000,-1083.0,365243.0,121221.333333,365243.0,121171.333333,0.0,150.0,50.000000,-inf,0.017550,-inf,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.000,,,,,,-531.0,-531.000000,,,,0.0,,,,0.000000,1.0,0.000000,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1
4,100042,1,0,1,1,270000.0,959688.0,34600.5,2,2,0.025164,-6116.0,-2027,1,0,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-1705.0,0,0,1,0,0,1,50.969863,0,32.901370,0,3.554400,0.128150,2,2.0,0.510839,0.0,0.0,0.0,7.0,-1546.208791,-2736.0,-17.0,22120.177995,32.850,1082512.575,94768.693190,21856.803379,32.850,1082512.575,94772.726529,6.307692,32.0,8.655714,0.192308,17.0,1.682325,0.021978,4.0,0.983516,0.117121,0.010682,0.096614,0.010989,2.0,0.010989,0.0,0.0,1.000000,0.00,123.0,-1472.788618,-2526.0,-17.0,13964.004512,32.850,1082512.575,97783.676032,13890.833780,32.850,1082512.575,97792.317557,4.837398,30.0,7.538289,0.260163,17.0,2.035897,0.016260,2.0,0.983740,0.120441,0.000854,0.007034,0.000000,0.0,0.016260,0.0,0.0,1.000000,0.00,153.0,-1419.627451,-2526.0,-17.0,22585.066176,32.850,1082512.575,102610.432745,22271.770882,32.850,1082512.575,102616.220534,5.725490,32.0,8.727026,0.228758,17.0,1.833521,0.026144,4.0,0.980392,0.127564,0.012707,0.105305,0.013072,2.0,0.013072,0.0,0.0,1.000000,0.00,-84.0,93118.455,33356.183036,90000.0,87750.0,265500.0,87750.00,497606.49,7074.00,24174.99,4500.000,2064.370663,87975.0,7369.821429,619065.000,15088.572143,93118.455,33298.140000,3.0,0.226190,19.0,3.0,0.380952,32.0,2.0,0.095238,8.0,1.0,0.023810,2.0,0.0,0.0,1.034649,0.370624,0.965000,inf,0.975,0.035119,0.0,0.0,0.0,93118.455,33356.183036,1.0,0.023810,2.0,1.034649,0.370624,0.0,0.0,0.0,93118.455,33356.183036,1.0,0.023810,2.0,1.034649,0.370624,0.0,0.0,0.0,93118.455,33356.183036,1.0,0.023810,2.0,1.034649,0.370624,0.0,0.0,0.0,14,-2723,-234,-1325.500000,-1627.0,8957.0,5562.0,1312.200,1414269.00,6.814755e+05,9540657.00,1139198.895,256180.241250,3074162.895,0.0,0.0,0.0,17038.687500,467624.508750,5611494.105,-30.035714,24.759974,26.785714,375.0,0.567093,0.015304,0.428571,0.384030,0.571429,0.428571,0.0,0.0,0.785714,0.214286,0.0,0.0,0.0,-234.0,-1009.750000,-1449.0,8957.0,999.0,499.50,1414269.00,4553388.00,4.391661e+05,3074162.895,0.0,0.0,-584.0,-167.250000,inf,153460.729286,inf,-16.250000,10.484683,33.500000,268.0,,,0.0,1414269.0,2204478.00,194500.50,583501.5,inf,540325.50,0.583333,0.0,0.0,0.00,0.0,1414269.0,3518478.00,430675.09875,1722700.395,inf,448944.40125,0.687500,0.000000,1.0,-26.0,-25.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,20.0,0.555556,9.0,4500.000,47660.850,23669.88000,9796.5,2449.125,0.101392,0.025348,-2750.0,-679.0,-1821.777778,36.0,21.111111,-645.0,16.825046,25.129796,-90000.0,2524.5,-42284.000,0.000000,1.026454,0.838218,0.317110,0.025664,0.777778,0.111111,0.111111,0.0,1.000000,0.000,0.000000,0.0,0.333333,0.222222,0.000000,0.222222,0.222222,0.00,0.0,0.0,0.111111,0.0,0.0,0.0,0.0,0.666667,0.111111,0.0,0.888889,0.0,0.555556,0.333333,0.0,0.0,0.0,0.111111,0.777778,0.000000,0.000000,0.111111,0.111111,0.000000,0.333333,0.444444,0.000,0.111111,0.00,0.111111,0.222222,0.222222,0.000,0.000,0.222222,0.000,0.111111,0.000000,0.0,0.000000,0.0,0.000000,0.0,0.555556,0.00,0.444444,,,,,,,,,,,,,,,,,,,,,,,,,9.0,4500.000,47660.850,23669.8800,90000.000,1051789.5,458168.0000,9796.5,967500.0,-2750.0,-1821.777778,36.0,21.111111,50913.714286,16.825046,25.129796,2524.5,0.000000,1.026454,0.838218,365243.0,312701.571429,-2719.0,-1854.000000,-2449.0,365243.0,51239.714286,-649.0,-1461.571429,0.0,366599.0,52701.285714,-inf,0.028667,-inf,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1051789.500,47660.8500,47660.850,0.017536,0.017536,,-679.0,-679.000000,401.0,401.0,401.0,-84289.5,0.919861,0.919861,0.919861,0.000000,1.0,0.000000,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
41425,456202,1,0,1,0,135000.0,252022.5,23112.0,4,2,0.009175,-174.0,-4178,1,0,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-987.0,1,0,0,0,0,1,32.076712,0,1.010959,1,1.866833,0.171200,1,4.0,0.392521,0.0,0.0,0.0,5.0,-297.600000,-579.0,-6.0,17446.546800,1232.505,89155.800,16693.236053,19666.306800,1232.505,89155.800,17327.810392,9.160000,33.0,9.624968,0.040000,1.0,0.200000,0.040000,1.0,1.169423,0.421282,0.040000,0.200000,0.040000,1.0,0.000000,0.0,0.0,1.498847,0.16,25.0,-297.600000,-579.0,-6.0,17446.546800,1232.505,89155.800,16693.236053,19666.306800,1232.505,89155.800,17327.810392,9.160000,33.0,9.624968,0.040000,1.0,0.200000,0.040000,1.0,1.169423,0.421282,0.040000,0.200000,0.040000,1.0,0.000000,0.0,0.0,1.498847,0.16,25.0,-297.600000,-579.0,-6.0,17446.546800,1232.505,89155.800,16693.236053,19666.306800,1232.505,89155.800,17327.810392,9.160000,33.0,9.624968,0.040000,1.0,0.200000,0.040000,1.0,1.169423,0.421282,0.040000,0.200000,0.040000,1.0,0.000000,0.0,0.0,1.498847,0.16,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,5,-651,-165,-499.000000,-420.0,1122.0,,,270000.00,7.605900e+04,380295.00,15322.500,3064.500000,15322.500,0.0,0.0,0.0,0.000000,72994.500000,364972.500,-9.300000,4.764452,14.400000,72.0,0.429167,0.012500,0.200000,0.525000,0.800000,0.200000,0.0,0.0,0.200000,0.800000,0.0,0.0,0.0,-165.0,-485.250000,757.0,1122.0,,,270000.00,337500.00,3.830625e+03,15322.500,0.0,0.0,-171.0,-54.750000,inf,80544.375000,inf,-7.750000,3.774917,16.500000,66.0,,,0.0,67500.0,67500.00,0.00,0.0,inf,67500.00,1.000000,0.0,,,0.0,270000.0,380295.00,3064.50000,15322.500,inf,72994.50000,0.429167,0.012500,1.0,-17.0,-17.0,1.0,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,1.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,9.0,0.692308,6.0,3871.980,21001.500,9433.35750,9000.0,2679.000,0.231451,0.089688,-608.0,-96.0,-279.166667,12.0,7.333333,-79.0,6.386555,10.713520,-6556.5,7128.0,426.750,0.934212,1.213736,1.046662,0.114935,0.100784,0.000000,1.000000,0.000000,0.0,0.833333,0.000,0.166667,0.0,0.166667,0.166667,0.333333,0.333333,0.000000,0.00,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.833333,0.166667,0.0,0.833333,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.666667,0.166667,0.000000,0.333333,0.166667,0.166667,0.333333,0.000,0.000000,0.00,0.000000,0.000000,0.000000,0.000,0.000,0.000000,0.000,0.166667,0.333333,0.0,0.166667,0.0,0.333333,0.0,0.666667,0.00,0.333333,1.0,0.038416,6839.415,6839.415,40477.500,40477.500,33349.500,9000.0,9000.0,-96.0,-96.0,6.0,6.0,84.0,84.0,84.0,20518.245,0.0000,0.000,12831.255,12831.2550,12831.255,0.615249,0.615249,5.0,3871.980,21001.500,10448.8560,20344.500,225000.0,82496.7000,9000.0,225000.0,-608.0,-294.200000,12.0,7.600000,72894.400000,6.613007,10.713520,7128.0,0.934212,1.213736,1.050056,365243.0,365243.000000,-575.0,-263.600000,-245.0,84.0,-65.600000,365243.0,72890.600000,-365159.0,180.0,-72956.200000,0.009290,0.042777,0.024829,0.015567,23566.5,23566.5,22887.0,22887.0,-204.0,-204.0,-204.0,6.0,6.0,679.5,679.5,679.5,,1.029689,1.029689,1.0,0.0,0.0,210370.500,7119.729,13383.495,0.027558,0.042777,0.013358,-301.0,-213.4,-121.0,84.0,-20.75,-6556.5,0.934212,1.213736,1.055994,1.0,0.0,0.0,435370.500,9433.3575,21001.500,0.024633,0.042777,0.013932,-608.0,-279.166667,-245.0,84.0,-65.6,-6556.5,0.934212,1.213736,1.046662,1.000000,0.0,0.000000,0,0,0,0,0,0,1,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0
41426,456221,1,0,0,1,121500.0,412560.0,17473.5,4,2,0.002042,-9094.0,-3399,1,1,1,1,3,0,0,0,0,1.0,0.0,1.0,0.0,-684.0,0,0,0,0,0,1,54.712329,0,14.161644,0,3.395556,0.143815,0,1.0,0.645800,1.0,0.0,0.0,1.0,-630.333333,-661.0,-599.0,91036.455000,14222.430,244664.505,133045.794034,91036.455000,14222.430,244664.505,133045.794034,7.333333,8.0,1.154701,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,3.0,-630.333333,-661.0,-599.0,91036.455000,14222.430,244664.505,133045.794034,91036.455000,14222.430,244664.505,133045.794034,7.333333,8.0,1.154701,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,3.0,-630.333333,-661.0,-599.0,91036.455000,14222.430,244664.505,133045.794034,91036.455000,14222.430,244664.505,133045.794034,7.333333,8.0,1.154701,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,5,-1337,-113,-727.200000,-604.0,793.0,17131.5,11427.750,488070.00,2.237598e+05,1118799.00,278901.000,111294.000000,556470.000,0.0,0.0,0.0,5960.700000,112465.800000,562329.000,-15.900000,14.227614,15.600000,78.0,0.670659,0.102125,0.600000,0.010000,0.400000,0.600000,0.0,0.0,0.600000,0.200000,0.0,0.0,0.2,-303.0,-452.000000,495.0,793.0,17131.5,11427.75,488070.00,837931.50,2.782350e+05,556470.000,0.0,0.0,-28.0,-27.500000,1.506401,140730.750000,28.083958,-7.000000,3.535534,15.000000,30.0,5724.0,5724.0,0.0,349861.5,367861.50,139450.50,278901.0,inf,44480.25,0.400000,0.1,17131.5,11427.75,0.0,488070.0,855931.50,185490.00000,556470.000,inf,99820.50000,0.550000,0.100000,,,,,,,,,,,,,,,,,,,,,,,,1.0,14222.430,14222.430,14222.43000,,,,,-683.0,-683.0,-683.000000,24.0,24.000000,-591.0,17.908332,17.908332,-29700.0,-29700.0,-29700.000,0.883392,0.883392,0.883392,,,1.000000,0.000000,0.000000,0.0,1.000000,0.000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,1.000000,0.00,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,1.000000,1.000000,0.0,0.000000,0.0,1.000000,0.000000,0.0,0.0,0.0,0.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,1.000000,0.000000,0.000,0.000000,0.00,0.000000,1.000000,0.000000,0.000,0.000,0.000000,0.000,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.0,1.000000,0.00,0.000000,,,,,,,,,,,,,,,,,,,,,,,,,1.0,14222.430,14222.430,14222.4300,254700.000,254700.0,254700.0000,,225000.0,-683.0,-683.000000,24.0,24.000000,-591.000000,17.908332,17.908332,-29700.0,0.883392,0.883392,0.883392,365243.0,365243.000000,-653.0,-653.000000,37.0,37.0,37.000000,-593.0,-593.000000,630.0,630.0,630.000000,0.014173,0.014173,0.014173,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,254700.000,14222.4300,14222.430,0.014173,0.014173,,-683.0,-683.000000,37.0,37.0,37.0,-29700.0,0.883392,0.883392,0.883392,0.000000,1.0,0.000000,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0
41427,456223,1,0,1,1,202500.0,315000.0,33205.5,3,2,0.026392,-2681.0,-1504,1,0,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-838.0,1,0,0,0,0,1,43.621918,0,8.320548,1,1.555556,0.163978,4,3.0,0.549995,0.0,0.0,0.0,2.0,-586.375000,-818.0,-33.0,23158.991250,12640.950,81184.005,23487.981155,23158.991250,12640.950,81184.005,23487.981155,31.625000,76.0,22.116171,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,8.0,-586.375000,-818.0,-33.0,23158.991250,12640.950,81184.005,23487.981155,23158.991250,12640.950,81184.005,23487.981155,31.625000,76.0,22.116171,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,8.0,-586.375000,-818.0,-33.0,23158.991250,12640.950,81184.005,23487.981155,23158.991250,12640.950,81184.005,23487.981155,31.625000,76.0,22.116171,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,5,-1017,-218,-539.000000,-701.0,-13.0,0.0,0.000,1932340.50,4.312619e+05,2156309.46,21343.500,4268.700000,21343.500,0.0,0.0,0.0,1263.375000,426993.192000,2134965.960,-14.000000,11.527142,7.800000,39.0,0.673901,0.028571,0.800000,0.175000,0.200000,0.800000,0.0,0.0,0.600000,0.200000,0.0,0.2,0.0,-229.0,-229.000000,,,0.0,0.00,50547.96,50547.96,2.134350e+04,21343.500,0.0,0.0,-45.0,-45.000000,2.368307,29204.460000,10.002565,-3.500000,,8.000000,8.0,0.0,0.0,0.0,1932340.5,2036888.46,7114.50,21343.5,inf,671848.32,0.577381,0.0,0.0,0.00,0.0,1932340.5,2036888.46,7114.50000,21343.500,inf,671848.32000,0.577381,0.000000,3.0,-96.0,-77.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,15.0,2.125000,2.0,12640.950,15761.205,14201.07750,17086.5,8543.250,0.108935,0.054467,-838.0,-84.0,-461.000000,12.0,11.000000,-628.0,9.279289,9.754203,0.0,17086.5,8543.250,1.000000,1.111140,1.055570,0.078588,0.055570,0.000000,1.000000,0.000000,0.0,1.000000,0.000,0.000000,0.0,0.000000,0.000000,0.500000,0.000000,0.500000,0.00,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.000000,0.500000,0.0,0.500000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.500000,0.000000,0.000000,0.000000,0.000000,0.500000,0.500000,0.000,0.000000,0.00,0.000000,0.000000,0.000000,0.000,0.000,0.000000,0.000,0.000000,0.500000,0.0,0.000000,0.5,0.000000,0.0,1.000000,0.00,0.000000,1.0,0.013580,12640.950,12640.950,111295.665,111295.665,111295.665,0.0,0.0,-84.0,-84.0,10.0,10.0,229.0,229.0,229.0,25281.900,0.0000,0.000,86013.765,86013.7650,86013.765,0.227160,0.227160,2.0,12640.950,15761.205,14201.0775,111295.665,153738.0,132516.8325,17086.5,170824.5,-838.0,-461.000000,12.0,11.000000,182307.500000,9.279289,9.754203,17086.5,1.000000,1.111140,1.055570,365243.0,365243.000000,-806.0,-423.500000,-476.0,229.0,-123.500000,365243.0,182293.500000,-365014.0,180.0,-182417.000000,0.013580,0.019187,0.016383,0.003965,,,,,,,,,,,,,,,,,,,111295.665,12640.950,12640.950,0.013580,0.013580,,-84.0,-84.0,229.0,229.0,229.00,0.0,1.000000,1.000000,1.000000,1.0,0.0,0.0,111295.665,12640.9500,12640.950,0.013580,0.013580,,-84.0,-84.000000,229.0,229.0,229.0,0.0,1.000000,1.000000,1.000000,1.000000,0.0,0.000000,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1
41428,456224,1,1,0,0,225000.0,450000.0,25128.0,3,4,0.018850,-1461.0,-1364,1,1,1,1,2,0,1,0,1,0.0,0.0,0.0,0.0,-2308.0,1,0,0,0,0,1,38.268493,0,7.482192,0,2.000000,0.111680,0,2.0,0.471416,0.0,0.0,0.0,2.0,-924.965517,-2287.0,-13.0,17269.234138,5519.925,23451.705,8672.791892,17269.234138,5519.925,23451.705,8672.791892,7.275862,15.0,4.757675,0.034483,1.0,0.185695,0.034483,1.0,1.000000,0.000000,0.034483,0.185695,0.034483,1.0,0.000000,0.0,0.0,1.000000,0.00,19.0,-285.631579,-559.0,-13.0,23451.705000,23451.705,23451.705,0.000000,23451.705000,23451.705,23451.705,0.000000,9.631579,14.0,2.732734,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,19.0,-285.631579,-559.0,-13.0,23451.705000,23451.705,23451.705,0.000000,23451.705000,23451.705,23451.705,0.000000,9.631579,14.0,2.732734,0.000000,0.0,0.000000,0.000000,0.0,1.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,1.000000,0.00,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,17,-2738,-515,-1755.823529,-2497.0,980.0,6556.5,1492.488,991189.08,2.263932e+05,3848684.31,380604.060,52511.904000,787678.560,0.0,0.0,0.0,4608.450000,182244.450000,2733666.750,-44.529412,27.609142,26.294118,447.0,0.534876,0.053259,0.588235,0.345612,0.352941,0.647059,0.0,0.0,0.764706,0.235294,0.0,0.0,0.0,-890.0,-1077.500000,-2.0,980.0,0.0,0.00,991189.08,2165689.08,1.312798e+05,787678.560,0.0,0.0,-39.0,-22.500000,6.060414,229668.420000,35.907663,-17.583333,2.922613,36.166667,217.0,,,,,,,,,,,,,,0.0,88294.5,88294.50,0.00000,0.000,inf,88294.50000,0.000000,0.000000,,,,,,,,,,,,,,,,,,,,,,,,5.0,5519.925,23451.705,11486.21625,4500.0,1500.000,0.108985,0.036328,-2308.0,-287.0,-1283.600000,24.0,14.500000,-1998.0,10.944233,19.353582,-52924.5,1417.5,-13820.400,0.824470,1.035027,0.913203,0.088721,0.037066,0.400000,0.600000,0.000000,0.0,0.400000,0.200,0.400000,0.0,0.000000,0.000000,0.200000,0.400000,0.200000,0.00,0.2,0.0,0.000000,0.0,0.0,0.4,0.0,0.000000,0.200000,0.2,0.600000,0.0,0.000000,0.200000,0.0,0.0,0.0,0.000000,0.400000,0.200000,0.200000,0.200000,0.600000,0.000000,0.200000,0.000000,0.000,0.000000,0.20,0.000000,0.000000,0.000000,0.200,0.000,0.000000,0.000,0.000000,0.200000,0.0,0.400000,0.0,0.000000,0.0,0.600000,0.00,0.400000,1.0,0.010003,23451.705,23451.705,400950.000,400950.000,453874.500,0.0,0.0,-577.0,-577.0,24.0,24.0,144.0,144.0,144.0,445582.395,0.0000,0.000,8292.105,8292.1050,8292.105,0.981730,0.981730,2.0,5519.925,23451.705,14485.8150,40468.500,453874.5,247171.5000,4500.0,400950.0,-2308.0,-1442.500000,24.0,17.000000,181622.500000,13.342466,19.353582,1417.5,0.883394,1.035027,0.959211,365243.0,365243.000000,-2272.0,-1409.000000,-2002.0,144.0,-929.000000,365243.0,181620.500000,-365099.0,0.0,-182549.500000,0.010003,0.036401,0.023202,0.018666,80955.0,62977.5,54580.5,88969.5,-1623.0,-1623.0,-1623.0,12.0,12.0,-9580.5,-8014.5,-8797.5,1107.329219,0.824470,0.867194,0.5,0.5,0.0,0.000,,,,,,-287.0,-287.0,,,,0.0,,,,0.0,1.0,0.0,453874.500,23451.7050,23451.705,0.010003,0.010003,,-577.0,-432.000000,144.0,144.0,144.0,-52924.5,0.883394,0.883394,0.883394,0.500000,0.5,0.000000,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1


In [86]:
# for some of these features, we would like to see if they were similar to the past
# i.e. if the applicant apply for the current loan in the morning, 
# did the applicant also mostly apply for loans in the morning previously?

for i in ['morning', 'afternoon', 'dusk']:
    train_1[f'APPR_PROCESS_START_DIV_{i}'] = train_1.apply(lambda x: np.nan if x[f'PROCESS_START_PERIOD_{i}']==0 
                                                              else (x[f'PROCESS_START_PERIOD_{i}'] - x[f'PREV_HOUR_APPR_PROCESS_START_{i}_MEAN']), axis=1)
    
    test_1[f'APPR_PROCESS_START_DIV_{i}'] = test_1.apply(lambda x: np.nan if x[f'PROCESS_START_PERIOD_{i}']==0 
                                                              else (x[f'PROCESS_START_PERIOD_{i}'] - x[f'PREV_HOUR_APPR_PROCESS_START_{i}_MEAN']), axis=1)
    
for j in ['Children', 'Family', 'Group of people', 'Other_A', 'Other_B', 'Spouse, partner', 'Unaccompanied']:
    train_1[f'NAME_TYPE_SUITE_DIV_{j}'] = train_1.apply(lambda x: np.nan if x[f'NAME_TYPE_SUITE_{j}']==0
                                                            else (x[f'NAME_TYPE_SUITE_{j}'] - x[f'PREV_NAME_TYPE_SUITE_{j}_MEAN']), axis=1)
    
    test_1[f'NAME_TYPE_SUITE_DIV_{j}'] = test_1.apply(lambda x: np.nan if x[f'NAME_TYPE_SUITE_{j}']==0
                                                            else (x[f'NAME_TYPE_SUITE_{j}'] - x[f'PREV_NAME_TYPE_SUITE_{j}_MEAN']), axis=1)
    
for k in ['MONDAY', 'TUESDAY', 'WEDNESDAY', 'THURSDAY', 'FRIDAY', 'SATURDAY', 'SUNDAY']:
    train_1[f'WEEKDAY_APPR_PROCESS_DIV_{k}'] = train_1.apply(lambda x: np.nan if x[f'WEEKDAY_APPR_PROCESS_START_{k}']==0
                                                            else (x[f'WEEKDAY_APPR_PROCESS_START_{k}'] - x[f'PREV_WEEKDAY_APPR_PROCESS_START_{k}_MEAN']), axis=1)
    
    test_1[f'WEEKDAY_APPR_PROCESS_DIV_{k}'] = test_1.apply(lambda x: np.nan if x[f'WEEKDAY_APPR_PROCESS_START_{k}']==0
                                                            else (x[f'WEEKDAY_APPR_PROCESS_START_{k}'] - x[f'PREV_WEEKDAY_APPR_PROCESS_START_{k}_MEAN']), axis=1)

In [87]:
train_1.head(3)

Unnamed: 0,SK_ID_CURR,TARGET,NAME_CONTRACT_TYPE,CODE_GENDER,FLAG_OWN_CAR,FLAG_OWN_REALTY,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,NAME_INCOME_TYPE,NAME_EDUCATION_TYPE,REGION_POPULATION_RELATIVE,DAYS_REGISTRATION,DAYS_ID_PUBLISH,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,REGION_RATING_CLIENT_W_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_3,FLAG_DOCUMENT_6,FLAG_DOCUMENT_8,FLAG_DOCUMENT_16,FLAG_DOCUMENT_18,NAME_HOUSING_TYPE_CONVERT,AGE,DAYS_EMPLOYED_PENSION,YRS_EMPLOYED,HAVE_CHILDREN,LOAN_INCOME_RATIO,ANNUITY_INCOME_RATIO,CAR_BINS,FAM_MEMBERS_BIN,AVG_EXT_SOURCE,AVG_OBS_CNT_SOCIAL_CIRCLE,AVG_DEF_CNT_SOCIAL_CIRCLE,RATIO_DEF_OBS_SOCIAL_CIRCLE,INS_SK_ID_PREV_NUNIQUE,INS_DAYS_ENTRY_PAYMENT_MEAN,INS_DAYS_ENTRY_PAYMENT_MIN,INS_DAYS_ENTRY_PAYMENT_MAX,INS_AMT_INSTALMENT_MEAN,INS_AMT_INSTALMENT_MIN,INS_AMT_INSTALMENT_MAX,INS_AMT_INSTALMENT_STD,INS_AMT_PAYMENT_MEAN,INS_AMT_PAYMENT_MIN,INS_AMT_PAYMENT_MAX,INS_AMT_PAYMENT_STD,INS_DAYS_BEFORE_DUE_MEAN,INS_DAYS_BEFORE_DUE_MAX,INS_DAYS_BEFORE_DUE_STD,INS_DAYS_PAST_DUE_MEAN,INS_DAYS_PAST_DUE_MAX,INS_DAYS_PAST_DUE_STD,INS_FLAG_LATE_PAY_MEAN,INS_FLAG_LATE_PAY_SUM,INS_INSTALL_PAY_RATIO_MEAN,INS_INSTALL_PAY_RATIO_STD,INS_LATE_PAY_RATIO_MEAN,INS_LATE_PAY_RATIO_STD,INS_SIGNIFICANT_LATE_PAY_MEAN,INS_SIGNIFICANT_LATE_PAY_SUM,INS_FLAG_15DAYS_DUE_MEAN,INS_FLAG_30DAYS_DUE_MEAN,INS_FLAG_60DAYS_DUE_MEAN,INS_PAYMENT_RATIO_MEAN,INS_FLAG_PAYMENT_OVER_MEAN,INS_24M_SK_ID_PREV_SIZE,INS_24M_DAYS_ENTRY_PAYMENT_MEAN,INS_24M_DAYS_ENTRY_PAYMENT_MIN,INS_24M_DAYS_ENTRY_PAYMENT_MAX,INS_24M_AMT_INSTALMENT_MEAN,INS_24M_AMT_INSTALMENT_MIN,INS_24M_AMT_INSTALMENT_MAX,INS_24M_AMT_INSTALMENT_STD,INS_24M_AMT_PAYMENT_MEAN,INS_24M_AMT_PAYMENT_MIN,INS_24M_AMT_PAYMENT_MAX,INS_24M_AMT_PAYMENT_STD,INS_24M_DAYS_BEFORE_DUE_MEAN,INS_24M_DAYS_BEFORE_DUE_MAX,INS_24M_DAYS_BEFORE_DUE_STD,INS_24M_DAYS_PAST_DUE_MEAN,INS_24M_DAYS_PAST_DUE_MAX,INS_24M_DAYS_PAST_DUE_STD,INS_24M_FLAG_LATE_PAY_MEAN,INS_24M_FLAG_LATE_PAY_SUM,INS_24M_INSTALL_PAY_RATIO_MEAN,INS_24M_INSTALL_PAY_RATIO_STD,INS_24M_LATE_PAY_RATIO_MEAN,INS_24M_LATE_PAY_RATIO_STD,INS_24M_SIGNIFICANT_LATE_PAY_MEAN,INS_24M_SIGNIFICANT_LATE_PAY_SUM,INS_24M_FLAG_15DAYS_DUE_MEAN,INS_24M_FLAG_30DAYS_DUE_MEAN,INS_24M_FLAG_60DAYS_DUE_MEAN,INS_24M_PAYMENT_RATIO_MEAN,INS_24M_FLAG_PAYMENT_OVER_MEAN,INS_48M_SK_ID_PREV_SIZE,INS_48M_DAYS_ENTRY_PAYMENT_MEAN,INS_48M_DAYS_ENTRY_PAYMENT_MIN,INS_48M_DAYS_ENTRY_PAYMENT_MAX,INS_48M_AMT_INSTALMENT_MEAN,INS_48M_AMT_INSTALMENT_MIN,INS_48M_AMT_INSTALMENT_MAX,INS_48M_AMT_INSTALMENT_STD,INS_48M_AMT_PAYMENT_MEAN,INS_48M_AMT_PAYMENT_MIN,INS_48M_AMT_PAYMENT_MAX,INS_48M_AMT_PAYMENT_STD,INS_48M_DAYS_BEFORE_DUE_MEAN,INS_48M_DAYS_BEFORE_DUE_MAX,INS_48M_DAYS_BEFORE_DUE_STD,INS_48M_DAYS_PAST_DUE_MEAN,INS_48M_DAYS_PAST_DUE_MAX,INS_48M_DAYS_PAST_DUE_STD,INS_48M_FLAG_LATE_PAY_MEAN,INS_48M_FLAG_LATE_PAY_SUM,INS_48M_INSTALL_PAY_RATIO_MEAN,INS_48M_INSTALL_PAY_RATIO_STD,INS_48M_LATE_PAY_RATIO_MEAN,INS_48M_LATE_PAY_RATIO_STD,INS_48M_SIGNIFICANT_LATE_PAY_MEAN,INS_48M_SIGNIFICANT_LATE_PAY_SUM,INS_48M_FLAG_15DAYS_DUE_MEAN,INS_48M_FLAG_30DAYS_DUE_MEAN,INS_48M_FLAG_60DAYS_DUE_MEAN,INS_48M_PAYMENT_RATIO_MEAN,INS_48M_FLAG_PAYMENT_OVER_MEAN,CC_MONTHS_BALANCE_MIN,CC_AMT_BALANCE_MAX,CC_AMT_BALANCE_MEAN,CC_AMT_CREDIT_LIMIT_ACTUAL_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_SUM,CC_AMT_DRAWINGS_CURRENT_MAX,CC_AMT_DRAWINGS_CURRENT_SUM,CC_AMT_DRAWINGS_POS_CURRENT_MAX,CC_AMT_DRAWINGS_POS_CURRENT_SUM,CC_AMT_INST_MIN_REGULARITY_MAX,CC_AMT_INST_MIN_REGULARITY_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_MAX,CC_AMT_PAYMENT_TOTAL_CURRENT_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_SUM,CC_AMT_PAYMENT_TOTAL_CURRENT_STD,CC_AMT_TOTAL_RECEIVABLE_MAX,CC_AMT_TOTAL_RECEIVABLE_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_MAX,CC_CNT_DRAWINGS_ATM_CURRENT_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_SUM,CC_CNT_DRAWINGS_CURRENT_MAX,CC_CNT_DRAWINGS_CURRENT_MEAN,CC_CNT_DRAWINGS_CURRENT_SUM,CC_CNT_DRAWINGS_POS_CURRENT_MAX,CC_CNT_DRAWINGS_POS_CURRENT_MEAN,CC_CNT_DRAWINGS_POS_CURRENT_SUM,CC_SK_DPD_MAX,CC_SK_DPD_MEAN,CC_SK_DPD_SUM,CC_SK_DPD_DEF_MAX,CC_SK_DPD_DEF_SUM,CC_USAGE_RATIO_MAX,CC_USAGE_RATIO_MEAN,CC_PAYMENT_RATE_MIN,CC_PAYMENT_RATE_MEAN,CC_DRAWING_LIMIT_RATE_MAX,CC_DRAWING_LIMIT_RATE_MEAN,CC_FLAG_15DAYS_DUE_SUM,CC_FLAG_30DAYS_DUE_SUM,CC_FLAG_60DAYS_DUE_SUM,INS_12M_AMT_BALANCE_MAX,INS_12M_AMT_BALANCE_MEAN,INS_12M_SK_DPD_MAX,INS_12M_SK_DPD_MEAN,INS_12M_SK_DPD_SUM,INS_12M_USAGE_RATIO_MAX,INS_12M_USAGE_RATIO_MEAN,INS_12M_FLAG_15DAYS_DUE_SUM,INS_12M_FLAG_30DAYS_DUE_SUM,INS_12M_FLAG_60DAYS_DUE_SUM,INS_24M_AMT_BALANCE_MAX,INS_24M_AMT_BALANCE_MEAN,INS_24M_SK_DPD_MAX,INS_24M_SK_DPD_MEAN,INS_24M_SK_DPD_SUM,INS_24M_USAGE_RATIO_MAX,INS_24M_USAGE_RATIO_MEAN,INS_24M_FLAG_15DAYS_DUE_SUM,INS_24M_FLAG_30DAYS_DUE_SUM,INS_24M_FLAG_60DAYS_DUE_SUM,INS_36M_AMT_BALANCE_MAX,INS_36M_AMT_BALANCE_MEAN,INS_36M_SK_DPD_MAX,INS_36M_SK_DPD_MEAN,INS_36M_SK_DPD_SUM,INS_36M_USAGE_RATIO_MAX,INS_36M_USAGE_RATIO_MEAN,INS_36M_FLAG_15DAYS_DUE_SUM,INS_36M_FLAG_30DAYS_DUE_SUM,INS_36M_FLAG_60DAYS_DUE_SUM,BUREAU_SK_ID_BUREAU_NUNIQUE,BUREAU_DAYS_CREDIT_MIN,BUREAU_DAYS_CREDIT_MAX,BUREAU_DAYS_CREDIT_MEAN,BUREAU_DAYS_CREDIT_ENDDATE_MIN,BUREAU_DAYS_CREDIT_ENDDATE_MAX,BUREAU_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_MAX,BUREAU_AMT_CREDIT_SUM_MEAN,BUREAU_AMT_CREDIT_SUM_SUM,BUREAU_AMT_CREDIT_SUM_DEBT_MAX,BUREAU_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_AMT_CREDIT_SUM_OVERDUE_MAX,BUREAU_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_AMT_CREDIT_SUM_OVERDUE_SUM,BUREAU_AMT_ANNUITY_MEAN,BUREAU_DEBT_CREDIT_DIFF_MEAN,BUREAU_DEBT_CREDIT_DIFF_SUM,BUREAU_BB_BAL_MONTHS_BALANCE_MEAN_MEAN,BUREAU_BB_BAL_MONTHS_BALANCE_MEAN_STD,BUREAU_BB_BAL_MONTHS_BALANCE_SIZE_MEAN,BUREAU_BB_BAL_MONTHS_BALANCE_SIZE_SUM,BUREAU_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_BB_BAL_FLAG_DPD_MEAN_MEAN,BUREAU_BB_BAL_STATUS_C_SUM_MEAN,BUREAU_BB_BAL_STATUS_X_MEAN_MEAN,BUREAU_CREDIT_ACTIVE_Active_MEAN,BUREAU_CREDIT_ACTIVE_Closed_MEAN,BUREAU_CREDIT_ACTIVE_Sold_MEAN,BUREAU_CREDIT_ACTIVE_Bad debt_MEAN,BUREAU_CREDIT_TYPE_Consumer credit_MEAN,BUREAU_CREDIT_TYPE_Credit card_MEAN,BUREAU_CREDIT_TYPE_Car loan_MEAN,BUREAU_CREDIT_TYPE_Mortgage_MEAN,BUREAU_CREDIT_TYPE_Microloan_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_MAX,BUREAU_ACTIVE_DAYS_CREDIT_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_ENDDATE_MIN,BUREAU_ACTIVE_DAYS_CREDIT_ENDDATE_MAX,BUREAU_ACTIVE_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_ACTIVE_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_ACTIVE_AMT_CREDIT_SUM_MAX,BUREAU_ACTIVE_AMT_CREDIT_SUM_SUM,BUREAU_ACTIVE_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_ACTIVE_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_ACTIVE_AMT_CREDIT_SUM_OVERDUE_MAX,BUREAU_ACTIVE_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_ACTIVE_DAYS_CREDIT_UPDATE_MIN,BUREAU_ACTIVE_DAYS_CREDIT_UPDATE_MEAN,BUREAU_ACTIVE_DEBT_PERCENTAGE_MEAN,BUREAU_ACTIVE_DEBT_CREDIT_DIFF_MEAN,BUREAU_ACTIVE_CREDIT_TO_ANNUITY_RATIO_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_MEAN_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_MEAN_STD,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_SIZE_MEAN,BUREAU_ACTIVE_BB_BAL_MONTHS_BALANCE_SIZE_SUM,BUREAU_LAST12M_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_LAST12M_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_MAX,BUREAU_LAST12M_AMT_CREDIT_SUM_SUM,BUREAU_LAST12M_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_LAST12M_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_LAST12M_DEBT_PERCENTAGE_MEAN,BUREAU_LAST12M_DEBT_CREDIT_DIFF_MEAN,BUREAU_LAST12M_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_LAST12M_BB_BAL_FLAG_DPD_MEAN_MEAN,BUREAU_LAST24M_AMT_CREDIT_MAX_OVERDUE_MAX,BUREAU_LAST24M_AMT_CREDIT_MAX_OVERDUE_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_OVERDUE_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_MAX,BUREAU_LAST24M_AMT_CREDIT_SUM_SUM,BUREAU_LAST24M_AMT_CREDIT_SUM_DEBT_MEAN,BUREAU_LAST24M_AMT_CREDIT_SUM_DEBT_SUM,BUREAU_LAST24M_DEBT_PERCENTAGE_MEAN,BUREAU_LAST24M_DEBT_CREDIT_DIFF_MEAN,BUREAU_LAST24M_BB_BAL_STATUS_0_MEAN_MEAN,BUREAU_LAST24M_BB_BAL_FLAG_DPD_MEAN_MEAN,POS_SK_ID_PREV_NUNIQUE,POS_MONTHS_BALANCE_MIN,POS_MONTHS_BALANCE_MAX,POS_MONTHS_BALANCE_SIZE,POS_SK_DPD_MAX,POS_SK_DPD_MEAN,POS_SK_DPD_SUM,POS_SK_DPD_STD,POS_SK_DPD_DEF_MAX,POS_SK_DPD_DEF_MEAN,POS_SK_DPD_DEF_SUM,POS_FLAG_LATE_PAYMENT_MEAN,POS_NAME_CONTRACT_STATUS_Active_MEAN,POS_NAME_CONTRACT_STATUS_Approved_MEAN,POS_NAME_CONTRACT_STATUS_Canceled_MEAN,POS_NAME_CONTRACT_STATUS_Completed_MEAN,POS_NAME_CONTRACT_STATUS_Demand_MEAN,POS_NAME_CONTRACT_STATUS_Returned to the store_MEAN,POS_NAME_CONTRACT_STATUS_Signed_MEAN,POS_LOAN_COMPLETED_MEAN,POS_COMPLETED_BEFORE_MEAN,POS_REMAINING_INSTALMENTS,POS_REMAINING_INSTALMENTS_RATIO,PREV_SK_ID_PREV_NUNIQUE,PREV_AMT_ANNUITY_MIN,PREV_AMT_ANNUITY_MAX,PREV_AMT_ANNUITY_MEAN,PREV_AMT_DOWN_PAYMENT_MAX,PREV_AMT_DOWN_PAYMENT_MEAN,PREV_RATE_DOWN_PAYMENT_MAX,PREV_RATE_DOWN_PAYMENT_MEAN,PREV_DAYS_DECISION_MIN,PREV_DAYS_DECISION_MAX,PREV_DAYS_DECISION_MEAN,PREV_CNT_PAYMENT_MAX,PREV_CNT_PAYMENT_MEAN,PREV_DAYS_TERMINATION_MAX,PREV_CREDIT_TO_ANNUITY_RATIO_MEAN,PREV_CREDIT_TO_ANNUITY_RATIO_MAX,PREV_APPLICATION_CREDIT_DIFF_MIN,PREV_APPLICATION_CREDIT_DIFF_MAX,PREV_APPLICATION_CREDIT_DIFF_MEAN,PREV_APPLICATION_CREDIT_RATIO_MIN,PREV_APPLICATION_CREDIT_RATIO_MAX,PREV_APPLICATION_CREDIT_RATIO_MEAN,PREV_APPLICATION_CREDIT_RATIO_STD,PREV_DOWN_PAYMENT_TO_CREDIT_MEAN,PREV_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_NAME_CONTRACT_TYPE_XNA_MEAN,PREV_NAME_CONTRACT_STATUS_Approved_MEAN,PREV_NAME_CONTRACT_STATUS_Canceled_MEAN,PREV_NAME_CONTRACT_STATUS_Refused_MEAN,PREV_NAME_CONTRACT_STATUS_Unused offer_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN,PREV_NAME_TYPE_SUITE_Children_MEAN,PREV_NAME_TYPE_SUITE_Family_MEAN,PREV_NAME_TYPE_SUITE_Group of people_MEAN,PREV_NAME_TYPE_SUITE_Other_A_MEAN,PREV_NAME_TYPE_SUITE_Other_B_MEAN,"PREV_NAME_TYPE_SUITE_Spouse, partner_MEAN",PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN,PREV_NAME_CLIENT_TYPE_New_MEAN,PREV_NAME_CLIENT_TYPE_Refreshed_MEAN,PREV_NAME_CLIENT_TYPE_Repeater_MEAN,PREV_NAME_CLIENT_TYPE_XNA_MEAN,PREV_NAME_PRODUCT_TYPE_walk-in_MEAN,PREV_NAME_PRODUCT_TYPE_x-sell_MEAN,PREV_CHANNEL_TYPE_AP+ (Cash loan)_MEAN,PREV_CHANNEL_TYPE_Car dealer_MEAN,PREV_CHANNEL_TYPE_Channel of corporate sales_MEAN,PREV_CHANNEL_TYPE_Contact center_MEAN,PREV_CHANNEL_TYPE_Credit and cash offices_MEAN,PREV_CHANNEL_TYPE_Regional / Local_MEAN,PREV_CHANNEL_TYPE_Stone_MEAN,PREV_NAME_YIELD_GROUP_XNA_MEAN,PREV_NAME_YIELD_GROUP_high_MEAN,PREV_NAME_YIELD_GROUP_low_action_MEAN,PREV_NAME_YIELD_GROUP_low_normal_MEAN,PREV_NAME_YIELD_GROUP_middle_MEAN,PREV_PRODUCT_COMBINATION_Card Street_MEAN,PREV_PRODUCT_COMBINATION_Card X-Sell_MEAN,PREV_PRODUCT_COMBINATION_Cash_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: high_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: low_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: middle_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: high_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: low_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: middle_MEAN,PREV_PRODUCT_COMBINATION_POS household with interest_MEAN,PREV_PRODUCT_COMBINATION_POS household without interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry with interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry without interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile with interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile without interest_MEAN,PREV_PRODUCT_COMBINATION_POS other with interest_MEAN,PREV_PRODUCT_COMBINATION_POS others without interest_MEAN,PREV_HOUR_APPR_PROCESS_START_afternoon_MEAN,PREV_HOUR_APPR_PROCESS_START_dusk_MEAN,PREV_HOUR_APPR_PROCESS_START_morning_MEAN,PREV_ACTIVE_SK_ID_PREV_NUNIQUE,PREV_ACTIVE_SIMPLE_INTERESTS_MEAN,PREV_ACTIVE_AMT_ANNUITY_MAX,PREV_ACTIVE_AMT_ANNUITY_SUM,PREV_ACTIVE_AMT_APPLICATION_MAX,PREV_ACTIVE_AMT_APPLICATION_MEAN,PREV_ACTIVE_AMT_CREDIT_SUM,PREV_ACTIVE_AMT_DOWN_PAYMENT_MAX,PREV_ACTIVE_AMT_DOWN_PAYMENT_MEAN,PREV_ACTIVE_DAYS_DECISION_MIN,PREV_ACTIVE_DAYS_DECISION_MEAN,PREV_ACTIVE_CNT_PAYMENT_MEAN,PREV_ACTIVE_CNT_PAYMENT_SUM,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_ACTIVE_AMT_PAYMENT_SUM,PREV_ACTIVE_INSTALMENT_PAYMENT_DIFF_MEAN,PREV_ACTIVE_INSTALMENT_PAYMENT_DIFF_MAX,PREV_ACTIVE_REMAINING_DEBT_MAX,PREV_ACTIVE_REMAINING_DEBT_MEAN,PREV_ACTIVE_REMAINING_DEBT_SUM,PREV_ACTIVE_REPAYMENT_RATIO_MEAN,TOTAL_REPAYMENT_RATIO,APPROVED_SK_ID_PREV_NUNIQUE,APPROVED_AMT_ANNUITY_MIN,APPROVED_AMT_ANNUITY_MAX,APPROVED_AMT_ANNUITY_MEAN,APPROVED_AMT_CREDIT_MIN,APPROVED_AMT_CREDIT_MAX,APPROVED_AMT_CREDIT_MEAN,APPROVED_AMT_DOWN_PAYMENT_MAX,APPROVED_AMT_GOODS_PRICE_MAX,APPROVED_DAYS_DECISION_MIN,APPROVED_DAYS_DECISION_MEAN,APPROVED_CNT_PAYMENT_MAX,APPROVED_CNT_PAYMENT_MEAN,APPROVED_DAYS_TERMINATION_MEAN,APPROVED_CREDIT_TO_ANNUITY_RATIO_MEAN,APPROVED_CREDIT_TO_ANNUITY_RATIO_MAX,APPROVED_APPLICATION_CREDIT_DIFF_MAX,APPROVED_APPLICATION_CREDIT_RATIO_MIN,APPROVED_APPLICATION_CREDIT_RATIO_MAX,APPROVED_APPLICATION_CREDIT_RATIO_MEAN,APPROVED_DAYS_FIRST_DRAWING_MAX,APPROVED_DAYS_FIRST_DRAWING_MEAN,APPROVED_DAYS_FIRST_DUE_MIN,APPROVED_DAYS_FIRST_DUE_MEAN,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MIN,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MAX,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MEAN,APPROVED_DAYS_LAST_DUE_MAX,APPROVED_DAYS_LAST_DUE_MEAN,APPROVED_DAYS_LAST_DUE_DIFF_MIN,APPROVED_DAYS_LAST_DUE_DIFF_MAX,APPROVED_DAYS_LAST_DUE_DIFF_MEAN,APPROVED_SIMPLE_INTERESTS_MIN,APPROVED_SIMPLE_INTERESTS_MAX,APPROVED_SIMPLE_INTERESTS_MEAN,APPROVED_SIMPLE_INTERESTS_STD,REFUSED_AMT_APPLICATION_MAX,REFUSED_AMT_APPLICATION_MEAN,REFUSED_AMT_CREDIT_MIN,REFUSED_AMT_CREDIT_MAX,REFUSED_DAYS_DECISION_MIN,REFUSED_DAYS_DECISION_MAX,REFUSED_DAYS_DECISION_MEAN,REFUSED_CNT_PAYMENT_MAX,REFUSED_CNT_PAYMENT_MEAN,REFUSED_APPLICATION_CREDIT_DIFF_MIN,REFUSED_APPLICATION_CREDIT_DIFF_MAX,REFUSED_APPLICATION_CREDIT_DIFF_MEAN,REFUSED_APPLICATION_CREDIT_DIFF_STD,REFUSED_APPLICATION_CREDIT_RATIO_MIN,REFUSED_APPLICATION_CREDIT_RATIO_MEAN,REFUSED_NAME_CONTRACT_TYPE_Consumer loans_MEAN,REFUSED_NAME_CONTRACT_TYPE_Cash loans_MEAN,REFUSED_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_LAST12M_AMT_CREDIT_SUM,PREV_LAST12M_AMT_ANNUITY_MEAN,PREV_LAST12M_AMT_ANNUITY_MAX,PREV_LAST12M_SIMPLE_INTERESTS_MEAN,PREV_LAST12M_SIMPLE_INTERESTS_MAX,PREV_LAST12M_SIMPLE_INTERESTS_STD,PREV_LAST12M_DAYS_DECISION_MIN,PREV_LAST12M_DAYS_DECISION_MEAN,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_LAST12M_APPLICATION_CREDIT_DIFF_MIN,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MIN,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MAX,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_LAST24M_AMT_CREDIT_SUM,PREV_LAST24M_AMT_ANNUITY_MEAN,PREV_LAST24M_AMT_ANNUITY_MAX,PREV_LAST24M_SIMPLE_INTERESTS_MEAN,PREV_LAST24M_SIMPLE_INTERESTS_MAX,PREV_LAST24M_SIMPLE_INTERESTS_STD,PREV_LAST24M_DAYS_DECISION_MIN,PREV_LAST24M_DAYS_DECISION_MEAN,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_LAST24M_APPLICATION_CREDIT_DIFF_MIN,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MIN,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MAX,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Revolving loans_MEAN,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group of people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse, partner",NAME_TYPE_SUITE_Unaccompanied,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,NAME_FAMILY_STATUS_Civil marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single / not married,NAME_FAMILY_STATUS_Widow,TYPE_SUITE_FAMILY_STATUS_Children_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Children_Married,TYPE_SUITE_FAMILY_STATUS_Children_Separated,TYPE_SUITE_FAMILY_STATUS_Children_Single / not married,TYPE_SUITE_FAMILY_STATUS_Children_Widow,TYPE_SUITE_FAMILY_STATUS_Family_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Family_Married,TYPE_SUITE_FAMILY_STATUS_Family_Separated,TYPE_SUITE_FAMILY_STATUS_Family_Single / not married,TYPE_SUITE_FAMILY_STATUS_Family_Widow,TYPE_SUITE_FAMILY_STATUS_Group of people_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Group of people_Married,TYPE_SUITE_FAMILY_STATUS_Group of people_Separated,TYPE_SUITE_FAMILY_STATUS_Group of people_Single / not married,TYPE_SUITE_FAMILY_STATUS_Group of people_Widow,TYPE_SUITE_FAMILY_STATUS_Other_A_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Other_A_Married,TYPE_SUITE_FAMILY_STATUS_Other_A_Separated,TYPE_SUITE_FAMILY_STATUS_Other_A_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_A_Widow,TYPE_SUITE_FAMILY_STATUS_Other_B_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Other_B_Married,TYPE_SUITE_FAMILY_STATUS_Other_B_Separated,TYPE_SUITE_FAMILY_STATUS_Other_B_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_B_Widow,"TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Civil marriage","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Married","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Separated","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Single / not married","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Widow",TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single / not married,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow,PROCESS_START_PERIOD_afternoon,PROCESS_START_PERIOD_dusk,PROCESS_START_PERIOD_morning,APPR_PROCESS_START_DIV_morning,APPR_PROCESS_START_DIV_afternoon,APPR_PROCESS_START_DIV_dusk,NAME_TYPE_SUITE_DIV_Children,NAME_TYPE_SUITE_DIV_Family,NAME_TYPE_SUITE_DIV_Group of people,NAME_TYPE_SUITE_DIV_Other_A,NAME_TYPE_SUITE_DIV_Other_B,"NAME_TYPE_SUITE_DIV_Spouse, partner",NAME_TYPE_SUITE_DIV_Unaccompanied,WEEKDAY_APPR_PROCESS_DIV_MONDAY,WEEKDAY_APPR_PROCESS_DIV_TUESDAY,WEEKDAY_APPR_PROCESS_DIV_WEDNESDAY,WEEKDAY_APPR_PROCESS_DIV_THURSDAY,WEEKDAY_APPR_PROCESS_DIV_FRIDAY,WEEKDAY_APPR_PROCESS_DIV_SATURDAY,WEEKDAY_APPR_PROCESS_DIV_SUNDAY
0,100002,1,1,1,0,1,202500.0,406597.5,24700.5,4,2,0.018801,-3648.0,-2120,1,0,1,1,2,0,0,0,0,2.0,2.0,2.0,2.0,-1134.0,1,0,0,0,0,1,25.920548,0,1.745205,0,2.007889,0.121978,0,1.0,0.161787,2.0,2.0,1.0,1.0,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,19.0,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,19.0,-315.421053,-587.0,-49.0,11559.247105,9251.775,53093.745,10058.037722,11559.247105,9251.775,53093.745,10058.037722,20.421053,31.0,4.925171,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,8,-1437,-103,-874.0,-1072.0,780.0,5043.645,1681.029,450000.0,108131.945625,865055.565,245781.0,49156.2,245781.0,0.0,0.0,0.0,0.0,98388.513,491942.565,-22.9375,11.530821,11.625,93.0,0.49256,0.268452,0.75,0.168452,0.25,0.75,0.0,0.0,0.5,0.5,0.0,0.0,0.0,-103.0,-572.5,780.0,780.0,40.5,40.5,450000.0,481988.565,122890.5,245781.0,0.0,0.0,-24.0,-15.5,inf,118103.7825,inf,-14.25,18.031223,9.5,19.0,40.5,40.5,0.0,31988.565,31988.565,0.0,0.0,inf,31988.565,0.5,0.0,5043.645,2542.0725,0.0,120735.0,152723.565,0.0,0.0,inf,50907.855,0.583333,0.166667,1.0,-13.0,-13.0,1.0,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18.0,0.75,1.0,9251.775,9251.775,9251.775,0.0,0.0,0.0,0.0,-606.0,-606.0,-606.0,24.0,24.0,-17.0,19.353584,19.353584,0.0,0.0,0.0,1.0,1.0,1.0,,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,1.0,9251.775,9251.775,9251.775,179055.0,179055.0,179055.0,0.0,179055.0,-606.0,-606.0,24.0,24.0,-17.0,19.353584,19.353584,0.0,1.0,1.0,1.0,365243.0,365243.0,-565.0,-565.0,125.0,125.0,125.0,-25.0,-25.0,150.0,150.0,150.0,0.010003,0.010003,0.010003,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,179055.0,9251.775,9251.775,0.010003,0.010003,,-606.0,-606.0,125.0,125.0,125.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0.0,,,,,,,,,1.0,,,1.0,,,,
1,100003,0,1,0,0,0,270000.0,1293502.5,35698.5,2,4,0.003541,-1186.0,-291,1,0,1,1,1,0,0,0,0,1.0,0.0,1.0,0.0,-828.0,1,0,0,0,0,1,45.931507,0,3.254795,0,4.79075,0.132217,0,2.0,0.466757,1.0,0.0,0.0,3.0,-1385.32,-2324.0,-544.0,64754.586,6662.97,560835.36,110542.5923,64754.586,6662.97,560835.36,110542.5923,7.16,14.0,3.726929,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,13.0,-677.846154,-806.0,-544.0,118314.713077,64275.615,560835.36,134033.060606,118314.713077,64275.615,560835.36,134033.060606,7.538462,14.0,3.950008,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,13.0,-677.846154,-806.0,-544.0,118314.713077,64275.615,560835.36,134033.060606,118314.713077,64275.615,560835.36,134033.060606,7.538462,14.0,3.950008,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,4,-2586,-606,-1400.75,-2434.0,1216.0,0.0,0.0,810000.0,254350.125,1017400.5,0.0,0.0,0.0,0.0,0.0,0.0,,254350.125,1017400.5,,,,0.0,,,,,0.25,0.75,0.0,0.0,0.5,0.5,0.0,0.0,0.0,-606.0,-606.0,1216.0,1216.0,0.0,0.0,810000.0,810000.0,0.0,0.0,0.0,0.0,-43.0,-43.0,inf,810000.0,,,,,0.0,,,,,,,,,,,,0.0,0.0,0.0,810000.0,810000.0,0.0,0.0,inf,810000.0,,,2.0,-66.0,-23.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.25,3.0,6737.31,98356.995,56553.99,6885.0,3442.5,0.100061,0.05003,-2341.0,-746.0,-1305.0,12.0,10.0,-527.0,8.677472,10.531859,-135882.0,756.0,-48754.5,0.868825,1.011109,0.949329,0.072967,0.050585,0.333333,0.666667,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.333333,0.333333,0.333333,0.0,0.666667,0.0,0.0,0.0,0.0,0.333333,0.0,0.666667,0.333333,0.0,0.0,0.333333,0.0,0.0,0.0,0.0,0.333333,0.0,0.333333,0.0,0.0,0.0,0.333333,0.666667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.333333,0.0,0.333333,0.0,0.333333,0.0,0.0,0.0,0.0,0.0,0.666667,0.0,0.333333,,,,,,,,,,,,,,,,,,,,,,,,,3.0,6737.31,98356.995,56553.99,68053.5,1035882.0,484191.0,6885.0,900000.0,-2341.0,-1305.0,12.0,10.0,-1047.333333,8.677472,10.531859,756.0,0.868825,1.011109,0.949329,365243.0,365243.0,-2310.0,-1274.333333,-1980.0,-386.0,-1004.333333,-536.0,-1054.333333,0.0,150.0,50.0,0.011617,0.018533,0.015272,0.003475,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0.666667,,,,0.333333,,,,,,1.0,,,,,,
2,100004,0,0,1,1,1,67500.0,135000.0,6750.0,4,2,0.010032,-4260.0,-2531,1,1,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-815.0,0,0,0,0,0,1,52.180822,0,0.616438,0,2.0,0.1,1,1.0,0.642739,0.0,0.0,0.0,1.0,-761.666667,-795.0,-727.0,7096.155,5357.25,10573.965,3011.87181,7096.155,5357.25,10573.965,3011.87181,7.666667,11.0,4.163332,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3.0,-761.666667,-795.0,-727.0,7096.155,5357.25,10573.965,3011.87181,7096.155,5357.25,10573.965,3011.87181,7.666667,11.0,4.163332,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2,-1326,-408,-867.0,-595.0,-382.0,0.0,0.0,94537.8,94518.9,189037.8,0.0,0.0,0.0,0.0,0.0,0.0,,94518.9,189037.8,,,,0.0,,,,,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,94537.8,94537.8,0.0,0.0,inf,94537.8,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,5357.25,5357.25,5357.25,4860.0,4860.0,0.212008,0.212008,-815.0,-815.0,-815.0,4.0,4.0,-714.0,3.753045,3.753045,4176.0,4176.0,4176.0,1.207699,1.207699,1.207699,,0.241719,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,1.0,5357.25,5357.25,5357.25,20106.0,20106.0,20106.0,4860.0,24282.0,-815.0,-815.0,4.0,4.0,-714.0,3.753045,3.753045,4176.0,1.207699,1.207699,1.207699,365243.0,365243.0,-784.0,-784.0,-694.0,-694.0,-694.0,-724.0,-724.0,30.0,30.0,30.0,0.01645,0.01645,0.01645,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,1.0,,,,,,,,,0.0,1.0,,,,,,
3,100007,0,1,1,0,1,121500.0,513000.0,21865.5,4,2,0.028663,-4311.0,-3458,1,0,1,0,2,0,0,0,1,0.0,0.0,0.0,0.0,-1106.0,0,0,1,0,0,1,54.608219,0,8.323288,0,4.222222,0.179963,0,1.0,0.322738,0.0,0.0,0.0,5.0,-1032.242424,-2318.0,-14.0,12666.444545,1821.78,22678.785,7852.910669,12214.060227,0.18,22678.785,8048.060877,4.590909,31.0,7.047045,0.954545,12.0,2.303388,0.242424,16.0,0.954545,0.209751,0.242394,0.43178,0.242424,16.0,0.0,0.0,0.0,1.0,0.0,29.0,-428.310345,-838.0,-14.0,16298.323448,16037.64,16509.6,238.544058,16298.323448,16037.64,16509.6,238.544058,6.034483,20.0,4.686476,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,56.0,-826.178571,-1742.0,-14.0,14600.98125,3577.05,22678.785,6908.795822,14067.814018,0.18,22678.785,7311.309694,5.410714,31.0,7.360279,0.267857,7.0,1.05298,0.107143,6.0,0.946429,0.22705,0.107108,0.311991,0.107143,6.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,-1149,-1149,-1149.0,-783.0,-783.0,0.0,0.0,146250.0,146250.0,146250.0,0.0,0.0,0.0,0.0,0.0,0.0,,146250.0,146250.0,,,,0.0,,,,,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,4.0,-73.0,-3.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,43.0,3.058333,6.0,1834.29,22678.785,12278.805,3676.5,3390.75,0.21889,0.159516,-2357.0,-374.0,-1222.833333,48.0,20.666667,-347.0,12.644075,21.858453,-59400.0,2560.5,-16108.5,0.791139,1.175185,0.96965,0.128282,0.176401,0.666667,0.333333,0.0,0.0,1.0,0.0,0.0,0.0,0.166667,0.0,0.0,0.166667,0.166667,0.166667,0.333333,0.0,0.333333,0.0,0.0,0.0,0.0,0.333333,0.166667,0.0,0.833333,0.0,0.166667,0.5,0.166667,0.0,0.0,0.0,0.166667,0.166667,0.0,0.0,0.5,0.0,0.0,0.5,0.0,0.0,0.0,0.166667,0.0,0.0,0.0,0.0,0.5,0.166667,0.0,0.0,0.0,0.166667,0.0,0.0,0.0,0.666667,0.0,0.333333,1.0,0.016803,16037.64,16037.64,247500.0,247500.0,274288.5,,,-374.0,-374.0,24.0,24.0,346.0,346.0,346.0,192451.68,0.0,0.0,81836.82,81836.82,81836.82,0.70164,0.70164,6.0,1834.29,22678.785,12278.805,14616.0,284400.0,166638.75,3676.5,247500.0,-2357.0,-1222.833333,48.0,20.666667,72143.8,12.644075,21.858453,2560.5,0.791139,1.175185,0.96965,365243.0,365243.0,-2326.0,-1263.2,-2056.0,346.0,-837.2,365243.0,72136.2,-364897.0,30.0,-72973.4,0.016803,0.036164,0.026538,0.007373,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,274288.5,16037.64,16037.64,0.016803,0.016803,,-374.0,-374.0,346.0,346.0,346.0,-26788.5,0.902335,0.902335,0.902335,0.0,1.0,0.0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0.666667,,,,,,,,,0.666667,,,,0.833333,,,
4,100008,0,1,1,0,1,99000.0,490495.5,27517.5,2,2,0.035792,-4970.0,-477,1,1,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-2536.0,1,0,0,0,0,1,46.413699,0,4.350685,0,4.9545,0.277955,0,2.0,0.487726,0.0,0.0,0.0,4.0,-1237.8,-2519.0,-82.0,27702.964286,8003.475,432218.295,70634.672225,27360.502714,227.16,432218.295,70740.978283,11.514286,28.0,8.378444,37.628571,1317.0,222.613631,0.028571,1.0,0.971429,0.165764,0.000541,0.003203,0.0,0.0,0.028571,0.028571,0.028571,1.0,0.0,18.0,-347.555556,-618.0,-82.0,43790.775,17876.115,432218.295,97007.575331,43790.775,17876.115,432218.295,97007.575331,10.222222,21.0,4.917622,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,18.0,-347.555556,-618.0,-82.0,43790.775,17876.115,432218.295,97007.575331,43790.775,17876.115,432218.295,97007.575331,10.222222,21.0,4.917622,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3,-1097,-78,-757.333333,-853.0,471.0,0.0,0.0,267606.0,156148.5,468445.5,240057.0,80019.0,240057.0,0.0,0.0,0.0,,76129.5,228388.5,,,,0.0,,,,,0.333333,0.666667,0.0,0.0,1.0,0.0,0.0,0.0,0.0,-78.0,-78.0,471.0,471.0,0.0,0.0,267606.0,267606.0,240057.0,240057.0,0.0,0.0,-16.0,-16.0,1.11476,27549.0,,,,,0.0,0.0,0.0,0.0,267606.0,267606.0,240057.0,240057.0,1.11476,27549.0,,,0.0,0.0,0.0,267606.0,267606.0,240057.0,240057.0,1.11476,27549.0,,,1.0,-19.0,-13.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.666667,0.0,0.0,0.333333,0.0,0.0,0.0,0.333333,1.0,0.0,0.0,5.0,8019.09,25309.575,15839.69625,12145.5,5548.5,0.110243,0.073051,-2536.0,-82.0,-1192.0,30.0,14.0,-66.0,10.72694,19.833403,-51975.0,12145.5,-7065.9,0.896459,1.112625,1.030049,0.103504,0.074579,0.4,0.6,0.0,0.0,0.8,0.2,0.0,0.0,0.6,0.0,0.0,0.2,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,0.2,0.2,0.6,0.0,0.0,0.2,0.0,0.0,0.0,0.0,0.2,0.2,0.0,0.2,0.0,0.0,0.6,0.2,0.0,0.0,0.2,0.0,0.0,0.0,0.0,0.0,0.2,0.4,0.0,0.0,0.0,0.2,0.0,0.0,0.0,0.4,0.0,0.6,,,,,,,,,,,,,,,,,,,,,,,,,4.0,8019.09,25309.575,15839.69625,39955.5,501975.0,203459.625,12145.5,450000.0,-2536.0,-1469.5,30.0,14.0,-872.75,10.72694,19.833403,12145.5,0.896459,1.112625,1.030049,365243.0,365243.0,-2491.0,-1434.5,-2341.0,261.0,-1044.5,-69.0,-1209.5,0.0,660.0,165.0,0.01,0.034034,0.018055,0.011098,,,,,,,,,,,,,,,,,,,0.0,,,,,,-82.0,-82.0,,,,0.0,,,,0.0,1.0,0.0,664573.5,21597.705,25309.575,0.013543,0.017087,0.005011,-639.0,-363.666667,-69.0,261.0,96.0,-51975.0,0.896459,1.0,0.948229,0.333333,0.666667,0.0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,,0.6,,,,,,,1.0,,,,1.0,,,,
5,100009,0,1,0,1,1,171000.0,1560726.0,41301.0,3,4,0.035792,-1213.0,-619,1,0,1,1,2,0,0,0,0,1.0,0.0,1.0,0.0,-1562.0,0,0,1,0,0,1,37.747945,0,8.575342,1,9.127053,0.241526,1,3.0,0.663607,1.0,0.0,0.0,8.0,-864.411765,-2914.0,-58.0,9568.531765,6155.28,17341.605,3067.815701,9568.531765,6155.28,17341.605,3067.815701,8.72549,23.0,4.766879,0.137255,7.0,0.980196,0.019608,1.0,1.0,0.0,0.019608,0.140028,0.019608,1.0,0.0,0.0,0.0,1.0,0.0,31.0,-326.193548,-804.0,-58.0,8416.280323,7421.4,10418.67,813.583522,8416.280323,7421.4,10418.67,813.583522,9.903226,21.0,4.011274,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,47.0,-693.659574,-1542.0,-58.0,9858.910213,7421.4,17341.605,3021.82673,9858.910213,7421.4,17341.605,3021.82673,8.659574,21.0,4.294975,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,18,-2882,-239,-1271.5,-2152.0,1402.0,0.0,0.0,1777500.0,266711.75,4800811.5,557959.5,76953.535714,1077349.5,0.0,0.0,0.0,,227088.0,3179232.0,,,,0.0,,,,,0.222222,0.777778,0.0,0.0,0.888889,0.111111,0.0,0.0,0.0,-239.0,-591.75,-209.0,1402.0,,,642861.0,1527561.0,269337.375,1077349.5,0.0,0.0,-847.0,-245.75,inf,112552.875,,,,,0.0,,,0.0,337500.0,337500.0,326628.0,326628.0,1.033286,10872.0,,,,,0.0,642861.0,1402326.0,269337.375,1077349.5,inf,81244.125,,,4.0,-95.0,-10.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.6,0.0,0.0,0.4,0.0,0.0,0.0,1.5,0.0,9.0,1.6,7.0,7435.845,17341.605,10051.412143,22032.0,9203.142857,0.209525,0.126602,-1562.0,-74.0,-719.285714,12.0,8.0,-84.0,7.044559,10.919431,0.0,17671.5,6604.071429,1.0,1.191067,1.095482,0.072435,0.136969,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.142857,0.0,0.285714,0.0,0.0,0.285714,0.285714,0.0,0.285714,0.0,0.0,0.0,0.142857,0.285714,0.0,0.142857,0.857143,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.857143,0.0,0.0,0.285714,0.142857,0.142857,0.428571,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.714286,0.142857,0.0,0.0,0.142857,0.0,0.0,0.0,0.571429,0.0,0.428571,1.0,0.01755,10418.67,10418.67,95841.0,95841.0,88632.0,14377.5,14377.5,-74.0,-74.0,10.0,10.0,227.0,227.0,227.0,10418.67,0.0,0.0,78213.33,78213.33,78213.33,0.11755,0.11755,7.0,7435.845,17341.605,10051.412143,38574.0,98239.5,70137.642857,22032.0,110160.0,-1562.0,-719.285714,12.0,8.0,51672.857143,7.044559,10.919431,17671.5,1.0,1.191067,1.095482,365243.0,365243.0,-1531.0,-688.285714,-1330.0,227.0,-478.285714,365243.0,51666.857143,-365016.0,0.0,-52145.142857,0.008247,0.030703,0.019536,0.008144,,,,,,,,,,,,,,,,,,,171900.0,8913.555,10418.67,0.025346,0.030703,0.006907,-308.0,-229.0,-127.0,227.0,-8.0,1881.0,1.048763,1.081336,1.059644,1.0,0.0,0.0,270139.5,8934.35625,10418.67,0.021071,0.030703,0.010242,-449.0,-284.0,-127.0,227.0,-28.0,0.0,1.0,1.081336,1.044733,1.0,0.0,0.0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,,0.428571,,,,,,,,0.714286,,,,,,,0.714286
6,100010,0,1,1,1,1,360000.0,1530000.0,42075.0,2,4,0.003122,-4597.0,-2379,1,1,1,0,3,0,0,0,1,2.0,0.0,2.0,0.0,-1070.0,1,0,0,0,0,1,51.643836,0,1.230137,0,4.25,0.116875,3,2.0,0.627467,2.0,0.0,0.0,1.0,-915.9,-1069.0,-774.0,27449.208,27321.39,27463.41,44.910667,27449.208,27321.39,27463.41,44.910667,11.9,30.0,6.967384,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10.0,-915.9,-1069.0,-774.0,27449.208,27321.39,27463.41,44.910667,27449.208,27321.39,27463.41,44.910667,11.9,30.0,6.967384,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2,-2741,-1138,-1939.5,-928.0,689.0,,,675000.0,495000.0,990000.0,348007.5,174003.75,348007.5,0.0,0.0,0.0,,320996.25,641992.5,-58.5,37.476659,11.0,22.0,0.909091,0.0,1.0,0.0,0.5,0.5,0.0,0.0,0.5,0.0,0.0,0.0,0.0,-1138.0,-1138.0,689.0,689.0,,,675000.0,675000.0,348007.5,348007.5,0.0,0.0,-18.0,-18.0,1.939613,326992.5,,-32.0,,11.0,11.0,,,,,,,,,,,,,,,,,,,,,,,1.0,-35.0,-28.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.3,1.0,27463.41,27463.41,27463.41,0.0,0.0,0.0,0.0,-1070.0,-1070.0,-1070.0,10.0,10.0,-762.0,9.496672,9.496672,-13599.0,-13599.0,-13599.0,0.947859,0.947859,0.947859,,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,1.0,27463.41,27463.41,27463.41,260811.0,260811.0,260811.0,0.0,247212.0,-1070.0,-1070.0,10.0,10.0,-762.0,9.496672,9.496672,-13599.0,0.947859,0.947859,0.947859,365243.0,365243.0,-1039.0,-1039.0,-769.0,-769.0,-769.0,-769.0,-769.0,0.0,0.0,0.0,0.0053,0.0053,0.0053,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,,0.0,,,,,,,,1.0,1.0,,,,,,
7,100011,0,1,0,0,1,112500.0,1019610.0,33826.5,1,2,0.018634,-7427.0,-3514,0,0,1,0,2,0,0,0,0,1.0,0.0,1.0,0.0,0.0,1,0,0,0,0,1,55.065753,1,,0,9.0632,0.30068,0,2.0,0.514935,1.0,0.0,0.0,3.0,-1150.923077,-2477.0,-37.0,13575.715615,563.355,46485.0,12651.929943,11328.893654,449.685,46485.0,12093.342822,4.807692,32.0,7.762059,7.946154,958.0,83.995507,0.146154,19.0,0.907692,0.252669,0.116381,0.305371,0.138462,18.0,0.007692,0.007692,0.007692,1.0,0.0,113.0,-990.230088,-2234.0,-37.0,13420.147699,563.355,46485.0,13571.335093,11481.503894,461.565,46485.0,12852.525187,4.849558,32.0,7.708091,0.185841,6.0,0.774005,0.079646,9.0,0.938053,0.228043,0.076037,0.259942,0.079646,9.0,0.0,0.0,0.0,1.0,0.0,113.0,-990.230088,-2234.0,-37.0,13420.147699,563.355,46485.0,13571.335093,11481.503894,461.565,46485.0,12852.525187,4.849558,32.0,7.708091,0.185841,6.0,0.774005,0.079646,9.0,0.938053,0.228043,0.076037,0.259942,0.079646,9.0,0.0,0.0,0.0,1.0,0.0,-75.0,189000.0,54482.111149,180000.0,180000.0,180000.0,180000.0,180000.0,0.0,0.0,9000.0,3956.221849,55485.0,4520.067568,334485.0,7473.872687,189000.0,54433.179122,4.0,0.054054,4.0,4.0,0.054054,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.05,0.302678,1.0,inf,1.0,0.013514,0.0,0.0,0.0,189000.0,54482.111149,0.0,0.0,0.0,1.05,0.302678,0.0,0.0,0.0,189000.0,54482.111149,0.0,0.0,0.0,1.05,0.302678,0.0,0.0,0.0,189000.0,54482.111149,0.0,0.0,0.0,1.05,0.302678,0.0,0.0,0.0,4,-2508,-1309,-1773.0,-2173.0,-860.0,10147.23,5073.615,145242.0,108807.075,435228.3,0.0,0.0,0.0,0.0,0.0,0.0,,96662.1,289986.3,,,,0.0,,,,,0.0,1.0,0.0,0.0,0.75,0.25,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,-77.0,-11.0,7.0,8.0,1.142857,8.0,3.023716,8.0,1.142857,8.0,0.142857,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.366667,4.0,9000.0,31295.25,18303.195,13594.5,6797.25,0.10001,0.050005,-2508.0,-1162.0,-1784.5,30.0,14.0,-283.0,17.539667,23.419369,-180000.0,1485.0,-59107.5,0.0,1.011045,0.644008,0.559543,0.050557,0.5,0.25,0.25,0.0,0.75,0.0,0.25,0.0,0.25,0.0,0.25,0.25,0.0,0.25,0.0,0.25,0.0,0.0,0.0,0.0,0.0,0.5,0.25,0.0,0.75,0.0,0.25,0.25,0.0,0.0,0.0,0.25,0.5,0.0,0.0,0.5,0.25,0.25,0.0,0.0,0.0,0.25,0.25,0.0,0.25,0.0,0.0,0.0,0.0,0.25,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.25,0.0,0.75,,,,,,,,,,,,,,,,,,,,,,,,,3.0,9000.0,31295.25,18303.195,134446.5,732915.0,349120.5,13594.5,675000.0,-2508.0,-1992.0,30.0,14.0,121258.0,17.539667,23.419369,1485.0,0.0,1.011045,0.644008,365243.0,242736.333333,-2477.0,-1955.0,-2147.0,365243.0,120935.666667,-289.0,-1231.0,0.0,366500.0,122166.666667,-inf,0.025367,-inf,,0.0,0.0,0.0,0.0,-1162.0,-1162.0,-1162.0,,,0.0,0.0,0.0,,,,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,,0.75,,0.75,,,,,,,,,0.75,,,,
8,100014,0,1,0,0,1,112500.0,652500.0,21177.0,4,4,0.0228,-4427.0,-738,1,0,1,0,2,0,0,0,0,0.0,0.0,0.0,0.0,-844.0,1,0,0,0,0,1,27.936986,0,1.860274,1,5.8,0.18824,0,3.0,0.445189,0.0,0.0,0.0,2.0,-584.473684,-823.0,-36.0,11826.206053,11547.27,14045.625,782.140153,8783.197105,530.1,14045.625,4653.346796,9.263158,30.0,12.008525,1.052632,5.0,1.580214,0.421053,8.0,0.736842,0.380405,0.386798,0.469443,0.421053,8.0,0.0,0.0,0.0,1.0,0.0,19.0,-584.473684,-823.0,-36.0,11826.206053,11547.27,14045.625,782.140153,8783.197105,530.1,14045.625,4653.346796,9.263158,30.0,12.008525,1.052632,5.0,1.580214,0.421053,8.0,0.736842,0.380405,0.386798,0.469443,0.421053,8.0,0.0,0.0,0.0,1.0,0.0,19.0,-584.473684,-823.0,-36.0,11826.206053,11547.27,14045.625,782.140153,8783.197105,530.1,14045.625,4653.346796,9.263158,30.0,12.008525,1.052632,5.0,1.580214,0.421053,8.0,0.736842,0.380405,0.386798,0.469443,0.421053,8.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,8,-2308,-376,-1095.375,-2004.0,723.0,12752.28,3726.3525,900000.0,341241.553125,2729932.425,420201.0,151642.8,758214.0,0.0,0.0,0.0,,343778.985,1718894.925,,,,0.0,,,,,0.25,0.75,0.0,0.0,1.0,0.0,0.0,0.0,0.0,-376.0,-399.5,704.0,723.0,12752.28,6376.14,571500.0,1005750.0,379107.0,758214.0,0.0,0.0,-34.0,-29.5,1.322389,123768.0,,,,,0.0,,,,,,,,,,,,12752.28,6376.14,0.0,571500.0,1188000.0,379107.0,758214.0,1.322389,123768.0,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,11567.475,14045.625,12806.55,0.0,0.0,0.0,0.0,-844.0,-102.0,-473.0,12.0,9.0,-475.0,8.3271,11.399895,-12595.5,0.0,-6297.75,0.904484,1.0,0.952242,0.06754,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.5,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.5,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.5,0.0,1.0,0.0,0.0,1.0,0.023653,14045.625,14045.625,73800.0,73800.0,73800.0,0.0,0.0,-102.0,-102.0,6.0,6.0,86.0,86.0,86.0,28091.25,0.0,0.0,45708.75,45708.75,45708.75,0.38064,0.38064,2.0,11567.475,14045.625,12806.55,73800.0,131868.0,102834.0,0.0,119272.5,-844.0,-473.0,12.0,9.0,182384.0,8.3271,11.399895,0.0,0.904484,1.0,0.952242,365243.0,365243.0,-813.0,-438.5,-483.0,86.0,-198.5,365243.0,182380.0,-365157.0,0.0,-182578.5,0.004387,0.023653,0.01402,0.013624,,,,,,,,,,,,,,,,,,,73800.0,14045.625,14045.625,0.023653,0.023653,,-102.0,-102.0,86.0,86.0,86.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,73800.0,14045.625,14045.625,0.023653,0.023653,,-102.0,-102.0,86.0,86.0,86.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,,0.0,,,,,,,,1.0,,,,,,1.0,
9,100015,0,1,0,0,1,38419.155,148365.0,10678.5,1,2,0.015221,-5246.0,-2512,0,0,1,1,2,0,0,0,0,0.0,0.0,0.0,0.0,-2396.0,0,1,0,0,0,1,55.936986,1,,0,3.861746,0.277947,0,2.0,0.643375,0.0,0.0,0.0,1.0,-2237.9,-2374.0,-2108.0,7658.6805,7584.525,7666.92,26.055587,7658.6805,7584.525,7666.92,26.055587,15.0,29.0,7.67391,2.1,21.0,6.640783,0.1,1.0,1.0,0.0,0.1,0.316228,0.1,1.0,0.1,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,4,-1409,-319,-947.75,-1045.0,-16.0,,,131103.0,102373.875,409495.5,0.0,0.0,0.0,0.0,0.0,0.0,,94320.0,94320.0,,,,0.0,,,,,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,0.0,89752.5,89752.5,,0.0,,,,,,,0.0,89752.5,89752.5,,0.0,,,,,1.0,-75.0,-75.0,1.0,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.6,1.0,7666.92,7666.92,7666.92,6885.0,6885.0,0.101382,0.101382,-2396.0,-2396.0,-2396.0,10.0,10.0,-2084.0,8.748885,8.748885,1773.0,1773.0,1773.0,1.026432,1.026432,1.026432,,0.102643,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,1.0,7666.92,7666.92,7666.92,67077.0,67077.0,67077.0,6885.0,68850.0,-2396.0,-2396.0,10.0,10.0,-2084.0,8.748885,8.748885,1773.0,1.026432,1.026432,1.026432,365243.0,365243.0,-2360.0,-2360.0,-2090.0,-2090.0,-2090.0,-2090.0,-2090.0,0.0,0.0,0.0,0.0143,0.0143,0.0143,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0.0,,,1.0,,,,,,,,,,,1.0,,


In [88]:
# identify columns not in test_1
for col in train_1:
    if col not in test_1:
        print(col)

TARGET
TYPE_SUITE_FAMILY_STATUS_Group of people_Widow
TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Widow


### 6.2. Merging bureau data into train_2 and test_2
`New customer with bureau report`<br>
[top](#Contents)

In [89]:
print(train_2.shape)
print(test_2.shape)

(14859, 51)
(890, 50)


In [90]:
train_2 = pd.merge(train_2, agg_bureau, on='SK_ID_CURR', how='left')

test_2 = pd.merge(test_2, agg_bureau, on='SK_ID_CURR', how='left')

In [91]:
# get dummies for categorical columns
train_2 = pd.get_dummies(train_2, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

test_2 = pd.get_dummies(test_2, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

In [92]:
print(train_2.shape)
print(test_2.shape)

(14859, 182)
(890, 164)


In [93]:
# identify columns not in test_2
for col in train_2:
    if col not in test_2:
        print(col)

TARGET
NAME_TYPE_SUITE_Group of people
TYPE_SUITE_FAMILY_STATUS_Children_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Children_Separated
TYPE_SUITE_FAMILY_STATUS_Children_Widow
TYPE_SUITE_FAMILY_STATUS_Group of people_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Group of people_Married
TYPE_SUITE_FAMILY_STATUS_Group of people_Separated
TYPE_SUITE_FAMILY_STATUS_Group of people_Single / not married
TYPE_SUITE_FAMILY_STATUS_Other_A_Married
TYPE_SUITE_FAMILY_STATUS_Other_A_Separated
TYPE_SUITE_FAMILY_STATUS_Other_A_Single / not married
TYPE_SUITE_FAMILY_STATUS_Other_A_Widow
TYPE_SUITE_FAMILY_STATUS_Other_B_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Other_B_Single / not married
TYPE_SUITE_FAMILY_STATUS_Other_B_Widow
TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Widow


### 6.3. Merging past data into train_3 and test_3
`Repeat customer with no bureau report`<br>
[top](#Contents)

In [94]:
print(train_3.shape)
print(test_3.shape)

(41433, 51)
(6203, 50)


In [95]:
train_3 = pd.merge(train_3, install_pay_agg, on='SK_ID_CURR', how='left')
train_3 = pd.merge(train_3, cc_agg, on='SK_ID_CURR', how='left')
train_3 = pd.merge(train_3, pos_agg, on='SK_ID_CURR', how='left')
train_3 = pd.merge(train_3, agg_prev, on='SK_ID_CURR', how='left')

test_3 = pd.merge(test_3, install_pay_agg, on='SK_ID_CURR', how='left')
test_3 = pd.merge(test_3, cc_agg, on='SK_ID_CURR', how='left')
test_3 = pd.merge(test_3, pos_agg, on='SK_ID_CURR', how='left')
test_3 = pd.merge(test_3, agg_prev, on='SK_ID_CURR', how='left')

In [96]:
# get dummies for categorical columns
train_3 = pd.get_dummies(train_3, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

test_3 = pd.get_dummies(test_3, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

In [97]:
train_3.head(3)

Unnamed: 0,SK_ID_CURR,TARGET,NAME_CONTRACT_TYPE,CODE_GENDER,FLAG_OWN_CAR,FLAG_OWN_REALTY,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,NAME_INCOME_TYPE,NAME_EDUCATION_TYPE,REGION_POPULATION_RELATIVE,DAYS_REGISTRATION,DAYS_ID_PUBLISH,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,REGION_RATING_CLIENT_W_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_3,FLAG_DOCUMENT_6,FLAG_DOCUMENT_8,FLAG_DOCUMENT_16,FLAG_DOCUMENT_18,NAME_HOUSING_TYPE_CONVERT,AGE,DAYS_EMPLOYED_PENSION,YRS_EMPLOYED,HAVE_CHILDREN,LOAN_INCOME_RATIO,ANNUITY_INCOME_RATIO,CAR_BINS,FAM_MEMBERS_BIN,AVG_EXT_SOURCE,AVG_OBS_CNT_SOCIAL_CIRCLE,AVG_DEF_CNT_SOCIAL_CIRCLE,RATIO_DEF_OBS_SOCIAL_CIRCLE,INS_SK_ID_PREV_NUNIQUE,INS_DAYS_ENTRY_PAYMENT_MEAN,INS_DAYS_ENTRY_PAYMENT_MIN,INS_DAYS_ENTRY_PAYMENT_MAX,INS_AMT_INSTALMENT_MEAN,INS_AMT_INSTALMENT_MIN,INS_AMT_INSTALMENT_MAX,INS_AMT_INSTALMENT_STD,INS_AMT_PAYMENT_MEAN,INS_AMT_PAYMENT_MIN,INS_AMT_PAYMENT_MAX,INS_AMT_PAYMENT_STD,INS_DAYS_BEFORE_DUE_MEAN,INS_DAYS_BEFORE_DUE_MAX,INS_DAYS_BEFORE_DUE_STD,INS_DAYS_PAST_DUE_MEAN,INS_DAYS_PAST_DUE_MAX,INS_DAYS_PAST_DUE_STD,INS_FLAG_LATE_PAY_MEAN,INS_FLAG_LATE_PAY_SUM,INS_INSTALL_PAY_RATIO_MEAN,INS_INSTALL_PAY_RATIO_STD,INS_LATE_PAY_RATIO_MEAN,INS_LATE_PAY_RATIO_STD,INS_SIGNIFICANT_LATE_PAY_MEAN,INS_SIGNIFICANT_LATE_PAY_SUM,INS_FLAG_15DAYS_DUE_MEAN,INS_FLAG_30DAYS_DUE_MEAN,INS_FLAG_60DAYS_DUE_MEAN,INS_PAYMENT_RATIO_MEAN,INS_FLAG_PAYMENT_OVER_MEAN,INS_24M_SK_ID_PREV_SIZE,INS_24M_DAYS_ENTRY_PAYMENT_MEAN,INS_24M_DAYS_ENTRY_PAYMENT_MIN,INS_24M_DAYS_ENTRY_PAYMENT_MAX,INS_24M_AMT_INSTALMENT_MEAN,INS_24M_AMT_INSTALMENT_MIN,INS_24M_AMT_INSTALMENT_MAX,INS_24M_AMT_INSTALMENT_STD,INS_24M_AMT_PAYMENT_MEAN,INS_24M_AMT_PAYMENT_MIN,INS_24M_AMT_PAYMENT_MAX,INS_24M_AMT_PAYMENT_STD,INS_24M_DAYS_BEFORE_DUE_MEAN,INS_24M_DAYS_BEFORE_DUE_MAX,INS_24M_DAYS_BEFORE_DUE_STD,INS_24M_DAYS_PAST_DUE_MEAN,INS_24M_DAYS_PAST_DUE_MAX,INS_24M_DAYS_PAST_DUE_STD,INS_24M_FLAG_LATE_PAY_MEAN,INS_24M_FLAG_LATE_PAY_SUM,INS_24M_INSTALL_PAY_RATIO_MEAN,INS_24M_INSTALL_PAY_RATIO_STD,INS_24M_LATE_PAY_RATIO_MEAN,INS_24M_LATE_PAY_RATIO_STD,INS_24M_SIGNIFICANT_LATE_PAY_MEAN,INS_24M_SIGNIFICANT_LATE_PAY_SUM,INS_24M_FLAG_15DAYS_DUE_MEAN,INS_24M_FLAG_30DAYS_DUE_MEAN,INS_24M_FLAG_60DAYS_DUE_MEAN,INS_24M_PAYMENT_RATIO_MEAN,INS_24M_FLAG_PAYMENT_OVER_MEAN,INS_48M_SK_ID_PREV_SIZE,INS_48M_DAYS_ENTRY_PAYMENT_MEAN,INS_48M_DAYS_ENTRY_PAYMENT_MIN,INS_48M_DAYS_ENTRY_PAYMENT_MAX,INS_48M_AMT_INSTALMENT_MEAN,INS_48M_AMT_INSTALMENT_MIN,INS_48M_AMT_INSTALMENT_MAX,INS_48M_AMT_INSTALMENT_STD,INS_48M_AMT_PAYMENT_MEAN,INS_48M_AMT_PAYMENT_MIN,INS_48M_AMT_PAYMENT_MAX,INS_48M_AMT_PAYMENT_STD,INS_48M_DAYS_BEFORE_DUE_MEAN,INS_48M_DAYS_BEFORE_DUE_MAX,INS_48M_DAYS_BEFORE_DUE_STD,INS_48M_DAYS_PAST_DUE_MEAN,INS_48M_DAYS_PAST_DUE_MAX,INS_48M_DAYS_PAST_DUE_STD,INS_48M_FLAG_LATE_PAY_MEAN,INS_48M_FLAG_LATE_PAY_SUM,INS_48M_INSTALL_PAY_RATIO_MEAN,INS_48M_INSTALL_PAY_RATIO_STD,INS_48M_LATE_PAY_RATIO_MEAN,INS_48M_LATE_PAY_RATIO_STD,INS_48M_SIGNIFICANT_LATE_PAY_MEAN,INS_48M_SIGNIFICANT_LATE_PAY_SUM,INS_48M_FLAG_15DAYS_DUE_MEAN,INS_48M_FLAG_30DAYS_DUE_MEAN,INS_48M_FLAG_60DAYS_DUE_MEAN,INS_48M_PAYMENT_RATIO_MEAN,INS_48M_FLAG_PAYMENT_OVER_MEAN,CC_MONTHS_BALANCE_MIN,CC_AMT_BALANCE_MAX,CC_AMT_BALANCE_MEAN,CC_AMT_CREDIT_LIMIT_ACTUAL_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_MAX,CC_AMT_DRAWINGS_ATM_CURRENT_SUM,CC_AMT_DRAWINGS_CURRENT_MAX,CC_AMT_DRAWINGS_CURRENT_SUM,CC_AMT_DRAWINGS_POS_CURRENT_MAX,CC_AMT_DRAWINGS_POS_CURRENT_SUM,CC_AMT_INST_MIN_REGULARITY_MAX,CC_AMT_INST_MIN_REGULARITY_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_MAX,CC_AMT_PAYMENT_TOTAL_CURRENT_MEAN,CC_AMT_PAYMENT_TOTAL_CURRENT_SUM,CC_AMT_PAYMENT_TOTAL_CURRENT_STD,CC_AMT_TOTAL_RECEIVABLE_MAX,CC_AMT_TOTAL_RECEIVABLE_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_MAX,CC_CNT_DRAWINGS_ATM_CURRENT_MEAN,CC_CNT_DRAWINGS_ATM_CURRENT_SUM,CC_CNT_DRAWINGS_CURRENT_MAX,CC_CNT_DRAWINGS_CURRENT_MEAN,CC_CNT_DRAWINGS_CURRENT_SUM,CC_CNT_DRAWINGS_POS_CURRENT_MAX,CC_CNT_DRAWINGS_POS_CURRENT_MEAN,CC_CNT_DRAWINGS_POS_CURRENT_SUM,CC_SK_DPD_MAX,CC_SK_DPD_MEAN,CC_SK_DPD_SUM,CC_SK_DPD_DEF_MAX,CC_SK_DPD_DEF_SUM,CC_USAGE_RATIO_MAX,CC_USAGE_RATIO_MEAN,CC_PAYMENT_RATE_MIN,CC_PAYMENT_RATE_MEAN,CC_DRAWING_LIMIT_RATE_MAX,CC_DRAWING_LIMIT_RATE_MEAN,CC_FLAG_15DAYS_DUE_SUM,CC_FLAG_30DAYS_DUE_SUM,CC_FLAG_60DAYS_DUE_SUM,INS_12M_AMT_BALANCE_MAX,INS_12M_AMT_BALANCE_MEAN,INS_12M_SK_DPD_MAX,INS_12M_SK_DPD_MEAN,INS_12M_SK_DPD_SUM,INS_12M_USAGE_RATIO_MAX,INS_12M_USAGE_RATIO_MEAN,INS_12M_FLAG_15DAYS_DUE_SUM,INS_12M_FLAG_30DAYS_DUE_SUM,INS_12M_FLAG_60DAYS_DUE_SUM,INS_24M_AMT_BALANCE_MAX,INS_24M_AMT_BALANCE_MEAN,INS_24M_SK_DPD_MAX,INS_24M_SK_DPD_MEAN,INS_24M_SK_DPD_SUM,INS_24M_USAGE_RATIO_MAX,INS_24M_USAGE_RATIO_MEAN,INS_24M_FLAG_15DAYS_DUE_SUM,INS_24M_FLAG_30DAYS_DUE_SUM,INS_24M_FLAG_60DAYS_DUE_SUM,INS_36M_AMT_BALANCE_MAX,INS_36M_AMT_BALANCE_MEAN,INS_36M_SK_DPD_MAX,INS_36M_SK_DPD_MEAN,INS_36M_SK_DPD_SUM,INS_36M_USAGE_RATIO_MAX,INS_36M_USAGE_RATIO_MEAN,INS_36M_FLAG_15DAYS_DUE_SUM,INS_36M_FLAG_30DAYS_DUE_SUM,INS_36M_FLAG_60DAYS_DUE_SUM,POS_SK_ID_PREV_NUNIQUE,POS_MONTHS_BALANCE_MIN,POS_MONTHS_BALANCE_MAX,POS_MONTHS_BALANCE_SIZE,POS_SK_DPD_MAX,POS_SK_DPD_MEAN,POS_SK_DPD_SUM,POS_SK_DPD_STD,POS_SK_DPD_DEF_MAX,POS_SK_DPD_DEF_MEAN,POS_SK_DPD_DEF_SUM,POS_FLAG_LATE_PAYMENT_MEAN,POS_NAME_CONTRACT_STATUS_Active_MEAN,POS_NAME_CONTRACT_STATUS_Approved_MEAN,POS_NAME_CONTRACT_STATUS_Canceled_MEAN,POS_NAME_CONTRACT_STATUS_Completed_MEAN,POS_NAME_CONTRACT_STATUS_Demand_MEAN,POS_NAME_CONTRACT_STATUS_Returned to the store_MEAN,POS_NAME_CONTRACT_STATUS_Signed_MEAN,POS_LOAN_COMPLETED_MEAN,POS_COMPLETED_BEFORE_MEAN,POS_REMAINING_INSTALMENTS,POS_REMAINING_INSTALMENTS_RATIO,PREV_SK_ID_PREV_NUNIQUE,PREV_AMT_ANNUITY_MIN,PREV_AMT_ANNUITY_MAX,PREV_AMT_ANNUITY_MEAN,PREV_AMT_DOWN_PAYMENT_MAX,PREV_AMT_DOWN_PAYMENT_MEAN,PREV_RATE_DOWN_PAYMENT_MAX,PREV_RATE_DOWN_PAYMENT_MEAN,PREV_DAYS_DECISION_MIN,PREV_DAYS_DECISION_MAX,PREV_DAYS_DECISION_MEAN,PREV_CNT_PAYMENT_MAX,PREV_CNT_PAYMENT_MEAN,PREV_DAYS_TERMINATION_MAX,PREV_CREDIT_TO_ANNUITY_RATIO_MEAN,PREV_CREDIT_TO_ANNUITY_RATIO_MAX,PREV_APPLICATION_CREDIT_DIFF_MIN,PREV_APPLICATION_CREDIT_DIFF_MAX,PREV_APPLICATION_CREDIT_DIFF_MEAN,PREV_APPLICATION_CREDIT_RATIO_MIN,PREV_APPLICATION_CREDIT_RATIO_MAX,PREV_APPLICATION_CREDIT_RATIO_MEAN,PREV_APPLICATION_CREDIT_RATIO_STD,PREV_DOWN_PAYMENT_TO_CREDIT_MEAN,PREV_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_NAME_CONTRACT_TYPE_XNA_MEAN,PREV_NAME_CONTRACT_STATUS_Approved_MEAN,PREV_NAME_CONTRACT_STATUS_Canceled_MEAN,PREV_NAME_CONTRACT_STATUS_Refused_MEAN,PREV_NAME_CONTRACT_STATUS_Unused offer_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN,PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN,PREV_NAME_TYPE_SUITE_Children_MEAN,PREV_NAME_TYPE_SUITE_Family_MEAN,PREV_NAME_TYPE_SUITE_Group of people_MEAN,PREV_NAME_TYPE_SUITE_Other_A_MEAN,PREV_NAME_TYPE_SUITE_Other_B_MEAN,"PREV_NAME_TYPE_SUITE_Spouse, partner_MEAN",PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN,PREV_NAME_CLIENT_TYPE_New_MEAN,PREV_NAME_CLIENT_TYPE_Refreshed_MEAN,PREV_NAME_CLIENT_TYPE_Repeater_MEAN,PREV_NAME_CLIENT_TYPE_XNA_MEAN,PREV_NAME_PRODUCT_TYPE_walk-in_MEAN,PREV_NAME_PRODUCT_TYPE_x-sell_MEAN,PREV_CHANNEL_TYPE_AP+ (Cash loan)_MEAN,PREV_CHANNEL_TYPE_Car dealer_MEAN,PREV_CHANNEL_TYPE_Channel of corporate sales_MEAN,PREV_CHANNEL_TYPE_Contact center_MEAN,PREV_CHANNEL_TYPE_Credit and cash offices_MEAN,PREV_CHANNEL_TYPE_Regional / Local_MEAN,PREV_CHANNEL_TYPE_Stone_MEAN,PREV_NAME_YIELD_GROUP_XNA_MEAN,PREV_NAME_YIELD_GROUP_high_MEAN,PREV_NAME_YIELD_GROUP_low_action_MEAN,PREV_NAME_YIELD_GROUP_low_normal_MEAN,PREV_NAME_YIELD_GROUP_middle_MEAN,PREV_PRODUCT_COMBINATION_Card Street_MEAN,PREV_PRODUCT_COMBINATION_Card X-Sell_MEAN,PREV_PRODUCT_COMBINATION_Cash_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: high_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: low_MEAN,PREV_PRODUCT_COMBINATION_Cash Street: middle_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: high_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: low_MEAN,PREV_PRODUCT_COMBINATION_Cash X-Sell: middle_MEAN,PREV_PRODUCT_COMBINATION_POS household with interest_MEAN,PREV_PRODUCT_COMBINATION_POS household without interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry with interest_MEAN,PREV_PRODUCT_COMBINATION_POS industry without interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile with interest_MEAN,PREV_PRODUCT_COMBINATION_POS mobile without interest_MEAN,PREV_PRODUCT_COMBINATION_POS other with interest_MEAN,PREV_PRODUCT_COMBINATION_POS others without interest_MEAN,PREV_HOUR_APPR_PROCESS_START_afternoon_MEAN,PREV_HOUR_APPR_PROCESS_START_dusk_MEAN,PREV_HOUR_APPR_PROCESS_START_morning_MEAN,PREV_ACTIVE_SK_ID_PREV_NUNIQUE,PREV_ACTIVE_SIMPLE_INTERESTS_MEAN,PREV_ACTIVE_AMT_ANNUITY_MAX,PREV_ACTIVE_AMT_ANNUITY_SUM,PREV_ACTIVE_AMT_APPLICATION_MAX,PREV_ACTIVE_AMT_APPLICATION_MEAN,PREV_ACTIVE_AMT_CREDIT_SUM,PREV_ACTIVE_AMT_DOWN_PAYMENT_MAX,PREV_ACTIVE_AMT_DOWN_PAYMENT_MEAN,PREV_ACTIVE_DAYS_DECISION_MIN,PREV_ACTIVE_DAYS_DECISION_MEAN,PREV_ACTIVE_CNT_PAYMENT_MEAN,PREV_ACTIVE_CNT_PAYMENT_SUM,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_ACTIVE_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_ACTIVE_AMT_PAYMENT_SUM,PREV_ACTIVE_INSTALMENT_PAYMENT_DIFF_MEAN,PREV_ACTIVE_INSTALMENT_PAYMENT_DIFF_MAX,PREV_ACTIVE_REMAINING_DEBT_MAX,PREV_ACTIVE_REMAINING_DEBT_MEAN,PREV_ACTIVE_REMAINING_DEBT_SUM,PREV_ACTIVE_REPAYMENT_RATIO_MEAN,TOTAL_REPAYMENT_RATIO,APPROVED_SK_ID_PREV_NUNIQUE,APPROVED_AMT_ANNUITY_MIN,APPROVED_AMT_ANNUITY_MAX,APPROVED_AMT_ANNUITY_MEAN,APPROVED_AMT_CREDIT_MIN,APPROVED_AMT_CREDIT_MAX,APPROVED_AMT_CREDIT_MEAN,APPROVED_AMT_DOWN_PAYMENT_MAX,APPROVED_AMT_GOODS_PRICE_MAX,APPROVED_DAYS_DECISION_MIN,APPROVED_DAYS_DECISION_MEAN,APPROVED_CNT_PAYMENT_MAX,APPROVED_CNT_PAYMENT_MEAN,APPROVED_DAYS_TERMINATION_MEAN,APPROVED_CREDIT_TO_ANNUITY_RATIO_MEAN,APPROVED_CREDIT_TO_ANNUITY_RATIO_MAX,APPROVED_APPLICATION_CREDIT_DIFF_MAX,APPROVED_APPLICATION_CREDIT_RATIO_MIN,APPROVED_APPLICATION_CREDIT_RATIO_MAX,APPROVED_APPLICATION_CREDIT_RATIO_MEAN,APPROVED_DAYS_FIRST_DRAWING_MAX,APPROVED_DAYS_FIRST_DRAWING_MEAN,APPROVED_DAYS_FIRST_DUE_MIN,APPROVED_DAYS_FIRST_DUE_MEAN,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MIN,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MAX,APPROVED_DAYS_LAST_DUE_1ST_VERSION_MEAN,APPROVED_DAYS_LAST_DUE_MAX,APPROVED_DAYS_LAST_DUE_MEAN,APPROVED_DAYS_LAST_DUE_DIFF_MIN,APPROVED_DAYS_LAST_DUE_DIFF_MAX,APPROVED_DAYS_LAST_DUE_DIFF_MEAN,APPROVED_SIMPLE_INTERESTS_MIN,APPROVED_SIMPLE_INTERESTS_MAX,APPROVED_SIMPLE_INTERESTS_MEAN,APPROVED_SIMPLE_INTERESTS_STD,REFUSED_AMT_APPLICATION_MAX,REFUSED_AMT_APPLICATION_MEAN,REFUSED_AMT_CREDIT_MIN,REFUSED_AMT_CREDIT_MAX,REFUSED_DAYS_DECISION_MIN,REFUSED_DAYS_DECISION_MAX,REFUSED_DAYS_DECISION_MEAN,REFUSED_CNT_PAYMENT_MAX,REFUSED_CNT_PAYMENT_MEAN,REFUSED_APPLICATION_CREDIT_DIFF_MIN,REFUSED_APPLICATION_CREDIT_DIFF_MAX,REFUSED_APPLICATION_CREDIT_DIFF_MEAN,REFUSED_APPLICATION_CREDIT_DIFF_STD,REFUSED_APPLICATION_CREDIT_RATIO_MIN,REFUSED_APPLICATION_CREDIT_RATIO_MEAN,REFUSED_NAME_CONTRACT_TYPE_Consumer loans_MEAN,REFUSED_NAME_CONTRACT_TYPE_Cash loans_MEAN,REFUSED_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_LAST12M_AMT_CREDIT_SUM,PREV_LAST12M_AMT_ANNUITY_MEAN,PREV_LAST12M_AMT_ANNUITY_MAX,PREV_LAST12M_SIMPLE_INTERESTS_MEAN,PREV_LAST12M_SIMPLE_INTERESTS_MAX,PREV_LAST12M_SIMPLE_INTERESTS_STD,PREV_LAST12M_DAYS_DECISION_MIN,PREV_LAST12M_DAYS_DECISION_MEAN,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_LAST12M_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_LAST12M_APPLICATION_CREDIT_DIFF_MIN,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MIN,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MAX,PREV_LAST12M_APPLICATION_CREDIT_RATIO_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_LAST12M_NAME_CONTRACT_TYPE_Revolving loans_MEAN,PREV_LAST24M_AMT_CREDIT_SUM,PREV_LAST24M_AMT_ANNUITY_MEAN,PREV_LAST24M_AMT_ANNUITY_MAX,PREV_LAST24M_SIMPLE_INTERESTS_MEAN,PREV_LAST24M_SIMPLE_INTERESTS_MAX,PREV_LAST24M_SIMPLE_INTERESTS_STD,PREV_LAST24M_DAYS_DECISION_MIN,PREV_LAST24M_DAYS_DECISION_MEAN,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MIN,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MAX,PREV_LAST24M_DAYS_LAST_DUE_1ST_VERSION_MEAN,PREV_LAST24M_APPLICATION_CREDIT_DIFF_MIN,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MIN,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MAX,PREV_LAST24M_APPLICATION_CREDIT_RATIO_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Consumer loans_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Cash loans_MEAN,PREV_LAST24M_NAME_CONTRACT_TYPE_Revolving loans_MEAN,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group of people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse, partner",NAME_TYPE_SUITE_Unaccompanied,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,NAME_FAMILY_STATUS_Civil marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single / not married,NAME_FAMILY_STATUS_Widow,TYPE_SUITE_FAMILY_STATUS_Children_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Children_Married,TYPE_SUITE_FAMILY_STATUS_Children_Separated,TYPE_SUITE_FAMILY_STATUS_Children_Single / not married,TYPE_SUITE_FAMILY_STATUS_Children_Widow,TYPE_SUITE_FAMILY_STATUS_Family_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Family_Married,TYPE_SUITE_FAMILY_STATUS_Family_Separated,TYPE_SUITE_FAMILY_STATUS_Family_Single / not married,TYPE_SUITE_FAMILY_STATUS_Family_Widow,TYPE_SUITE_FAMILY_STATUS_Group of people_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Group of people_Married,TYPE_SUITE_FAMILY_STATUS_Group of people_Separated,TYPE_SUITE_FAMILY_STATUS_Group of people_Single / not married,TYPE_SUITE_FAMILY_STATUS_Group of people_Widow,TYPE_SUITE_FAMILY_STATUS_Other_A_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Other_A_Married,TYPE_SUITE_FAMILY_STATUS_Other_A_Separated,TYPE_SUITE_FAMILY_STATUS_Other_A_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_A_Widow,TYPE_SUITE_FAMILY_STATUS_Other_B_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Other_B_Married,TYPE_SUITE_FAMILY_STATUS_Other_B_Separated,TYPE_SUITE_FAMILY_STATUS_Other_B_Single / not married,TYPE_SUITE_FAMILY_STATUS_Other_B_Widow,"TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Civil marriage","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Married","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Separated","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Single / not married","TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Widow",TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil marriage,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single / not married,TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow,PROCESS_START_PERIOD_afternoon,PROCESS_START_PERIOD_dusk,PROCESS_START_PERIOD_morning
0,100006,0,1,0,0,1,135000.0,312682.5,29686.5,4,2,0.008019,-9833.0,-2437,1,0,1,0,2,0,0,0,0,2.0,0.0,2.0,0.0,-617.0,1,0,0,0,0,1,52.068493,0,8.326027,0,2.316167,0.2199,0,2.0,0.650442,2.0,0.0,0.0,3.0,-271.625,-575.0,-12.0,62947.088438,2482.92,691786.89,168097.624347,62947.088438,2482.92,691786.89,168097.624347,19.375,77.0,25.397835,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,16.0,-271.625,-575.0,-12.0,62947.088438,2482.92,691786.89,168097.624347,62947.088438,2482.92,691786.89,168097.624347,19.375,77.0,25.397835,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,16.0,-271.625,-575.0,-12.0,62947.088438,2482.92,691786.89,168097.624347,62947.088438,2482.92,691786.89,168097.624347,19.375,77.0,25.397835,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,-6.0,0.0,0.0,270000.0,,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,9.0,2482.92,39954.51,23651.175,66987.0,34840.17,0.21783,0.163412,-617.0,-181.0,-272.444444,48.0,23.0,-143.0,17.767287,27.839644,-218115.0,66987.0,-19492.24,0.759418,1.250017,1.010763,0.164441,0.180612,0.555556,0.222222,0.222222,0.0,0.555556,0.333333,0.111111,0.0,0.0,0.111111,0.0,0.666667,0.0,0.111111,0.111111,0.0,0.111111,0.0,0.0,0.0,0.0,0.333333,0.111111,0.0,0.888889,0.0,0.0,0.444444,0.0,0.0,0.0,0.0,0.777778,0.0,0.111111,0.444444,0.222222,0.0,0.222222,0.111111,0.111111,0.111111,0.222222,0.0,0.0,0.0,0.111111,0.222222,0.0,0.111111,0.0,0.111111,0.0,0.0,0.0,0.0,0.0,0.888889,0.0,0.111111,2.0,-inf,29027.52,42527.52,334917.0,302458.5,537930.0,66987.0,66987.0,-311.0,-246.0,6.0,12.0,49.0,365243.0,182646.0,290275.2,0.0,0.0,-22345.2,-22345.2,-22345.2,1.083399,0.539615,5.0,2482.92,39954.51,21842.19,24219.0,675000.0,343728.9,66987.0,675000.0,-617.0,-345.6,48.0,18.0,182481.75,15.775037,27.839644,66987.0,0.943934,1.250017,1.061032,365243.0,365243.0,-545.0,91066.5,-215.0,365243.0,91584.0,365243.0,182477.5,-365194.0,1410.0,-90893.5,-inf,0.027424,-inf,,688500.0,688500.0,906615.0,906615.0,-181.0,-181.0,-181.0,48.0,48.0,-218115.0,-218115.0,-218115.0,,0.759418,0.759418,0.0,1.0,0.0,2119545.0,24867.405,32696.1,-inf,0.025007,,-311.0,-199.571429,49.0,1259.0,654.0,-218115.0,0.759418,1.250017,1.002359,0.142857,0.571429,0.285714,2625259.5,23651.175,39954.51,-inf,0.027424,,-617.0,-272.444444,-215.0,1259.0,364.333333,-218115.0,0.759418,1.250017,1.010763,0.222222,0.555556,0.222222,0,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0
1,100012,0,0,1,0,1,135000.0,405000.0,20250.0,4,2,0.019689,-14437.0,-3992,1,0,1,0,2,0,0,0,0,2.0,0.0,2.0,0.0,-1673.0,0,0,0,0,0,1,39.641096,0,5.531507,0,3.0,0.15,0,1.0,0.746644,2.0,0.0,0.0,3.0,-690.3125,-1645.0,-151.0,9584.503125,3012.075,49204.89,7844.551914,10451.285625,5.85,58687.245,11553.379435,25.875,90.0,23.119141,0.5625,14.0,2.23993,0.104167,5.0,1.049621,0.788977,0.064124,0.22442,0.083333,4.0,0.0,0.0,0.0,1.265909,0.041667,37.0,-443.702703,-832.0,-151.0,11331.765,5242.86,49204.89,8072.854978,12619.054459,883.485,58687.245,12295.536496,31.837838,90.0,22.632957,0.27027,5.0,1.146217,0.054054,2.0,1.118427,0.870791,0.029186,0.164559,0.027027,1.0,0.0,0.0,0.0,1.344963,0.054054,48.0,-690.3125,-1645.0,-151.0,9584.503125,3012.075,49204.89,7844.551914,10451.285625,5.85,58687.245,11553.379435,25.875,90.0,23.119141,0.5625,14.0,2.23993,0.104167,5.0,1.049621,0.788977,0.064124,0.22442,0.083333,4.0,0.0,0.0,0.0,1.265909,0.041667,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,-16.0,-7.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11.0,0.569444,4.0,3012.075,11188.035,7894.155,0.0,0.0,0.0,0.0,-1673.0,-107.0,-779.75,24.0,18.0,-137.0,11.36203,14.167635,-24273.0,0.0,-13189.5,0.787588,0.851692,0.809751,0.036342,0.0,0.75,0.25,0.0,0.0,0.75,0.25,0.0,0.0,0.25,0.25,0.0,0.25,0.25,0.0,0.0,0.0,0.25,0.0,0.0,0.0,0.0,0.25,0.25,0.0,0.75,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.75,0.0,0.0,0.25,0.75,0.0,0.0,0.0,0.0,0.0,0.25,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.25,0.0,0.0,0.0,0.75,0.0,0.25,,,,,,,,,,,,,,,,,,,,,,,,,3.0,3012.075,11188.035,7894.155,23697.0,158508.0,98826.0,0.0,135000.0,-1673.0,-1004.0,24.0,18.0,-559.333333,11.36203,14.167635,-4977.0,0.787588,0.851692,0.809751,365243.0,365243.0,-1641.0,-973.333333,-1311.0,33.0,-463.333333,-142.0,-563.333333,30.0,180.0,100.0,0.027424,0.043775,0.033372,0.00904,,,,,,,,,,,,,,,,,,,0.0,,,,,,-107.0,-107.0,,,,0.0,,,,0.0,1.0,0.0,114273.0,9482.355,9482.355,0.027424,0.027424,,-507.0,-307.0,33.0,33.0,33.0,-24273.0,0.787588,0.787588,0.787588,0.0,1.0,0.0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1
2,100018,0,1,0,0,1,189000.0,773680.5,32778.0,4,2,0.010006,-615.0,-2056,1,0,1,0,1,0,0,0,0,0.0,0.0,0.0,0.0,-188.0,1,0,0,0,0,1,39.953425,0,0.556164,0,4.093548,0.173429,0,2.0,0.682298,0.0,0.0,0.0,3.0,-1004.208333,-1628.0,-40.0,49114.6425,4109.265,94906.035,32760.657332,49114.6425,4109.265,94906.035,32760.657332,6.875,21.0,6.422193,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,5.0,-103.8,-170.0,-40.0,4180.365,4180.365,4180.365,0.0,4180.365,4180.365,4180.365,0.0,14.8,21.0,5.403702,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,24.0,-1004.208333,-1628.0,-40.0,49114.6425,4109.265,94906.035,32760.657332,49114.6425,4109.265,94906.035,32760.657332,6.875,21.0,6.422193,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,-49.0,-27.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.392857,4.0,4180.365,94906.035,38669.70375,57181.5,14295.375,0.108917,0.027229,-1648.0,-188.0,-755.25,12.0,10.0,-784.0,8.308475,10.553692,-7686.0,57181.5,12373.875,0.863229,1.11112,0.993587,0.101472,0.02778,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.25,0.25,0.0,0.0,0.25,0.25,0.0,0.0,0.25,0.0,0.0,0.0,0.25,0.0,0.25,0.0,0.5,0.25,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.25,0.0,0.75,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.25,0.25,0.0,0.0,1.0,0.0,0.0,1.0,0.01358,4180.365,4180.365,36805.365,36805.365,36805.365,0.0,0.0,-188.0,-188.0,10.0,10.0,121.0,121.0,121.0,20901.825,0.0,0.0,15903.54,15903.54,15903.54,0.567902,0.567902,4.0,4180.365,94906.035,38669.70375,36805.365,536364.0,285989.59125,57181.5,571774.5,-1648.0,-755.25,12.0,10.0,121061.333333,8.308475,10.553692,57181.5,0.863229,1.11112,0.993587,365243.0,365243.0,-1613.0,-905.666667,-1283.0,121.0,-655.666667,365243.0,121057.666667,-365122.0,0.0,-121713.333333,0.010277,0.038257,0.018384,0.01332,,,,,,,,,,,,,,,,,,,93001.365,5506.6275,6832.89,0.025919,0.038257,0.017449,-196.0,-192.0,121.0,121.0,121.0,-7686.0,0.863229,1.0,0.931614,1.0,0.0,0.0,93001.365,5506.6275,6832.89,0.025919,0.038257,0.017449,-196.0,-192.0,121.0,121.0,121.0,-7686.0,0.863229,1.0,0.931614,1.0,0.0,0.0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1
3,100021,0,0,0,0,1,81000.0,270000.0,13500.0,4,2,0.010966,-4143.0,-2427,1,0,1,0,2,0,0,1,1,4.0,0.0,4.0,0.0,-2811.0,0,0,0,0,0,1,26.783562,0,0.523288,1,3.333333,0.166667,0,3.0,0.683513,4.0,0.0,0.0,4.0,-1023.217391,-2776.0,-66.0,9059.022391,2705.76,52236.18,10161.055403,9059.022391,2705.76,52236.18,10161.055403,14.73913,46.0,14.510865,2.434783,15.0,5.434119,0.173913,4.0,1.0,0.0,0.173913,0.387553,0.173913,4.0,0.043478,0.0,0.0,1.0,0.0,17.0,-433.529412,-826.0,-66.0,11300.265,4992.03,52236.18,11022.964318,11300.265,4992.03,52236.18,11022.964318,17.705882,46.0,13.98108,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,17.0,-433.529412,-826.0,-66.0,11300.265,4992.03,52236.18,11022.964318,11300.265,4992.03,52236.18,11022.964318,17.705882,46.0,13.98108,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,-18.0,0.0,0.0,675000.0,,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,-25.0,-9.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,21.0,1.75,6.0,2709.45,33750.0,10686.165,9922.5,3770.1,0.433539,0.106606,-2811.0,-261.0,-943.833333,12.0,7.0,-332.0,9.38907,20.0,-675000.0,8928.0,-112654.5,0.0,1.661333,0.911771,0.530061,0.152374,0.0,0.833333,0.166667,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.166667,0.333333,0.166667,0.333333,0.0,0.0,0.0,0.0,0.0,0.5,0.166667,0.166667,0.166667,0.666667,0.0,0.0,0.166667,0.0,0.0,0.0,0.0,0.166667,0.333333,0.0,0.166667,0.0,0.0,0.333333,0.5,0.0,0.166667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.666667,0.0,0.0,0.0,0.166667,0.0,0.0,0.0,1.0,0.0,0.0,2.0,-inf,33750.0,41174.865,71950.5,35975.25,754546.5,0.0,0.0,-549.0,-405.0,6.0,12.0,100.0,365243.0,182671.5,59398.92,0.0,0.0,20147.58,20147.58,20147.58,0.746719,0.078721,6.0,2709.45,33750.0,10686.165,13500.0,675000.0,153615.75,9922.5,99189.0,-2811.0,-943.833333,12.0,7.0,72234.4,9.38907,20.0,8928.0,0.0,1.661333,0.911771,365243.0,365243.0,-2772.0,72171.4,-2622.0,365243.0,72363.4,365243.0,145338.0,-365143.0,180.0,-72974.6,-inf,0.034033,-inf,,,,,,,,,,,,,,,,,,,,79546.5,7424.865,7424.865,0.010007,0.010007,,-261.0,-261.0,100.0,100.0,100.0,-7596.0,0.904509,0.904509,0.904509,1.0,0.0,0.0,809500.5,12789.73125,33750.0,-inf,0.015014,,-596.0,-500.5,-415.0,100.0,-157.5,-675000.0,0.0,0.949885,0.70107,0.75,0.0,0.25,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1
4,100034,0,0,1,0,1,90000.0,180000.0,9000.0,4,4,0.030755,-4799.0,-3015,1,0,1,0,2,0,0,0,0,0.0,0.0,0.0,0.0,-599.0,0,0,0,0,0,0,28.331507,0,2.767123,0,2.0,0.1,0,1.0,0.400346,0.0,0.0,0.0,2.0,-415.2,-584.0,-189.0,25285.5765,13888.98,61969.77,14569.598569,31135.5765,13888.98,61969.77,20138.915622,19.0,51.0,17.613126,0.0,0.0,0.0,0.0,0.0,1.222993,0.524439,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.645986,0.2,10.0,-415.2,-584.0,-189.0,25285.5765,13888.98,61969.77,14569.598569,31135.5765,13888.98,61969.77,20138.915622,19.0,51.0,17.613126,0.0,0.0,0.0,0.0,0.0,1.222993,0.524439,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.645986,0.2,10.0,-415.2,-584.0,-189.0,25285.5765,13888.98,61969.77,14569.598569,31135.5765,13888.98,61969.77,20138.915622,19.0,51.0,17.613126,0.0,0.0,0.0,0.0,0.0,1.222993,0.524439,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.645986,0.2,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,-18.0,-18.0,1.0,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.666667,2.0,21281.13,22430.43,21855.78,12145.5,12145.5,0.103967,0.103967,-599.0,-288.0,-443.5,6.0,6.0,-163.0,5.155254,5.407749,-15471.0,6372.0,-4549.5,0.859317,1.055369,0.957343,0.138629,0.105537,0.5,0.5,0.0,0.0,1.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.5,0.0,0.5,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.5,0.5,0.0,0.0,0.5,0.0,0.0,0.5,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.5,,,,,,,,,,,,,,,,,,,,,,,,,2.0,21281.13,22430.43,21855.78,109971.0,115083.0,112527.0,12145.5,121455.0,-599.0,-443.5,6.0,6.0,-303.0,5.155254,5.407749,6372.0,0.859317,1.055369,0.957343,365243.0,365243.0,-569.0,-413.0,-419.0,-107.0,-263.0,-167.0,-308.0,30.0,60.0,45.0,0.018253,0.0373,0.027777,0.013468,,,,,,,,,,,,,,,,,,,115083.0,21281.13,21281.13,0.018253,0.018253,,-288.0,-288.0,-107.0,-107.0,-107.0,6372.0,1.055369,1.055369,1.055369,1.0,0.0,0.0,225054.0,21855.78,22430.43,0.027777,0.0373,0.013468,-599.0,-443.5,-419.0,-107.0,-263.0,-15471.0,0.859317,1.055369,0.957343,0.5,0.5,0.0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0


In [98]:
for i in ['morning', 'afternoon', 'dusk']:
    train_3[f'APPR_PROCESS_START_DIV_{i}'] = train_3.apply(lambda x: np.nan if x[f'PROCESS_START_PERIOD_{i}']==0 
                                                              else (x[f'PROCESS_START_PERIOD_{i}'] - x[f'PREV_HOUR_APPR_PROCESS_START_{i}_MEAN']), axis=1)
    
    test_3[f'APPR_PROCESS_START_DIV_{i}'] = test_3.apply(lambda x: np.nan if x[f'PROCESS_START_PERIOD_{i}']==0 
                                                              else (x[f'PROCESS_START_PERIOD_{i}'] - x[f'PREV_HOUR_APPR_PROCESS_START_{i}_MEAN']), axis=1)
    
for j in ['Children', 'Family', 'Group of people', 'Other_A', 'Other_B', 'Spouse, partner', 'Unaccompanied']:
    train_3[f'NAME_TYPE_SUITE_DIV_{j}'] = train_3.apply(lambda x: np.nan if x[f'NAME_TYPE_SUITE_{j}']==0
                                                            else (x[f'NAME_TYPE_SUITE_{j}'] - x[f'PREV_NAME_TYPE_SUITE_{j}_MEAN']), axis=1)
    
    test_3[f'NAME_TYPE_SUITE_DIV_{j}'] = test_3.apply(lambda x: np.nan if x[f'NAME_TYPE_SUITE_{j}']==0
                                                            else (x[f'NAME_TYPE_SUITE_{j}'] - x[f'PREV_NAME_TYPE_SUITE_{j}_MEAN']), axis=1)
    
for k in ['MONDAY', 'TUESDAY', 'WEDNESDAY', 'THURSDAY', 'FRIDAY', 'SATURDAY', 'SUNDAY']:
    train_3[f'WEEKDAY_APPR_PROCESS_DIV_{k}'] = train_3.apply(lambda x: np.nan if x[f'WEEKDAY_APPR_PROCESS_START_{k}']==0
                                                            else (x[f'WEEKDAY_APPR_PROCESS_START_{k}'] - x[f'PREV_WEEKDAY_APPR_PROCESS_START_{k}_MEAN']), axis=1)
    
    test_3[f'WEEKDAY_APPR_PROCESS_DIV_{k}'] = test_3.apply(lambda x: np.nan if x[f'WEEKDAY_APPR_PROCESS_START_{k}']==0
                                                            else (x[f'WEEKDAY_APPR_PROCESS_START_{k}'] - x[f'PREV_WEEKDAY_APPR_PROCESS_START_{k}_MEAN']), axis=1)

In [99]:
print(train_3.shape)
print(test_3.shape)

(41433, 505)
(6203, 498)


In [100]:
# identify columns not in test_3
for col in train_3:
    if col not in test_3:
        print(col)

TARGET
TYPE_SUITE_FAMILY_STATUS_Group of people_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Group of people_Separated
TYPE_SUITE_FAMILY_STATUS_Group of people_Widow
TYPE_SUITE_FAMILY_STATUS_Other_A_Separated
TYPE_SUITE_FAMILY_STATUS_Other_A_Widow
TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Widow


### 6.4. Preparing data for train_4 and test_4
`New customer with no bureau report`<br>
[top](#Contents)

In [101]:
print(train_4.shape)
print(test_4.shape)

(2587, 51)
(221, 50)


In [102]:
# get dummies for categorical columns
train_4 = pd.get_dummies(train_4, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

test_4 = pd.get_dummies(test_4, columns=['NAME_TYPE_SUITE', 'WEEKDAY_APPR_PROCESS_START', 'NAME_FAMILY_STATUS', 'TYPE_SUITE_FAMILY_STATUS', 'PROCESS_START_PERIOD'])

In [103]:
print(train_4.shape)
print(test_4.shape)

(2587, 96)
(221, 77)


In [104]:
# identify columns not in test_4
for col in train_4:
    if col not in test_4:
        print(col)

TARGET
NAME_TYPE_SUITE_Children
NAME_TYPE_SUITE_Other_B
TYPE_SUITE_FAMILY_STATUS_Children_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Children_Married
TYPE_SUITE_FAMILY_STATUS_Children_Single / not married
TYPE_SUITE_FAMILY_STATUS_Children_Widow
TYPE_SUITE_FAMILY_STATUS_Family_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Family_Separated
TYPE_SUITE_FAMILY_STATUS_Group of people_Widow
TYPE_SUITE_FAMILY_STATUS_Other_A_Married
TYPE_SUITE_FAMILY_STATUS_Other_A_Single / not married
TYPE_SUITE_FAMILY_STATUS_Other_B_Civil marriage
TYPE_SUITE_FAMILY_STATUS_Other_B_Married
TYPE_SUITE_FAMILY_STATUS_Other_B_Separated
TYPE_SUITE_FAMILY_STATUS_Other_B_Single / not married
TYPE_SUITE_FAMILY_STATUS_Other_B_Widow
TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Separated
TYPE_SUITE_FAMILY_STATUS_Spouse, partner_Single / not married


### 6.5. Identifying alternative features and saving files for modeling
[top](#Contents)

In [105]:
# rename column name so that it can be read into the lightgb model
train_1 = train_1.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 
train_2 = train_2.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 
train_3 = train_3.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 
train_4 = train_4.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 

test_1 = test_1.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 
test_2 = test_2.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 
test_3 = test_3.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 
test_4 = test_4.rename(columns = lambda x:re.sub('[^A-Za-z0-9_]+', '_', x)) 

In [106]:
# for group 1:

to_drop_for_train_1 = [
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Widow',
]

alternative_feat_1 = [
    'DAYS_ID_PUBLISH',
    'FLAG_EMP_PHONE',
    'FLAG_WORK_PHONE',
    'FLAG_CONT_MOBILE', 
    'FLAG_PHONE',
    'REGION_RATING_CLIENT_W_CITY',
    'REG_REGION_NOT_LIVE_REGION',
    'REG_REGION_NOT_WORK_REGION',
    'REG_CITY_NOT_LIVE_CITY',
    'REG_CITY_NOT_WORK_CITY',
    'OBS_30_CNT_SOCIAL_CIRCLE', 
    'DEF_30_CNT_SOCIAL_CIRCLE',
    'OBS_60_CNT_SOCIAL_CIRCLE',
    'DEF_60_CNT_SOCIAL_CIRCLE', 
    'DAYS_LAST_PHONE_CHANGE', 
    'CAR_BINS',
    'FAM_MEMBERS_BIN', 
    'AVG_OBS_CNT_SOCIAL_CIRCLE', 
    'AVG_DEF_CNT_SOCIAL_CIRCLE', 
    'RATIO_DEF_OBS_SOCIAL_CIRCLE',
    'NAME_TYPE_SUITE_Children',
    'NAME_TYPE_SUITE_Family',
    'NAME_TYPE_SUITE_Group_of_people',
    'NAME_TYPE_SUITE_Other_A',
    'NAME_TYPE_SUITE_Other_B',
    'NAME_TYPE_SUITE_Spouse_partner',
    'NAME_TYPE_SUITE_Unaccompanied',
    'WEEKDAY_APPR_PROCESS_START_MONDAY',
    'WEEKDAY_APPR_PROCESS_START_TUESDAY',
    'WEEKDAY_APPR_PROCESS_START_WEDNESDAY',
    'WEEKDAY_APPR_PROCESS_START_THURSDAY',
    'WEEKDAY_APPR_PROCESS_START_FRIDAY',
    'WEEKDAY_APPR_PROCESS_START_SATURDAY',
    'WEEKDAY_APPR_PROCESS_START_SUNDAY',
    'NAME_FAMILY_STATUS_Civil_marriage',
    'NAME_FAMILY_STATUS_Married',
    'NAME_FAMILY_STATUS_Separated',
    'NAME_FAMILY_STATUS_Single_not_married',
    'NAME_FAMILY_STATUS_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Children_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Children_Married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Children_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Family_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Family_Married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Family_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Widow', 
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow',
    'PROCESS_START_PERIOD_afternoon',
    'PROCESS_START_PERIOD_dusk',
    'PROCESS_START_PERIOD_morning',    
    'PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN',
    'PREV_NAME_TYPE_SUITE_Children_MEAN',
    'PREV_NAME_TYPE_SUITE_Family_MEAN',
    'PREV_NAME_TYPE_SUITE_Group_of_people_MEAN',
    'PREV_NAME_TYPE_SUITE_Other_A_MEAN',
    'PREV_NAME_TYPE_SUITE_Other_B_MEAN',
    'PREV_NAME_TYPE_SUITE_Spouse_partner_MEAN',
    'PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN',
    'PREV_HOUR_APPR_PROCESS_START_morning_MEAN',
    'PREV_HOUR_APPR_PROCESS_START_afternoon_MEAN',
    'PREV_HOUR_APPR_PROCESS_START_dusk_MEAN',
    'APPR_PROCESS_START_DIV_morning',
    'APPR_PROCESS_START_DIV_afternoon',
    'APPR_PROCESS_START_DIV_dusk',
    'NAME_TYPE_SUITE_DIV_Children', 
    'NAME_TYPE_SUITE_DIV_Family',
    'NAME_TYPE_SUITE_DIV_Group_of_people',
    'NAME_TYPE_SUITE_DIV_Other_A',
    'NAME_TYPE_SUITE_DIV_Other_B',
    'NAME_TYPE_SUITE_DIV_Spouse_partner',
    'NAME_TYPE_SUITE_DIV_Unaccompanied',
    'WEEKDAY_APPR_PROCESS_DIV_MONDAY',
    'WEEKDAY_APPR_PROCESS_DIV_TUESDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_WEDNESDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_THURSDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_FRIDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_SATURDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_SUNDAY',   
]

In [107]:
# for group 2:

to_drop_for_train_2 = [
    'NAME_TYPE_SUITE_Group_of_people',
    'TYPE_SUITE_FAMILY_STATUS_Children_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Children_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Children_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Widow',
]

alternative_feat_2 = [
    'DAYS_ID_PUBLISH',
    'FLAG_EMP_PHONE', 
    'FLAG_WORK_PHONE', 
    'FLAG_CONT_MOBILE', 
    'FLAG_PHONE',
    'REGION_RATING_CLIENT_W_CITY',
    'REG_REGION_NOT_LIVE_REGION',
    'REG_REGION_NOT_WORK_REGION',
    'REG_CITY_NOT_LIVE_CITY',
    'REG_CITY_NOT_WORK_CITY',
    'OBS_30_CNT_SOCIAL_CIRCLE', 
    'DEF_30_CNT_SOCIAL_CIRCLE',
    'OBS_60_CNT_SOCIAL_CIRCLE',
    'DEF_60_CNT_SOCIAL_CIRCLE', 
    'DAYS_LAST_PHONE_CHANGE', 
    'CAR_BINS',
    'FAM_MEMBERS_BIN', 
    'AVG_OBS_CNT_SOCIAL_CIRCLE', 
    'AVG_DEF_CNT_SOCIAL_CIRCLE', 
    'RATIO_DEF_OBS_SOCIAL_CIRCLE',
    'NAME_TYPE_SUITE_Children',
    'NAME_TYPE_SUITE_Family',
    'NAME_TYPE_SUITE_Group_of_people',
    'NAME_TYPE_SUITE_Other_A',
    'NAME_TYPE_SUITE_Other_B',
    'NAME_TYPE_SUITE_Spouse_partner',
    'NAME_TYPE_SUITE_Unaccompanied',
    'WEEKDAY_APPR_PROCESS_START_MONDAY',
    'WEEKDAY_APPR_PROCESS_START_TUESDAY',
    'WEEKDAY_APPR_PROCESS_START_WEDNESDAY',
    'WEEKDAY_APPR_PROCESS_START_THURSDAY',
    'WEEKDAY_APPR_PROCESS_START_FRIDAY',
    'WEEKDAY_APPR_PROCESS_START_SATURDAY',
    'WEEKDAY_APPR_PROCESS_START_SUNDAY',
    'NAME_FAMILY_STATUS_Civil_marriage',
    'NAME_FAMILY_STATUS_Married',
    'NAME_FAMILY_STATUS_Separated',
    'NAME_FAMILY_STATUS_Single_not_married',
    'NAME_FAMILY_STATUS_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Children_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Children_Married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Children_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Family_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Family_Married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Family_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow',
    'PROCESS_START_PERIOD_afternoon',
    'PROCESS_START_PERIOD_dusk',
    'PROCESS_START_PERIOD_morning',  
]

In [108]:
# for group 3:

to_drop_for_train_3 = [
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Widow',
]

alternative_feat_3 = [
    'DAYS_ID_PUBLISH',
    'FLAG_EMP_PHONE',
    'FLAG_WORK_PHONE',
    'FLAG_CONT_MOBILE', 
    'FLAG_PHONE',
    'REGION_RATING_CLIENT_W_CITY',
    'REG_REGION_NOT_LIVE_REGION',
    'REG_REGION_NOT_WORK_REGION',
    'REG_CITY_NOT_LIVE_CITY',
    'REG_CITY_NOT_WORK_CITY',
    'OBS_30_CNT_SOCIAL_CIRCLE', 
    'DEF_30_CNT_SOCIAL_CIRCLE',
    'OBS_60_CNT_SOCIAL_CIRCLE',
    'DEF_60_CNT_SOCIAL_CIRCLE', 
    'DAYS_LAST_PHONE_CHANGE', 
    'CAR_BINS',
    'FAM_MEMBERS_BIN', 
    'AVG_OBS_CNT_SOCIAL_CIRCLE', 
    'AVG_DEF_CNT_SOCIAL_CIRCLE', 
    'RATIO_DEF_OBS_SOCIAL_CIRCLE',
    'NAME_TYPE_SUITE_Children',
    'NAME_TYPE_SUITE_Family',
    'NAME_TYPE_SUITE_Group_of_people',
    'NAME_TYPE_SUITE_Other_A',
    'NAME_TYPE_SUITE_Other_B',
    'NAME_TYPE_SUITE_Spouse_partner',
    'NAME_TYPE_SUITE_Unaccompanied',
    'WEEKDAY_APPR_PROCESS_START_MONDAY',
    'WEEKDAY_APPR_PROCESS_START_TUESDAY',
    'WEEKDAY_APPR_PROCESS_START_WEDNESDAY',
    'WEEKDAY_APPR_PROCESS_START_THURSDAY',
    'WEEKDAY_APPR_PROCESS_START_FRIDAY',
    'WEEKDAY_APPR_PROCESS_START_SATURDAY',
    'WEEKDAY_APPR_PROCESS_START_SUNDAY',
    'NAME_FAMILY_STATUS_Civil_marriage',
    'NAME_FAMILY_STATUS_Married',
    'NAME_FAMILY_STATUS_Separated',
    'NAME_FAMILY_STATUS_Single_not_married',
    'NAME_FAMILY_STATUS_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Children_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Children_Married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Children_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Family_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Family_Married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Family_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Widow', 
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow',
    'PROCESS_START_PERIOD_afternoon',
    'PROCESS_START_PERIOD_dusk',
    'PROCESS_START_PERIOD_morning',    
    'PREV_WEEKDAY_APPR_PROCESS_START_MONDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_TUESDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_THURSDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_FRIDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_SATURDAY_MEAN',
    'PREV_WEEKDAY_APPR_PROCESS_START_SUNDAY_MEAN',
    'PREV_NAME_TYPE_SUITE_Children_MEAN',
    'PREV_NAME_TYPE_SUITE_Family_MEAN',
    'PREV_NAME_TYPE_SUITE_Group_of_people_MEAN',
    'PREV_NAME_TYPE_SUITE_Other_A_MEAN',
    'PREV_NAME_TYPE_SUITE_Other_B_MEAN',
    'PREV_NAME_TYPE_SUITE_Spouse_partner_MEAN',
    'PREV_NAME_TYPE_SUITE_Unaccompanied_MEAN',
    'PREV_HOUR_APPR_PROCESS_START_morning_MEAN',
    'PREV_HOUR_APPR_PROCESS_START_afternoon_MEAN',
    'PREV_HOUR_APPR_PROCESS_START_dusk_MEAN',
    'APPR_PROCESS_START_DIV_morning',
    'APPR_PROCESS_START_DIV_afternoon',
    'APPR_PROCESS_START_DIV_dusk',
    'NAME_TYPE_SUITE_DIV_Children', 
    'NAME_TYPE_SUITE_DIV_Family',
    'NAME_TYPE_SUITE_DIV_Group_of_people',
    'NAME_TYPE_SUITE_DIV_Other_A',
    'NAME_TYPE_SUITE_DIV_Other_B',
    'NAME_TYPE_SUITE_DIV_Spouse_partner',
    'NAME_TYPE_SUITE_DIV_Unaccompanied',
    'WEEKDAY_APPR_PROCESS_DIV_MONDAY',
    'WEEKDAY_APPR_PROCESS_DIV_TUESDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_WEDNESDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_THURSDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_FRIDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_SATURDAY', 
    'WEEKDAY_APPR_PROCESS_DIV_SUNDAY',   
]

In [109]:
# for group 4:

to_drop_for_train_4 = [
    'NAME_TYPE_SUITE_Children',
    'NAME_TYPE_SUITE_Other_B',
    'TYPE_SUITE_FAMILY_STATUS_Children_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Children_Married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Family_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Family_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Single_not_married',    
]

alternative_feat_4 = [
    'DAYS_ID_PUBLISH',
    'FLAG_EMP_PHONE', 
    'FLAG_WORK_PHONE', 
    'FLAG_CONT_MOBILE', 
    'FLAG_PHONE',
    'REGION_RATING_CLIENT_W_CITY',
    'REG_REGION_NOT_LIVE_REGION',
    'REG_REGION_NOT_WORK_REGION',
    'REG_CITY_NOT_LIVE_CITY',
    'REG_CITY_NOT_WORK_CITY',
    'OBS_30_CNT_SOCIAL_CIRCLE', 
    'DEF_30_CNT_SOCIAL_CIRCLE',
    'OBS_60_CNT_SOCIAL_CIRCLE',
    'DEF_60_CNT_SOCIAL_CIRCLE', 
    'DAYS_LAST_PHONE_CHANGE', 
    'CAR_BINS',
    'FAM_MEMBERS_BIN', 
    'AVG_OBS_CNT_SOCIAL_CIRCLE', 
    'AVG_DEF_CNT_SOCIAL_CIRCLE', 
    'RATIO_DEF_OBS_SOCIAL_CIRCLE',
    'NAME_TYPE_SUITE_Children',
    'NAME_TYPE_SUITE_Family',
    'NAME_TYPE_SUITE_Group_of_people',
    'NAME_TYPE_SUITE_Other_A',
    'NAME_TYPE_SUITE_Other_B',
    'NAME_TYPE_SUITE_Spouse_partner',
    'NAME_TYPE_SUITE_Unaccompanied',
    'WEEKDAY_APPR_PROCESS_START_MONDAY',
    'WEEKDAY_APPR_PROCESS_START_TUESDAY',
    'WEEKDAY_APPR_PROCESS_START_WEDNESDAY',
    'WEEKDAY_APPR_PROCESS_START_THURSDAY',
    'WEEKDAY_APPR_PROCESS_START_FRIDAY',
    'WEEKDAY_APPR_PROCESS_START_SATURDAY',
    'WEEKDAY_APPR_PROCESS_START_SUNDAY',
    'NAME_FAMILY_STATUS_Civil_marriage',
    'NAME_FAMILY_STATUS_Married',
    'NAME_FAMILY_STATUS_Separated',
    'NAME_FAMILY_STATUS_Single_not_married',
    'NAME_FAMILY_STATUS_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Children_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Children_Married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Children_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Family_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Family_Married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Family_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Family_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Married',
    'TYPE_SUITE_FAMILY_STATUS_Group_of_people_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_A_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Other_B_Widow',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Married',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Spouse_partner_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Civil_marriage',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Separated',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Single_not_married',
    'TYPE_SUITE_FAMILY_STATUS_Unaccompanied_Widow',
    'PROCESS_START_PERIOD_afternoon',
    'PROCESS_START_PERIOD_dusk',
    'PROCESS_START_PERIOD_morning',   
]

In [110]:
# save individual train and test files
train_1.to_csv('../datasets/train_1_final.csv', index=False)
train_2.to_csv('../datasets/train_2_final.csv', index=False)
train_3.to_csv('../datasets/train_3_final.csv', index=False)
train_4.to_csv('../datasets/train_4_final.csv', index=False)

test_1.to_csv('../datasets/test_1_final.csv', index=False)
test_2.to_csv('../datasets/test_2_final.csv', index=False)
test_3.to_csv('../datasets/test_3_final.csv', index=False)
test_4.to_csv('../datasets/test_4_final.csv', index=False)