In [1]:
%matplotlib inline
%reload_ext autoreload
%autoreload 2

In [2]:
import gc
import sys
sys.path.append('../')

from fastai.structured import *
from fastai.column_data import *
np.set_printoptions(threshold=50, edgeitems=20)
from IPython.display import HTML, display
from sklearn import metrics
import traceback 
from sklearn.ensemble import RandomForestRegressor, RandomForestClassifier

import featuretools as ft

MERED = "merged"
#PATH = "../../../data/home-credit-default-risk/"
PATH = "../../data/home-credit-default-risk/"

In [6]:
ls {PATH}

application_test.csv                [0m[01;34mmerged[0m/
application_train.csv               [01;34mmodels[0m/
bureau_balance.csv                  POS_CASH_balance.csv
bureau.csv                          previous_application.csv
credit_card_balance.csv             sample_submission.csv
HomeCredit_columns_description.csv  [01;34mtmp[0m/
installments_payments.csv


In [3]:
n_sample = None

In [4]:
cat_vars = [
    'CREDIT_ACTIVE',
    'DAYS_CREDIT',
    'CREDIT_DAY_OVERDUE',
    'DAYS_CREDIT_ENDDATE',
    'DAYS_ENDDATE_FACT',
    'AMT_CREDIT_MAX_OVERDUE',
    'CNT_CREDIT_PROLONG',
    'CREDIT_TYPE',
    'STATUS',
    'CNT_INSTALMENT',
    'CNT_INSTALMENT_FUTURE',
    'SK_DPD',
    'SK_DPD_DEF',
    'MONTHS_BALANCE',
    'CNT_DRAWINGS_ATM_CURRENT',
    'CNT_DRAWINGS_CURRENT',
    'CNT_DRAWINGS_OTHER_CURRENT',
    'CNT_DRAWINGS_POS_CURRENT',
    'CNT_INSTALMENT_MATURE_CUM',
    'NAME_CONTRACT_TYPE',
    'WEEKDAY_APPR_PROCESS_START',
    'HOUR_APPR_PROCESS_START',
    'FLAG_LAST_APPL_PER_CONTRACT',
    'NFLAG_LAST_APPL_IN_DAY',
    'NFLAG_MICRO_CASH',
    'NAME_CASH_LOAN_PURPOSE',
    'NAME_CONTRACT_STATUS',
    'DAYS_DECISION',
    'NAME_PAYMENT_TYPE',
    'CODE_REJECT_REASON',
    'NAME_TYPE_SUITE',
    'NAME_CLIENT_TYPE',
    'NAME_GOODS_CATEGORY',
    'NAME_PORTFOLIO',
    'NAME_PRODUCT_TYPE',
    'CHANNEL_TYPE',
    'NAME_SELLER_INDUSTRY',
    'CNT_PAYMENT',
    'NAME_YIELD_GROUP',
    'PRODUCT_COMBINATION',
    'DAYS_FIRST_DRAWING',
    'DAYS_FIRST_DUE',
    'DAYS_LAST_DUE_1ST_VERSION',
    'DAYS_LAST_DUE',
    'DAYS_TERMINATION',
    'NFLAG_INSURED_ON_APPROVAL',
    'NUM_INSTALMENT_VERSION',
    'NUM_INSTALMENT_NUMBER',
    'DAYS_INSTALMENT',
    'DAYS_ENTRY_PAYMENT',
    'CREDIT_CURRENCY']

In [5]:
def set_category_types(table):
    for col_name in table:
        for cat in cat_vars:            
            if cat == col_name or cat + ")" in col_name:
                table[col_name] = table[col_name].astype('category').cat.as_ordered()
        

In [6]:
def delete_by_nan(table, ratio=0.5):
    null_ratio = table.isnull().sum().sort_values(ascending=False) / len(table)
    filtered_by_null = null_ratio[null_ratio > ratio]
    
    table.drop(columns=filtered_by_null.index, axis=1, inplace=True)

In [7]:
def load_sample(file_name, sk_id_currs=None, nrows=None):
    table = pd.read_csv(f'{PATH}{file_name}.csv', low_memory=False, nrows=nrows)
    if sk_id_currs is not None:
        table = table[table.SK_ID_CURR.isin(sk_id_currs)]    
    
    col_num = len(table.columns)
    delete_by_nan(table)
    
    print(file_name, len(table), col_num, len(table.columns))
    return table

In [8]:
def add_table_to_app(app, table, table_name):
    entities = {
        'app' : (app, "SK_ID_CURR"),
        table_name : (table, 'index'),
    }
    relationships = [
        ('app', 'SK_ID_CURR', table_name, 'index')
    ]
    
    return add_table_to_app_by_entities(entities=entities, relationships=relationships, table_name=table_name)

In [9]:
def add_table_to_app_by_entities(entities, relationships, table_name):
    feature_matrix, feature_defs = ft.dfs(
        entities=entities,
        relationships = relationships,
        target_entity="app",
        agg_primitives=["mean", "sum", "mode"],
        ignore_variables={table_name: ['SK_ID_PREV', 'SK_ID_CURR']}
    )
    
    os.makedirs(f'{PATH}tmp', exist_ok=True)
    feature_matrix = feature_matrix.reset_index()
    
    feature_matrix.to_feather(f'{PATH}tmp/app-table')        
    
    return feature_matrix, feature_defs

In [10]:
train = load_sample('application_train',  nrows=n_sample)

application_train 307511 122 81


In [11]:
test = load_sample('application_test',  nrows=n_sample)

application_test 48744 121 92


In [12]:
train['is_test'] = 0
df_t_t = pd.concat([train, test])
df_t_t.is_test.fillna(1, inplace=True)

of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.


  


In [13]:
del train, test
gc.collect()

21

In [14]:
bureau = load_sample('bureau', df_t_t.SK_ID_CURR)

bureau 1716428 17 15


In [15]:
file_names = ['bureau_balance']
tables = [pd.read_csv(f'{PATH}{file_name}.csv',low_memory=False) for file_name in file_names]
bureau_balance = tables[0][tables[0].SK_ID_BUREAU.isin(bureau.SK_ID_BUREAU)]
bureau_balance = bureau_balance.reset_index()

In [16]:
entities = {
    'app' : (df_t_t, "SK_ID_CURR"),
    'bureau' : (bureau, "SK_ID_BUREAU"),
    'bureau_balance' : (bureau_balance, 'index')
}

relationships = [
    ('app', 'SK_ID_CURR', 'bureau', 'SK_ID_CURR'),
    ('bureau', 'SK_ID_BUREAU', 'bureau_balance', 'SK_ID_BUREAU')
]

In [17]:
df_t_t, _ = add_table_to_app_by_entities(entities, relationships, 'bureau')

In [18]:
del bureau, bureau_balance, tables
gc.collect()

407

In [19]:
file_names = ['previous_application', 'POS_CASH_balance', 'credit_card_balance', 'installments_payments']
for file_name in file_names:
    table = load_sample(file_name, df_t_t.SK_ID_CURR)
    table = table.reset_index()
    df_t_t, feature_defs = add_table_to_app(df_t_t, table, file_name)

previous_application 1670214 37 33
POS_CASH_balance 10001358 8 8
credit_card_balance 3840312 23 23
installments_payments 13605401 8 8


In [20]:
df_all = pd.read_feather(f'{PATH}tmp/app-table')

In [30]:
FileLink(f'data/home-credit-default-risk/tmp/app-table')

In [26]:
ls

[0m[01;36mdata[0m@
Home Credit Default Risk.ipynb
Home Credit Default Risk (only app).ipynb
Home Credit Default Risk (random forest all features).ipynb
Home Credit Default Risk (random forest).ipynb
Plant Seedling clf.ipynb
README.md
submission.csv


In [32]:
df_all.head()

Unnamed: 0,SK_ID_CURR,AMT_ANNUITY,AMT_CREDIT,AMT_GOODS_PRICE,AMT_INCOME_TOTAL,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_WEEK,...,MEAN(installments_payments.DAYS_INSTALMENT),MEAN(installments_payments.DAYS_ENTRY_PAYMENT),MEAN(installments_payments.AMT_INSTALMENT),MEAN(installments_payments.AMT_PAYMENT),SUM(installments_payments.NUM_INSTALMENT_VERSION),SUM(installments_payments.NUM_INSTALMENT_NUMBER),SUM(installments_payments.DAYS_INSTALMENT),SUM(installments_payments.DAYS_ENTRY_PAYMENT),SUM(installments_payments.AMT_INSTALMENT),SUM(installments_payments.AMT_PAYMENT)
0,100001,20560.5,568800.0,450000.0,135000.0,0.0,0.0,0.0,0.0,0.0,...,,,,,,,,,,
1,100002,24700.5,406597.5,351000.0,202500.0,0.0,0.0,0.0,0.0,0.0,...,-778.0,-789.0,447329.61,447329.61,2.0,6.0,-778.0,-789.0,447329.61,447329.61
2,100003,35698.5,1293502.5,1129500.0,270000.0,0.0,0.0,0.0,0.0,0.0,...,,,,,,,,,,
3,100004,6750.0,135000.0,135000.0,67500.0,0.0,0.0,0.0,0.0,0.0,...,,,,,,,,,,
4,100005,17370.0,222768.0,180000.0,99000.0,0.0,0.0,0.0,0.0,0.0,...,,,,,,,,,,


In [31]:
 with pd.option_context("display.max_rows", 1000, "display.max_columns", 1000):
        display(DataFrameSummary(df_all).summary())

Unnamed: 0,SK_ID_CURR,AMT_ANNUITY,AMT_CREDIT,AMT_GOODS_PRICE,AMT_INCOME_TOTAL,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_YEAR,APARTMENTS_AVG,APARTMENTS_MEDI,APARTMENTS_MODE,CNT_CHILDREN,CNT_FAM_MEMBERS,CODE_GENDER,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_ID_PUBLISH,DAYS_LAST_PHONE_CHANGE,DAYS_REGISTRATION,DEF_30_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,EMERGENCYSTATE_MODE,ENTRANCES_AVG,ENTRANCES_MEDI,ENTRANCES_MODE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,FLAG_CONT_MOBILE,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_2,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_EMAIL,FLAG_EMP_PHONE,FLAG_MOBIL,FLAG_OWN_CAR,FLAG_OWN_REALTY,FLAG_PHONE,FLAG_WORK_PHONE,FLOORSMAX_AVG,FLOORSMAX_MEDI,FLOORSMAX_MODE,HOUR_APPR_PROCESS_START,HOUSETYPE_MODE,LIVE_CITY_NOT_WORK_CITY,LIVE_REGION_NOT_WORK_REGION,LIVINGAREA_AVG,LIVINGAREA_MEDI,LIVINGAREA_MODE,NAME_CONTRACT_TYPE,NAME_EDUCATION_TYPE,NAME_FAMILY_STATUS,NAME_HOUSING_TYPE,NAME_INCOME_TYPE,NAME_TYPE_SUITE,OBS_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,OCCUPATION_TYPE,ORGANIZATION_TYPE,REGION_POPULATION_RELATIVE,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,TARGET,TOTALAREA_MODE,WALLSMATERIAL_MODE,WEEKDAY_APPR_PROCESS_START,YEARS_BEGINEXPLUATATION_AVG,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BEGINEXPLUATATION_MODE,is_test,MEAN(bureau.DAYS_CREDIT),MEAN(bureau.CREDIT_DAY_OVERDUE),MEAN(bureau.DAYS_CREDIT_ENDDATE),MEAN(bureau.DAYS_ENDDATE_FACT),MEAN(bureau.CNT_CREDIT_PROLONG),MEAN(bureau.AMT_CREDIT_SUM),MEAN(bureau.AMT_CREDIT_SUM_DEBT),MEAN(bureau.AMT_CREDIT_SUM_LIMIT),MEAN(bureau.AMT_CREDIT_SUM_OVERDUE),MEAN(bureau.DAYS_CREDIT_UPDATE),SUM(bureau.DAYS_CREDIT),SUM(bureau.CREDIT_DAY_OVERDUE),SUM(bureau.DAYS_CREDIT_ENDDATE),SUM(bureau.DAYS_ENDDATE_FACT),SUM(bureau.CNT_CREDIT_PROLONG),SUM(bureau.AMT_CREDIT_SUM),SUM(bureau.AMT_CREDIT_SUM_DEBT),SUM(bureau.AMT_CREDIT_SUM_LIMIT),SUM(bureau.AMT_CREDIT_SUM_OVERDUE),SUM(bureau.DAYS_CREDIT_UPDATE),MODE(bureau.CREDIT_ACTIVE),MODE(bureau.CREDIT_CURRENCY),MODE(bureau.CREDIT_TYPE),MEAN(bureau_balance.MONTHS_BALANCE),SUM(bureau_balance.MONTHS_BALANCE),MODE(bureau_balance.STATUS),MEAN(bureau.MEAN(bureau_balance.MONTHS_BALANCE)),MEAN(bureau.SUM(bureau_balance.MONTHS_BALANCE)),SUM(bureau.MEAN(bureau_balance.MONTHS_BALANCE)),MODE(bureau.MODE(bureau_balance.STATUS)),MEAN(previous_application.AMT_ANNUITY),MEAN(previous_application.AMT_APPLICATION),MEAN(previous_application.AMT_CREDIT),MEAN(previous_application.AMT_GOODS_PRICE),MEAN(previous_application.HOUR_APPR_PROCESS_START),MEAN(previous_application.NFLAG_LAST_APPL_IN_DAY),MEAN(previous_application.DAYS_DECISION),MEAN(previous_application.SELLERPLACE_AREA),MEAN(previous_application.CNT_PAYMENT),MEAN(previous_application.DAYS_FIRST_DRAWING),MEAN(previous_application.DAYS_FIRST_DUE),MEAN(previous_application.DAYS_LAST_DUE_1ST_VERSION),MEAN(previous_application.DAYS_LAST_DUE),MEAN(previous_application.DAYS_TERMINATION),MEAN(previous_application.NFLAG_INSURED_ON_APPROVAL),SUM(previous_application.AMT_ANNUITY),SUM(previous_application.AMT_APPLICATION),SUM(previous_application.AMT_CREDIT),SUM(previous_application.AMT_GOODS_PRICE),SUM(previous_application.HOUR_APPR_PROCESS_START),SUM(previous_application.NFLAG_LAST_APPL_IN_DAY),SUM(previous_application.DAYS_DECISION),SUM(previous_application.SELLERPLACE_AREA),SUM(previous_application.CNT_PAYMENT),SUM(previous_application.DAYS_FIRST_DRAWING),SUM(previous_application.DAYS_FIRST_DUE),SUM(previous_application.DAYS_LAST_DUE_1ST_VERSION),SUM(previous_application.DAYS_LAST_DUE),SUM(previous_application.DAYS_TERMINATION),SUM(previous_application.NFLAG_INSURED_ON_APPROVAL),MODE(previous_application.NAME_CONTRACT_TYPE),MODE(previous_application.WEEKDAY_APPR_PROCESS_START),MODE(previous_application.FLAG_LAST_APPL_PER_CONTRACT),MODE(previous_application.NAME_CASH_LOAN_PURPOSE),MODE(previous_application.NAME_CONTRACT_STATUS),MODE(previous_application.NAME_PAYMENT_TYPE),MODE(previous_application.CODE_REJECT_REASON),MODE(previous_application.NAME_TYPE_SUITE),MODE(previous_application.NAME_CLIENT_TYPE),MODE(previous_application.NAME_GOODS_CATEGORY),MODE(previous_application.NAME_PORTFOLIO),MODE(previous_application.NAME_PRODUCT_TYPE),MODE(previous_application.CHANNEL_TYPE),MODE(previous_application.NAME_SELLER_INDUSTRY),MODE(previous_application.NAME_YIELD_GROUP),MODE(previous_application.PRODUCT_COMBINATION),MEAN(POS_CASH_balance.MONTHS_BALANCE),MEAN(POS_CASH_balance.CNT_INSTALMENT),MEAN(POS_CASH_balance.CNT_INSTALMENT_FUTURE),MEAN(POS_CASH_balance.SK_DPD),MEAN(POS_CASH_balance.SK_DPD_DEF),SUM(POS_CASH_balance.MONTHS_BALANCE),SUM(POS_CASH_balance.CNT_INSTALMENT),SUM(POS_CASH_balance.CNT_INSTALMENT_FUTURE),SUM(POS_CASH_balance.SK_DPD),SUM(POS_CASH_balance.SK_DPD_DEF),MODE(POS_CASH_balance.NAME_CONTRACT_STATUS),MEAN(credit_card_balance.MONTHS_BALANCE),MEAN(credit_card_balance.AMT_BALANCE),MEAN(credit_card_balance.AMT_CREDIT_LIMIT_ACTUAL),MEAN(credit_card_balance.AMT_DRAWINGS_ATM_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_OTHER_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_POS_CURRENT),MEAN(credit_card_balance.AMT_INST_MIN_REGULARITY),MEAN(credit_card_balance.AMT_PAYMENT_CURRENT),MEAN(credit_card_balance.AMT_PAYMENT_TOTAL_CURRENT),MEAN(credit_card_balance.AMT_RECEIVABLE_PRINCIPAL),MEAN(credit_card_balance.AMT_RECIVABLE),MEAN(credit_card_balance.AMT_TOTAL_RECEIVABLE),MEAN(credit_card_balance.CNT_DRAWINGS_ATM_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_OTHER_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_POS_CURRENT),MEAN(credit_card_balance.CNT_INSTALMENT_MATURE_CUM),MEAN(credit_card_balance.SK_DPD),MEAN(credit_card_balance.SK_DPD_DEF),SUM(credit_card_balance.MONTHS_BALANCE),SUM(credit_card_balance.AMT_BALANCE),SUM(credit_card_balance.AMT_CREDIT_LIMIT_ACTUAL),SUM(credit_card_balance.AMT_DRAWINGS_ATM_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_OTHER_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_POS_CURRENT),SUM(credit_card_balance.AMT_INST_MIN_REGULARITY),SUM(credit_card_balance.AMT_PAYMENT_CURRENT),SUM(credit_card_balance.AMT_PAYMENT_TOTAL_CURRENT),SUM(credit_card_balance.AMT_RECEIVABLE_PRINCIPAL),SUM(credit_card_balance.AMT_RECIVABLE),SUM(credit_card_balance.AMT_TOTAL_RECEIVABLE),SUM(credit_card_balance.CNT_DRAWINGS_ATM_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_OTHER_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_POS_CURRENT),SUM(credit_card_balance.CNT_INSTALMENT_MATURE_CUM),SUM(credit_card_balance.SK_DPD),SUM(credit_card_balance.SK_DPD_DEF),MODE(credit_card_balance.NAME_CONTRACT_STATUS),MEAN(installments_payments.NUM_INSTALMENT_VERSION),MEAN(installments_payments.NUM_INSTALMENT_NUMBER),MEAN(installments_payments.DAYS_INSTALMENT),MEAN(installments_payments.DAYS_ENTRY_PAYMENT),MEAN(installments_payments.AMT_INSTALMENT),MEAN(installments_payments.AMT_PAYMENT),SUM(installments_payments.NUM_INSTALMENT_VERSION),SUM(installments_payments.NUM_INSTALMENT_NUMBER),SUM(installments_payments.DAYS_INSTALMENT),SUM(installments_payments.DAYS_ENTRY_PAYMENT),SUM(installments_payments.AMT_INSTALMENT),SUM(installments_payments.AMT_PAYMENT)
count,356255,356219,356255,355977,356255,308687,308687,308687,308687,308687,308687,24857,24857,24857,356255,356253,,356255,356255,356255,356254,356255,355205,355205,,25165,25165,25165,28212,355587,286622,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,,,356255,356255,179914,179914,179914,356255,,356255,356255,25192,25192,25192,,,,,,,355205,355205,,,356255,356255,356255,356255,356255,356255,356255,307511,185200,,,183392,183392,183392,356255,305811,305811,303226,268155,305811,305809,297439,280503,305811,305811,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,,,,134542,356255,,134542,305811,356255,,276718,356255,356255,273874,356255,356255,356255,356255,276719,212371,212371,212371,212371,212371,212371,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,,,,,,,,,,,,,,,,,356255,355796,355795,356255,356255,356255,356255,356255,356255,356255,,356255,356255,356255,281971,356255,281971,281971,329386,281413,356255,356255,356255,356255,281971,356255,281971,281971,329386,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255
mean,278128,27425.6,587767,528020,170116,0.00628144,0.00580847,0.231697,0.304399,0.0299948,1.91156,0.122388,0.122809,0.119078,0.414316,2.15186,,-16041.2,64317.2,-3002.07,-978.581,-4983.59,0.143452,0.100198,,0.151777,0.1512,0.147161,0.50118,0.51489,0.50935,0.99817,1.96488e-05,0.00353679,5.61396e-06,0.00304276,0.0025347,0.0010442,0.0085697,0.000230172,0.00723078,0.000513677,3.64907e-05,0.000437889,0.000289119,0.720504,8.42093e-05,0.0150651,0.0879763,0.000171226,0.0823455,0.00397749,0.071213,0.818498,0.999994,,,0.278612,0.200098,0.227331,0.226922,0.223315,12.0557,,0.178824,0.0408471,0.112286,0.113368,0.110687,,,,,,,1.42573,1.40947,,,0.020917,2.05051,2.02893,0.0780761,0.229661,0.0156489,0.0513705,0.0807288,0.103193,,,0.977889,0.977903,0.977239,0.136823,-1083.8,0.965926,662.421,-967.018,0.00701018,380740,161634,5898.54,45.9507,-542.966,-5502.65,3.94191,2308.4,-3092.32,0.0308852,1.71034e+06,561323,19665.7,182.663,-2860.67,,,,-23.1592,-1894.52,,-19.9465,-364.069,-46.0277,,15930.5,174966,195690,227626,12.4943,0.996264,-879.924,322.351,16.0579,342254,13490.1,33416.8,76205.1,81709.9,0.332169,12373.9,174966,195690,174990,12.4943,0.996264,-879.924,322.351,12.4729,204025,8041.75,19920.5,45427.4,48708.9,0.198013,,,,,,,,,,,,,,,,,-27.5522,20.3224,12.8835,0.36196,0.0737309,-27.5522,20.2962,12.8669,0.36196,0.0737309,,-35.0736,54571.1,149920,5659.89,6346.33,260.422,2088.29,3383.66,9681.99,7076.99,52355.2,54398.4,54408.4,0.300244,0.559515,0.00497924,0.401694,20.5442,9.17916,0.34351,-35.0736,54571.1,149920,4479.73,6346.33,206.12,1652.85,3128.47,7648,7076.99,52355.2,54398.4,54408.4,0.237639,0.559515,0.003941,0.317935,18.9947,9.17916,0.34351,,0.854124,18.9699,-1044.52,-1053.28,16956.5,17148,0.854124,18.9699,-1044.52,-1053.28,16956.5,17148
std,102842,14732.8,398624,366065,223507,0.10425,0.0797363,0.855949,0.786915,0.191374,1.86534,0.113112,0.114184,0.113465,0.720378,0.907937,,4358.8,141706,1517.9,835.064,3526.97,0.456579,0.368259,,0.100669,0.100931,0.101748,0.205142,0.189753,0.194141,0.0427411,0.00443266,0.0593658,0.00236938,0.0550773,0.050282,0.0322972,0.0921753,0.0151697,0.0847261,0.0226587,0.00604065,0.0209212,0.0170011,0.448752,0.00917619,0.121812,0.283261,0.0130842,0.274891,0.0629419,0.257181,0.385434,0.00236938,,,0.448317,0.400074,0.145051,0.145453,0.144126,3.26758,,0.383206,0.197936,0.11486,0.116503,0.116699,,,,,,,2.59991,2.57772,,,0.013915,0.510947,0.504586,0.268292,0.420616,0.124113,0.220753,0.272419,0.108041,,,0.0579289,0.0585622,0.0631651,0.343661,558.441,24.9572,3282.36,531.159,0.0623341,879286,536768,29921.8,4956.64,446.427,6075.06,82.3009,11803.3,3993.2,0.216193,3.92165e+06,1.5371e+06,91347.4,14538.5,3708.72,,,,11.7924,4339.06,,11.1091,645.418,94.4309,,14736.3,292218,317936,314821,3.33569,0.0610093,778.502,9621.51,14.5555,88838.3,71660.9,106370,149382,153119,0.470992,14583.8,292218,317936,292240,3.33569,0.0610093,778.502,9621.51,14.4665,181403,55723.1,83747.7,121246,124835,0.398502,,,,,,,,,,,,,,,,,24.0015,14.0444,12.8571,15.1692,1.52305,24.0015,14.0543,12.8571,15.1692,1.52305,,27.6505,98947.3,160033,27216.6,30090.5,7077.75,16146,5299.27,33819.1,29869.4,95376,98653.2,98659.7,1.07532,2.67162,0.0849536,2.67214,20.3447,98.8238,22.01,27.6505,98947.3,160033,24322.3,30090.5,6297.64,14389.4,5173.26,30315.2,29869.4,95376,98653.2,98659.7,0.964408,2.67162,0.0756064,2.38288,20.3008,98.8238,22.01,,1.00795,26.8334,801.471,801.096,50563.7,54913.6,1.00795,26.8334,801.471,801.096,50563.7,54913.6
min,100001,1615.5,45000,40500,25650,0,0,0,0,0,0,0,0,0,0,1,,-25229,-17912,-7197,-4361,-24672,0,0,,0,0,0,0.0134579,8.17362e-08,0.000527265,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,0,0,0,0,0,0,,0,0,0,0,0,,,,,,,0,0,,,0.000253,1,-1,0,0,0,0,0,0,,,0,0,0,0,-2922,0,-41875,-8376.5,0,0,-1.08361e+06,-97891.7,0,-41890,-83611,0,-155271,-74646,0,0,-6.98156e+06,-579854,0,-90065,,,,-92.5,-80687,,-92.5,-4656,-2294.5,,0,0,0,0,0,0,-2922,-1,0,-2919,-2892,-2801,-2889,-2825,0,0,0,0,0,0,0,-2922,-1,0,-2919,-2892,-2801,-2889,-2825,0,,,,,,,,,,,,,,,,,-96,1,0,0,0,-96,0,0,0,0,,-96,-261471,0,0,-1687.5,0,0,0,0,0,-267615,-261777,-261777,0,0,0,0,0,0,0,-96,-261471,0,0,-1687.5,0,0,0,0,0,-267615,-261777,-261777,0,0,0,0,0,0,0,,0,1,-2922,-3021,0.045,0,0,1,-2922,-3021,0.045,0
25%,189064,16731,270000,234000,112500,0,0,0,0,0,0,0.0619,0.0625,0.0588,0,2,,-19676,-2781,-4318,-1592,-7477,0,0,,0.0745,0.069,0.069,0.343695,0.394955,0.368969,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,,,0,0,0.1667,0.1667,0.1667,10,,0,0,0.048575,0.049,0.0456,,,,,,,0,0,,,0.010006,2,2,0,0,0,0,0,0.0415,,,0.9767,0.9767,0.9767,0,-1431,0,-697.525,-1288.59,0,103962,0,0,0,-773.696,-8091,0,-2319,-4529,0,157287,0,0,0,-4150,,,,-31.3464,-1416,,-26.25,-519.888,-50.5,,6309.92,18585,24043.5,50692.5,10,1,-1300,-1,6,365243,-1630,-1243,-1317,-1271,0,2250,18585,24043.5,18594,10,1,-1300,-1,0,0,-1022,-584,-738,-697,0,,,,,,,,,,,,,,,,,-41,10,4,0,0,-41,10,4,0,0,,-58,0,45000,0,0,0,0,0,144.225,0,0,0,0,0,0,0,0,4,0,0,-58,0,45000,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,,0,4,-1656,-1665,4187.72,3375,0,4,-1656,-1665,4187.72,3375
50%,278128,25078.5,500211,450000,153000,0,0,0,0,0,1,0.0928,0.0926,0.0851,0,2,,-15755,-1224,-3252,-771,-4502,0,0,,0.1379,0.1379,0.1379,0.506771,0.564849,0.533482,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,0,0,0.1667,0.1667,0.1667,12,,0,0,0.077,0.0776,0.0751,,,,,,,0,0,,,0.01885,2,2,0,0,0,0,0,0.069,,,0.9816,0.9816,0.9816,0,-1052.5,0,-131.789,-926.4,0,197297,44760.4,0,0,-479.3,-3597,0,0,-1692,0,723596,90660.6,0,0,-1574,,,,-23.1038,0,,-18.95,0,0,,11250,70762.5,80334,111998,12,1,-581,3,12,365243,-835,-365,-540,-501,0,8216.82,70762.5,80334,70762.5,12,1,-581,3,10,365243,-274,0,0,0,0,,,,,,,,,,,,,,,,,-18,12,9,0,0,-18,12,9,0,0,,-27,0,112500,0,0,0,0,0,2638.8,0,0,0,0,0,0,0,0,15,0,0,-27,0,112500,0,0,0,0,0,370.71,0,0,0,0,0,0,0,0,12,0,0,,1,8,-822,-831,8855.1,8101.44,1,8,-822,-831,8855.1,8101.44
75%,367192,34960.5,797558,675000,202500,0,0,0,0,0,3,0.1485,0.1499,0.1502,1,3,,-12425,-290,-1717,-286,-1995,0,0,,0.2069,0.2069,0.2069,0.665956,0.662928,0.665855,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,1,0,0.3333,0.3333,0.3333,14,,0,0,0.1376,0.137425,0.1306,,,,,,,2,2,,,0.028663,2,2,0,0,0,0,0,0.1287,,,0.9866,0.9866,0.9866,0,-670.369,0,613,-573.667,0,397865,143600,0,0,-209,-911,0,1217,-24,0,2.01538e+06,551171,0,0,-142,,,,-14.302,0,,-12,0,0,,20637,180000,215865,234000,15,1,-280,82,24,365243,-412,126,-76,-45,1,16773.9,180000,215865,180000,15,1,-280,82,16,365243,0,0,0,0,0,,,,,,,,,,,,,,,,,-10,24,18,0,0,-10,24,18,0,0,,-11,85081.7,180000,0,0,0,0,5895.63,9000,6750,81573.5,85023.5,85048.2,0,0,0,0,32,0,0,-11,85081.7,180000,0,0,0,0,5625,7200,6750,81573.5,85023.5,85048.2,0,0,0,0,30,0,0,,1,19,-362,-371,16624.6,16006.5,1,19,-362,-371,16624.6,16006.5
max,456255,258026,4.05e+06,4.05e+06,1.17e+08,9,4,27,261,8,25,1,1,1,20,21,,-7338,365243,0,0,0,34,24,,1,1,1,0.939145,0.855,0.89601,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,,,1,1,1,1,1,23,,1,1,1,1,1,,,,,,,354,351,,,0.072508,3,3,1,1,1,1,1,1,,,1,1,1,1,0,2776,31198,0,6,1.98072e+08,5.175e+07,4.5e+06,1.6174e+06,14,0,5250,214193,0,9,1.01796e+09,3.34498e+08,8.12933e+06,3.75668e+06,14,,,,0,0,,0,0,0,,298558,4.23788e+06,4.10435e+06,4.23788e+06,23,1,-2,4e+06,84,365243,365243,365243,365243,365243,1,298558,4.23788e+06,4.10435e+06,4.23788e+06,23,1,-2,4e+06,84,365243,365243,365243,365243,365243,1,,,,,,,,,,,,,,,,,-1,72,70,2672,268,-1,72,70,2672,268,,-1,983767,1.35e+06,900000,963346,757350,963346,57252.4,1.56225e+06,1.55228e+06,971851,982646,982646,31,142,8,142,117,3015,3015,-1,983767,1.35e+06,900000,963346,757350,963346,57252.4,1.56225e+06,1.55228e+06,971851,982646,982646,31,142,8,142,117,3015,3015,,35,244,-2,-2,2.54423e+06,2.54423e+06,35,244,-2,-2,2.54423e+06,2.54423e+06
counts,356255,356219,356255,355977,356255,308687,308687,308687,308687,308687,308687,24857,24857,24857,356255,356253,356255,356255,356255,356255,356254,356255,355205,355205,188291,25165,25165,25165,28212,355587,286622,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,179914,179914,179914,356255,25125,356255,356255,25192,25192,25192,356255,356255,356255,356255,356255,354052,355205,355205,244259,356255,356255,356255,356255,356255,356255,356255,356255,307511,185200,24851,356255,183392,183392,183392,356255,305811,305811,303226,268155,305811,305809,297439,280503,305811,305811,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,305811,305811,305811,134542,356255,134542,134542,305811,356255,134542,276718,356255,356255,273874,356255,356255,356255,356255,276719,212371,212371,212371,212371,212371,212371,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,180862,356255,356255,356255,356255,356255,356255,356255,356182,356255,355796,355795,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,281971,356255,281971,281971,329386,281413,356255,356255,356255,356255,281971,356255,281971,281971,329386,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255,356255
uniques,356255,14166,6480,1291,2741,9,5,24,11,9,25,1543,918,636,16,18,3,17467,12896,6224,3846,15898,10,9,2,200,43,30,27207,127157,814,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,414,49,25,24,3,2,2,3848,3885,3842,2,5,6,6,8,7,36,35,18,58,82,3,4,2,2,2,2,2,5191,7,7,294,250,224,2,69801,1657,108600,45759,111,241365,195127,44904,2081,59481,27394,927,48663,19490,10,236434,176862,42988,1369,18233,4,3,12,86427,20956,6,8068,48709,1657,7,139327,44146,51107,44146,24,2,2921,1804,39,2445,2892,4548,2837,2785,2,139327,44146,51107,44146,24,2,2921,1804,39,2446,2893,4548,2838,2786,2,4,7,2,25,4,4,9,7,4,27,5,3,8,11,5,17,96,56,69,226,75,96,57,69,226,75,6,96,140007,150,758,17612,385,15780,39848,32246,23929,128650,141760,141765,30,92,9,89,118,501,106,96,140007,150,758,17612,385,15780,39848,32246,23929,128650,141760,141765,30,92,9,89,118,501,106,7,36,228,2921,2964,141721,149696,36,228,2921,2964,141721,149696


In [176]:
delete_by_nan(df_all)

In [177]:
[print(c) for c in df_all.columns]

SK_ID_CURR
AMT_ANNUITY
AMT_CREDIT
AMT_GOODS_PRICE
AMT_INCOME_TOTAL
AMT_REQ_CREDIT_BUREAU_DAY
AMT_REQ_CREDIT_BUREAU_HOUR
AMT_REQ_CREDIT_BUREAU_MON
AMT_REQ_CREDIT_BUREAU_QRT
AMT_REQ_CREDIT_BUREAU_WEEK
AMT_REQ_CREDIT_BUREAU_YEAR
APARTMENTS_AVG
APARTMENTS_MEDI
APARTMENTS_MODE
CNT_CHILDREN
CNT_FAM_MEMBERS
CODE_GENDER
DAYS_BIRTH
DAYS_EMPLOYED
DAYS_ID_PUBLISH
DAYS_LAST_PHONE_CHANGE
DAYS_REGISTRATION
DEF_30_CNT_SOCIAL_CIRCLE
DEF_60_CNT_SOCIAL_CIRCLE
EMERGENCYSTATE_MODE
ENTRANCES_AVG
ENTRANCES_MEDI
ENTRANCES_MODE
EXT_SOURCE_2
EXT_SOURCE_3
FLAG_CONT_MOBILE
FLAG_DOCUMENT_10
FLAG_DOCUMENT_11
FLAG_DOCUMENT_12
FLAG_DOCUMENT_13
FLAG_DOCUMENT_14
FLAG_DOCUMENT_15
FLAG_DOCUMENT_16
FLAG_DOCUMENT_17
FLAG_DOCUMENT_18
FLAG_DOCUMENT_19
FLAG_DOCUMENT_2
FLAG_DOCUMENT_20
FLAG_DOCUMENT_21
FLAG_DOCUMENT_3
FLAG_DOCUMENT_4
FLAG_DOCUMENT_5
FLAG_DOCUMENT_6
FLAG_DOCUMENT_7
FLAG_DOCUMENT_8
FLAG_DOCUMENT_9
FLAG_EMAIL
FLAG_EMP_PHONE
FLAG_MOBIL
FLAG_OWN_CAR
FLAG_OWN_REALTY
FLAG_PHONE
FLAG_WORK_PHONE
FLOORSMAX_AVG
FLOORSMA

[None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None,
 None]

In [32]:
train = df_all[df_all.is_test == 0]
train.drop(['is_test'], axis=1)
train = train.reset_index()
set_category_types(train)
train.to_feather(f'{PATH}tmp/train_all_tables')

In [33]:
test = df_all[df_all.is_test == 1]
test.drop(['is_test'], axis=1)
test = test.reset_index()
set_category_types(train)
test.to_feather(f'{PATH}tmp/test_all_tables')

In [34]:
del df_all, train, test
gc.collect()

1885

In [207]:
train = pd.read_feather(f'{PATH}tmp/train_all_tables')

  return feather.read_dataframe(path, nthreads=nthreads)


In [208]:
 with pd.option_context("display.max_rows", 1000, "display.max_columns", 1000):
        display(DataFrameSummary(train).summary())

Unnamed: 0,index,SK_ID_CURR,AMT_ANNUITY,AMT_CREDIT,AMT_GOODS_PRICE,AMT_INCOME_TOTAL,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_YEAR,APARTMENTS_AVG,APARTMENTS_MEDI,APARTMENTS_MODE,CNT_CHILDREN,CNT_FAM_MEMBERS,CODE_GENDER,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_ID_PUBLISH,DAYS_LAST_PHONE_CHANGE,DAYS_REGISTRATION,DEF_30_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,EMERGENCYSTATE_MODE,ENTRANCES_AVG,ENTRANCES_MEDI,ENTRANCES_MODE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,FLAG_CONT_MOBILE,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_2,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_EMAIL,FLAG_EMP_PHONE,FLAG_MOBIL,FLAG_OWN_CAR,FLAG_OWN_REALTY,FLAG_PHONE,FLAG_WORK_PHONE,FLOORSMAX_AVG,FLOORSMAX_MEDI,FLOORSMAX_MODE,HOUR_APPR_PROCESS_START,HOUSETYPE_MODE,LIVE_CITY_NOT_WORK_CITY,LIVE_REGION_NOT_WORK_REGION,LIVINGAREA_AVG,LIVINGAREA_MEDI,LIVINGAREA_MODE,NAME_CONTRACT_TYPE,NAME_EDUCATION_TYPE,NAME_FAMILY_STATUS,NAME_HOUSING_TYPE,NAME_INCOME_TYPE,NAME_TYPE_SUITE,OBS_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,OCCUPATION_TYPE,ORGANIZATION_TYPE,REGION_POPULATION_RELATIVE,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,TARGET,TOTALAREA_MODE,WALLSMATERIAL_MODE,WEEKDAY_APPR_PROCESS_START,YEARS_BEGINEXPLUATATION_AVG,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BEGINEXPLUATATION_MODE,is_test,MEAN(bureau.DAYS_CREDIT),MEAN(bureau.CREDIT_DAY_OVERDUE),MEAN(bureau.DAYS_CREDIT_ENDDATE),MEAN(bureau.DAYS_ENDDATE_FACT),MEAN(bureau.CNT_CREDIT_PROLONG),MEAN(bureau.AMT_CREDIT_SUM),MEAN(bureau.AMT_CREDIT_SUM_DEBT),MEAN(bureau.AMT_CREDIT_SUM_LIMIT),MEAN(bureau.AMT_CREDIT_SUM_OVERDUE),MEAN(bureau.DAYS_CREDIT_UPDATE),SUM(bureau.DAYS_CREDIT),SUM(bureau.CREDIT_DAY_OVERDUE),SUM(bureau.DAYS_CREDIT_ENDDATE),SUM(bureau.DAYS_ENDDATE_FACT),SUM(bureau.CNT_CREDIT_PROLONG),SUM(bureau.AMT_CREDIT_SUM),SUM(bureau.AMT_CREDIT_SUM_DEBT),SUM(bureau.AMT_CREDIT_SUM_LIMIT),SUM(bureau.AMT_CREDIT_SUM_OVERDUE),SUM(bureau.DAYS_CREDIT_UPDATE),MODE(bureau.CREDIT_ACTIVE),MODE(bureau.CREDIT_CURRENCY),MODE(bureau.CREDIT_TYPE),MEAN(bureau_balance.MONTHS_BALANCE),SUM(bureau_balance.MONTHS_BALANCE),MODE(bureau_balance.STATUS),MEAN(bureau.MEAN(bureau_balance.MONTHS_BALANCE)),MEAN(bureau.SUM(bureau_balance.MONTHS_BALANCE)),SUM(bureau.MEAN(bureau_balance.MONTHS_BALANCE)),MODE(bureau.MODE(bureau_balance.STATUS)),MEAN(previous_application.AMT_ANNUITY),MEAN(previous_application.AMT_APPLICATION),MEAN(previous_application.AMT_CREDIT),MEAN(previous_application.AMT_GOODS_PRICE),MEAN(previous_application.HOUR_APPR_PROCESS_START),MEAN(previous_application.NFLAG_LAST_APPL_IN_DAY),MEAN(previous_application.DAYS_DECISION),MEAN(previous_application.SELLERPLACE_AREA),MEAN(previous_application.CNT_PAYMENT),MEAN(previous_application.DAYS_FIRST_DRAWING),MEAN(previous_application.DAYS_FIRST_DUE),MEAN(previous_application.DAYS_LAST_DUE_1ST_VERSION),MEAN(previous_application.DAYS_LAST_DUE),MEAN(previous_application.DAYS_TERMINATION),MEAN(previous_application.NFLAG_INSURED_ON_APPROVAL),SUM(previous_application.AMT_ANNUITY),SUM(previous_application.AMT_APPLICATION),SUM(previous_application.AMT_CREDIT),SUM(previous_application.AMT_GOODS_PRICE),SUM(previous_application.HOUR_APPR_PROCESS_START),SUM(previous_application.NFLAG_LAST_APPL_IN_DAY),SUM(previous_application.DAYS_DECISION),SUM(previous_application.SELLERPLACE_AREA),SUM(previous_application.CNT_PAYMENT),SUM(previous_application.DAYS_FIRST_DRAWING),SUM(previous_application.DAYS_FIRST_DUE),SUM(previous_application.DAYS_LAST_DUE_1ST_VERSION),SUM(previous_application.DAYS_LAST_DUE),SUM(previous_application.DAYS_TERMINATION),SUM(previous_application.NFLAG_INSURED_ON_APPROVAL),MODE(previous_application.NAME_CONTRACT_TYPE),MODE(previous_application.WEEKDAY_APPR_PROCESS_START),MODE(previous_application.FLAG_LAST_APPL_PER_CONTRACT),MODE(previous_application.NAME_CASH_LOAN_PURPOSE),MODE(previous_application.NAME_CONTRACT_STATUS),MODE(previous_application.NAME_PAYMENT_TYPE),MODE(previous_application.CODE_REJECT_REASON),MODE(previous_application.NAME_TYPE_SUITE),MODE(previous_application.NAME_CLIENT_TYPE),MODE(previous_application.NAME_GOODS_CATEGORY),MODE(previous_application.NAME_PORTFOLIO),MODE(previous_application.NAME_PRODUCT_TYPE),MODE(previous_application.CHANNEL_TYPE),MODE(previous_application.NAME_SELLER_INDUSTRY),MODE(previous_application.NAME_YIELD_GROUP),MODE(previous_application.PRODUCT_COMBINATION),MEAN(POS_CASH_balance.MONTHS_BALANCE),MEAN(POS_CASH_balance.CNT_INSTALMENT),MEAN(POS_CASH_balance.CNT_INSTALMENT_FUTURE),MEAN(POS_CASH_balance.SK_DPD),MEAN(POS_CASH_balance.SK_DPD_DEF),SUM(POS_CASH_balance.MONTHS_BALANCE),SUM(POS_CASH_balance.CNT_INSTALMENT),SUM(POS_CASH_balance.CNT_INSTALMENT_FUTURE),SUM(POS_CASH_balance.SK_DPD),SUM(POS_CASH_balance.SK_DPD_DEF),MODE(POS_CASH_balance.NAME_CONTRACT_STATUS),MEAN(credit_card_balance.MONTHS_BALANCE),MEAN(credit_card_balance.AMT_BALANCE),MEAN(credit_card_balance.AMT_CREDIT_LIMIT_ACTUAL),MEAN(credit_card_balance.AMT_DRAWINGS_ATM_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_OTHER_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_POS_CURRENT),MEAN(credit_card_balance.AMT_INST_MIN_REGULARITY),MEAN(credit_card_balance.AMT_PAYMENT_CURRENT),MEAN(credit_card_balance.AMT_PAYMENT_TOTAL_CURRENT),MEAN(credit_card_balance.AMT_RECEIVABLE_PRINCIPAL),MEAN(credit_card_balance.AMT_RECIVABLE),MEAN(credit_card_balance.AMT_TOTAL_RECEIVABLE),MEAN(credit_card_balance.CNT_DRAWINGS_ATM_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_OTHER_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_POS_CURRENT),MEAN(credit_card_balance.CNT_INSTALMENT_MATURE_CUM),MEAN(credit_card_balance.SK_DPD),MEAN(credit_card_balance.SK_DPD_DEF),SUM(credit_card_balance.MONTHS_BALANCE),SUM(credit_card_balance.AMT_BALANCE),SUM(credit_card_balance.AMT_CREDIT_LIMIT_ACTUAL),SUM(credit_card_balance.AMT_DRAWINGS_ATM_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_OTHER_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_POS_CURRENT),SUM(credit_card_balance.AMT_INST_MIN_REGULARITY),SUM(credit_card_balance.AMT_PAYMENT_CURRENT),SUM(credit_card_balance.AMT_PAYMENT_TOTAL_CURRENT),SUM(credit_card_balance.AMT_RECEIVABLE_PRINCIPAL),SUM(credit_card_balance.AMT_RECIVABLE),SUM(credit_card_balance.AMT_TOTAL_RECEIVABLE),SUM(credit_card_balance.CNT_DRAWINGS_ATM_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_OTHER_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_POS_CURRENT),SUM(credit_card_balance.CNT_INSTALMENT_MATURE_CUM),SUM(credit_card_balance.SK_DPD),SUM(credit_card_balance.SK_DPD_DEF),MODE(credit_card_balance.NAME_CONTRACT_STATUS),MEAN(installments_payments.NUM_INSTALMENT_VERSION),MEAN(installments_payments.NUM_INSTALMENT_NUMBER),MEAN(installments_payments.DAYS_INSTALMENT),MEAN(installments_payments.DAYS_ENTRY_PAYMENT),MEAN(installments_payments.AMT_INSTALMENT),MEAN(installments_payments.AMT_PAYMENT),SUM(installments_payments.NUM_INSTALMENT_VERSION),SUM(installments_payments.NUM_INSTALMENT_NUMBER),SUM(installments_payments.DAYS_INSTALMENT),SUM(installments_payments.DAYS_ENTRY_PAYMENT),SUM(installments_payments.AMT_INSTALMENT),SUM(installments_payments.AMT_PAYMENT)
count,1000,1000,1000,1000,999,1000,856,856,856,856,856,856,505,505,505,1000,1000,,1000,1000,1000,1000,1000,996,996,,512,512,512,0,997,791,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,,,1000,1000,521,521,521,1000,,1000,1000,511,511,511,,,,,,,996,996,,,1000,1000,1000,1000,1000,1000,1000,1000,531,,,521,521,521,1000,849,849,843,736,849,849,824,784,849,849,849,849,849,849,849,849,849,849,849,849,,,,308,308,,308,308,849,,3,6,6,3,6,6,6,6,3,2,2,2,2,2,2,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,,,,,,,,,,,,,,,,,7,6,6,7,7,7,7,7,7,7,,4,4,4,3,4,3,3,4,3,4,4,4,4,3,4,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,,22,22,22,22,22,22,22,22,22,22,22,22
mean,574.487,100575,27120.7,595306,536198,167660,0.00700935,0.00934579,0.231308,0.290888,0.036215,1.9007,0.112891,0.113557,0.109272,0.406,2.129,,-15872.7,55733.9,-2935.1,-980.529,-4887.02,0.126506,0.0873494,,0.141881,0.141796,0.137384,,0.515815,0.513224,0.997,0,0.003,0,0.002,0.002,0.001,0.01,0,0.005,0,0,0,0,0.723,0,0.017,0.066,0,0.085,0.004,0.064,0.842,1,,,0.297,0.212,0.228145,0.227854,0.224655,11.975,,0.193,0.045,0.10491,0.106562,0.103349,,,,,,,1.31024,1.29317,,,0.0211324,2.042,2.016,0.084,0.25,0.018,0.057,0.07,0.100453,,,0.979986,0.980565,0.977572,0,-1070.37,0.849715,689.019,-958.006,0.0094701,370752,171613,5719,343.31,-533.221,-5936.59,3.04947,2426.86,-3309.96,0.0471143,1.67904e+06,573055,23144.9,686.155,-3073.34,,,,-23.3826,-3959.53,,-20.6692,-707.563,-41.7173,,38793.2,179489,179309,358978,14.3333,1,-1093.17,5,9.33333,365243,-1439,-1199,-1304,-1298,0.5,19396.6,179489,179309,179489,14.3333,1,-1093.17,5,4.66667,121748,-479.667,-399.667,-434.667,-432.667,0.166667,,,,,,,,,,,,,,,,,-27.2857,29.3333,17,0,0,-27.2857,25.1429,14.5714,0,0,,-3.75,60071.4,78750,36000,27000,0,0,1353.75,4987.43,1702.79,56626.7,57351.1,57351.1,2,1.5,0,0,8.5,0,0,-3.75,60071.4,78750,27000,27000,0,0,1353.75,3740.57,1702.79,56626.7,57351.1,57351.1,1.5,1.5,0,0,8.5,0,0,,1.36364,20.7273,-708.318,-715.182,41284.1,41230.9,1.36364,20.7273,-708.318,-715.182,41284.1,41230.9
std,331.665,331.665,14278.9,388475,359636,90167.6,0.118262,0.0962771,0.750984,0.649398,0.204846,1.90369,0.0978007,0.0987055,0.0971603,0.713914,0.91826,,4235.85,134159,1514.75,832.251,3526.75,0.396036,0.322367,,0.0854588,0.0859149,0.0866362,,0.195964,0.199838,0.0547174,0,0.0547174,0,0.044699,0.044699,0.0316228,0.0995485,0,0.070569,0,0,0,0,0.44774,0,0.129336,0.248406,0,0.279021,0.0631505,0.244875,0.364924,0,,,0.457165,0.408929,0.14787,0.148202,0.147687,3.30413,,0.39485,0.207408,0.106065,0.108038,0.109026,,,,,,,2.19573,2.17579,,,0.0140328,0.492421,0.481639,0.277527,0.433229,0.133018,0.231959,0.255275,0.10566,,,0.0273775,0.0233593,0.0614623,0,561.16,14.4126,3506.19,525.326,0.0666174,680134,502785,25691.8,9323.14,427.905,5515.12,51.7931,11453.5,3573.59,0.257243,2.19184e+06,1.04932e+06,89662.6,18624.1,3289.19,,,,13.2944,4649.86,,12.6452,664.188,88.3788,,54557,387617,387707,528175,3.38625,0,1240.81,14.6969,3.05505,0,1306.73,1434.01,1285.52,1285.52,0.707107,40522.3,387617,387707,387617,3.38625,0,1240.81,14.6969,5.46504,188611,945.358,891.425,885.413,883.059,0.408248,,,,,,,,,,,,,,,,,20.4427,17.4203,7.34847,0,0,20.4427,19.3858,9.28901,0,0,,4.19325,120143,129253,62353.8,54000,0,0,2707.49,8135.83,3248.52,113253,114702,114702,3.4641,3,0,0,12.7671,0,0,4.19325,120143,129253,54000,54000,0,0,2707.49,7095.52,3248.52,113253,114702,114702,3,3,0,0,12.7671,0,0,,1.52894,32.4422,754.644,755.625,92883.3,92889.3,1.52894,32.4422,754.644,755.625,92883.3,92889.3
min,1,100002,4504.5,47970,45000,31500,0,0,0,0,0,0,0,0,0,0,1,,-25104,-15632,-6223,-3409,-17298,0,0,,0,0,0,,0.0028123,0.000527265,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,,,0,0,0,0,0,1,,0,0,0,0,0,,,,,,,0,0,,,0.001333,1,1,0,0,0,0,0,0,,,0.4933,0.4933,0,0,-2922,0,-2687,-2723,0,0,-568.57,0,0,-2713,-37221,0,-17713,-20020,0,0,-5117.13,0,0,-20348,,,,-71.5,-25427,,-71.5,-3160,-701.5,,3672.95,0,0,19435.5,9,1,-2910,-1,6,365243,-2363,-2213,-2213,-2207,0,0,0,0,0,9,1,-2910,-1,0,0,-2363,-2213,-2213,-2207,0,,,,,,,,,,,,,,,,,-65,10,9,0,0,-65,0,0,0,0,,-10,0,0,0,0,0,0,0,238.5,0,0,0,0,0,0,0,0,0,0,0,-10,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,0,1,-2560,-2575,431.64,431.64,0,1,-2560,-2575,431.64,431.64
25%,288.75,100290,16603.9,273584,238500,112500,0,0,0,0,0,0,0.0567,0.0573,0.0504,0,2,,-19229,-2724,-4257.25,-1594.75,-7223.5,0,0,,0.069,0.069,0.069,,0.378174,0.374866,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,,,0,0,0.1667,0.1667,0.1667,10,,0,0,0.0452,0.046,0.0433,,,,,,,0,0,,,0.010006,2,2,0,0,0,0,0,0.0409,,,0.9767,0.9767,0.9762,0,-1402.5,0,-665.333,-1293.75,0,102210,0,0,0,-742.5,-8763,0,-2687,-4925,0,346080,0,0,0,-4593,,,,-32.6721,-5774,,-28.6111,-1010.92,-37.5,,7366.97,0,0,54717.8,12.5,1,-1946,-1,8,365243,-1901,-1706,-1758.5,-1752.5,0.25,0,0,0,0,12.5,1,-1946,-1,0,0,-386.25,-138.75,-296.25,-291.75,0,,,,,,,,,,,,,,,,,-37.5,13.5,10.75,0,0,-37.5,10,9.5,0,0,,-4,0,0,0,0,0,0,0,290.295,0,0,0,0,0,0,0,0,0,0,0,-4,0,0,0,0,0,0,0,178.875,0,0,0,0,0,0,0,0,0,0,0,,1,5,-1049.75,-1075,9961.44,9961.44,1,5,-1049.75,-1075,9961.44,9961.44
50%,575.5,100576,25371,516514,450000,144000,0,0,0,0,0,1,0.0835,0.0833,0.084,0,2,,-15743,-1267,-3164,-757.5,-4502.5,0,0,,0.1379,0.1379,0.1379,,0.571331,0.533482,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,0,0,0.1667,0.1667,0.1667,12,,0,0,0.0703,0.0716,0.0689,,,,,,,0,0,,,0.01885,2,2,0,0,0,0,0,0.0645,,,0.9816,0.9816,0.9816,0,-1033,0,-148.278,-908,0,192249,49281.5,0,0,-479,-4288,0,-452,-2033,0,865581,178711,0,0,-1868,,,,-23.4194,-2106.5,,-19.7542,-518.795,0,,11061,9717.75,9177.75,90000,15,1,-529.5,-1,10,365243,-1439,-1199,-1304,-1298,0.5,1836.47,9717.75,9177.75,9717.75,15,1,-529.5,-1,3,0,0,0,0,0,0,,,,,,,,,,,,,,,,,-17,30,17,0,0,-17,24,13,0,0,,-2,0,22500,0,0,0,0,0,342.09,119.25,0,0,0,0,0,0,0,3.5,0,0,-2,0,22500,0,0,0,0,0,290.295,119.25,0,0,0,0,0,0,0,3.5,0,0,,1,6,-333.5,-339.5,18888.7,18888.7,1,6,-333.5,-339.5,18888.7,18888.7
75%,861.25,100862,34103.2,808650,679500,202500,0,0,0,0,0,3,0.1464,0.1447,0.1429,1,2.25,,-12326.5,-304,-1601.75,-270.5,-1866.5,0,0,,0.1724,0.1724,0.1724,,0.668243,0.67383,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,1,0,0.3333,0.3333,0.3333,14.25,,0,0,0.1268,0.129,0.12195,,,,,,,2,2,,,0.028663,2,2,0,0.25,0,0,0,0.1273,,,0.9871,0.9871,0.9871,0,-643.625,0,594.5,-573.125,0,383655,147368,0,0,-217.667,-1725,0,1563,-596,0,2.05505e+06,670533,0,0,-582,,,,-12.4414,-518.5,,-10.8833,-161.979,0,,56353.3,72358.9,72088.9,528750,16.75,1,-207.25,-1,11,365243,-977,-692,-849.5,-843.5,0.75,9213.99,72358.9,72088.9,72358.9,16.75,1,-207.25,-1,9,273932,0,0,0,0,0,,,,,,,,,,,,,,,,,-12,45,21.75,0,0,-12,42,21.5,0,0,,-1.75,60071.4,101250,54000,27000,0,0,1353.75,7361.89,1822.04,56626.7,57351.1,57351.1,3,1.5,0,0,12,0,0,-1.75,60071.4,101250,27000,27000,0,0,1353.75,3851.99,1822.04,56626.7,57351.1,57351.1,1.5,1.5,0,0,12,0,0,,1,18,-222.5,-227.25,27813.8,30811.6,1,18,-222.5,-227.25,27813.8,30811.6
max,1155,101156,116266,2.28621e+06,2.25e+06,765000,3,1,9,4,3,9,0.6639,0.6703,0.6765,3,5,,-7705,365243,-1,0,-3,4,3,,0.6207,0.6207,0.6207,,0.815114,0.865896,1,0,1,0,1,1,1,1,0,1,0,0,0,0,1,0,1,1,0,1,1,1,1,1,,,1,1,1,1,1,22,,1,1,0.7641,0.7778,0.7961,,,,,,,14,14,,,0.072508,3,3,1,1,1,1,1,0.7628,,,0.9995,0.9995,0.9995,0,-8,393,31084,-23.3333,1,1.035e+07,1.00489e+07,450000,271017,0,-8,1272,62168,0,3,2.07e+07,1.00489e+07,810000,542034,0,,,,-0.5,-1,,-0.5,-1,0,,101646,967500,967500,967500,18,1,-72,35,12,365243,-515,-185,-395,-389,1,101646,967500,967500,967500,18,1,-72,35,12,365243,0,0,0,0,1,,,,,,,,,,,,,,,,,-10,48,27,0,0,-10,48,27,0,0,,-1,240286,270000,108000,108000,0,0,5414.98,14381.7,6572.65,226507,229404,229404,6,6,0,0,27,0,0,-1,240286,270000,108000,108000,0,0,5414.98,14381.7,6572.65,226507,229404,229404,6,6,0,0,27,0,0,,6,113,-48,-48,447330,447330,6,113,-48,-48,447330,447330
counts,1000,1000,1000,1000,999,1000,856,856,856,856,856,856,505,505,505,1000,1000,1000,1000,1000,1000,1000,1000,996,996,538,512,512,512,0,997,791,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,521,521,521,1000,514,1000,1000,511,511,511,1000,1000,1000,1000,1000,998,996,996,714,1000,1000,1000,1000,1000,1000,1000,1000,1000,531,506,1000,521,521,521,1000,849,849,843,736,849,849,824,784,849,849,849,849,849,849,849,849,849,849,849,849,849,849,849,308,308,308,308,308,849,308,3,6,6,3,6,6,6,6,3,2,2,2,2,2,2,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,1,6,6,6,6,6,6,6,6,7,6,6,7,7,7,7,7,7,7,7,4,4,4,3,4,3,3,4,3,4,4,4,4,3,4,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,22,22,22,22,22,22,22,22,22,22,22,22
uniques,1000,1000,793,458,186,94,3,2,9,5,3,10,218,199,185,4,5,2,975,773,894,737,943,5,4,2,38,24,18,0,983,368,2,1,2,1,2,2,2,2,1,2,1,1,1,1,2,1,2,2,1,2,2,2,2,1,2,2,2,2,40,28,20,21,3,2,2,452,449,453,2,4,5,6,4,7,15,15,18,50,77,3,3,2,2,2,2,2,445,7,7,86,85,86,1,823,13,830,711,20,815,613,163,13,787,814,13,824,714,4,814,612,157,13,766,2,1,5,288,293,3,245,293,220,5,3,4,4,3,6,1,6,2,3,1,2,2,2,2,2,4,4,4,4,6,1,6,2,4,2,3,3,3,3,2,2,5,1,2,3,2,2,1,2,2,3,2,2,3,3,4,6,4,6,1,1,6,5,7,1,1,2,3,2,3,2,2,1,1,2,3,3,2,2,2,2,2,1,1,3,1,1,3,2,3,2,2,1,1,2,4,3,2,2,2,2,2,1,1,3,1,1,1,6,14,21,21,22,21,6,14,21,21,22,21


In [220]:
test = pd.read_feather(f'{PATH}tmp/test_all_tables')

  return feather.read_dataframe(path, nthreads=nthreads)


In [221]:
with pd.option_context("display.max_rows", 1000, "display.max_columns", 1000):
    display(DataFrameSummary(test).summary())

Unnamed: 0,index,SK_ID_CURR,AMT_ANNUITY,AMT_CREDIT,AMT_GOODS_PRICE,AMT_INCOME_TOTAL,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_YEAR,APARTMENTS_AVG,APARTMENTS_MEDI,APARTMENTS_MODE,CNT_CHILDREN,CNT_FAM_MEMBERS,CODE_GENDER,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_ID_PUBLISH,DAYS_LAST_PHONE_CHANGE,DAYS_REGISTRATION,DEF_30_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,EMERGENCYSTATE_MODE,ENTRANCES_AVG,ENTRANCES_MEDI,ENTRANCES_MODE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,FLAG_CONT_MOBILE,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_2,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_EMAIL,FLAG_EMP_PHONE,FLAG_MOBIL,FLAG_OWN_CAR,FLAG_OWN_REALTY,FLAG_PHONE,FLAG_WORK_PHONE,FLOORSMAX_AVG,FLOORSMAX_MEDI,FLOORSMAX_MODE,HOUR_APPR_PROCESS_START,HOUSETYPE_MODE,LIVE_CITY_NOT_WORK_CITY,LIVE_REGION_NOT_WORK_REGION,LIVINGAREA_AVG,LIVINGAREA_MEDI,LIVINGAREA_MODE,NAME_CONTRACT_TYPE,NAME_EDUCATION_TYPE,NAME_FAMILY_STATUS,NAME_HOUSING_TYPE,NAME_INCOME_TYPE,NAME_TYPE_SUITE,OBS_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,OCCUPATION_TYPE,ORGANIZATION_TYPE,REGION_POPULATION_RELATIVE,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,TARGET,TOTALAREA_MODE,WALLSMATERIAL_MODE,WEEKDAY_APPR_PROCESS_START,YEARS_BEGINEXPLUATATION_AVG,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BEGINEXPLUATATION_MODE,is_test,MEAN(bureau.DAYS_CREDIT),MEAN(bureau.CREDIT_DAY_OVERDUE),MEAN(bureau.DAYS_CREDIT_ENDDATE),MEAN(bureau.DAYS_ENDDATE_FACT),MEAN(bureau.CNT_CREDIT_PROLONG),MEAN(bureau.AMT_CREDIT_SUM),MEAN(bureau.AMT_CREDIT_SUM_DEBT),MEAN(bureau.AMT_CREDIT_SUM_LIMIT),MEAN(bureau.AMT_CREDIT_SUM_OVERDUE),MEAN(bureau.DAYS_CREDIT_UPDATE),SUM(bureau.DAYS_CREDIT),SUM(bureau.CREDIT_DAY_OVERDUE),SUM(bureau.DAYS_CREDIT_ENDDATE),SUM(bureau.DAYS_ENDDATE_FACT),SUM(bureau.CNT_CREDIT_PROLONG),SUM(bureau.AMT_CREDIT_SUM),SUM(bureau.AMT_CREDIT_SUM_DEBT),SUM(bureau.AMT_CREDIT_SUM_LIMIT),SUM(bureau.AMT_CREDIT_SUM_OVERDUE),SUM(bureau.DAYS_CREDIT_UPDATE),MODE(bureau.CREDIT_ACTIVE),MODE(bureau.CREDIT_CURRENCY),MODE(bureau.CREDIT_TYPE),MEAN(bureau_balance.MONTHS_BALANCE),SUM(bureau_balance.MONTHS_BALANCE),MODE(bureau_balance.STATUS),MEAN(bureau.MEAN(bureau_balance.MONTHS_BALANCE)),MEAN(bureau.SUM(bureau_balance.MONTHS_BALANCE)),SUM(bureau.MEAN(bureau_balance.MONTHS_BALANCE)),MODE(bureau.MODE(bureau_balance.STATUS)),MEAN(previous_application.AMT_ANNUITY),MEAN(previous_application.AMT_APPLICATION),MEAN(previous_application.AMT_CREDIT),MEAN(previous_application.AMT_GOODS_PRICE),MEAN(previous_application.HOUR_APPR_PROCESS_START),MEAN(previous_application.NFLAG_LAST_APPL_IN_DAY),MEAN(previous_application.DAYS_DECISION),MEAN(previous_application.SELLERPLACE_AREA),MEAN(previous_application.CNT_PAYMENT),MEAN(previous_application.DAYS_FIRST_DRAWING),MEAN(previous_application.DAYS_FIRST_DUE),MEAN(previous_application.DAYS_LAST_DUE_1ST_VERSION),MEAN(previous_application.DAYS_LAST_DUE),MEAN(previous_application.DAYS_TERMINATION),MEAN(previous_application.NFLAG_INSURED_ON_APPROVAL),SUM(previous_application.AMT_ANNUITY),SUM(previous_application.AMT_APPLICATION),SUM(previous_application.AMT_CREDIT),SUM(previous_application.AMT_GOODS_PRICE),SUM(previous_application.HOUR_APPR_PROCESS_START),SUM(previous_application.NFLAG_LAST_APPL_IN_DAY),SUM(previous_application.DAYS_DECISION),SUM(previous_application.SELLERPLACE_AREA),SUM(previous_application.CNT_PAYMENT),SUM(previous_application.DAYS_FIRST_DRAWING),SUM(previous_application.DAYS_FIRST_DUE),SUM(previous_application.DAYS_LAST_DUE_1ST_VERSION),SUM(previous_application.DAYS_LAST_DUE),SUM(previous_application.DAYS_TERMINATION),SUM(previous_application.NFLAG_INSURED_ON_APPROVAL),MODE(previous_application.NAME_CONTRACT_TYPE),MODE(previous_application.WEEKDAY_APPR_PROCESS_START),MODE(previous_application.FLAG_LAST_APPL_PER_CONTRACT),MODE(previous_application.NAME_CASH_LOAN_PURPOSE),MODE(previous_application.NAME_CONTRACT_STATUS),MODE(previous_application.NAME_PAYMENT_TYPE),MODE(previous_application.CODE_REJECT_REASON),MODE(previous_application.NAME_TYPE_SUITE),MODE(previous_application.NAME_CLIENT_TYPE),MODE(previous_application.NAME_GOODS_CATEGORY),MODE(previous_application.NAME_PORTFOLIO),MODE(previous_application.NAME_PRODUCT_TYPE),MODE(previous_application.CHANNEL_TYPE),MODE(previous_application.NAME_SELLER_INDUSTRY),MODE(previous_application.NAME_YIELD_GROUP),MODE(previous_application.PRODUCT_COMBINATION),MEAN(POS_CASH_balance.MONTHS_BALANCE),MEAN(POS_CASH_balance.CNT_INSTALMENT),MEAN(POS_CASH_balance.CNT_INSTALMENT_FUTURE),MEAN(POS_CASH_balance.SK_DPD),MEAN(POS_CASH_balance.SK_DPD_DEF),SUM(POS_CASH_balance.MONTHS_BALANCE),SUM(POS_CASH_balance.CNT_INSTALMENT),SUM(POS_CASH_balance.CNT_INSTALMENT_FUTURE),SUM(POS_CASH_balance.SK_DPD),SUM(POS_CASH_balance.SK_DPD_DEF),MODE(POS_CASH_balance.NAME_CONTRACT_STATUS),MEAN(credit_card_balance.MONTHS_BALANCE),MEAN(credit_card_balance.AMT_BALANCE),MEAN(credit_card_balance.AMT_CREDIT_LIMIT_ACTUAL),MEAN(credit_card_balance.AMT_DRAWINGS_ATM_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_OTHER_CURRENT),MEAN(credit_card_balance.AMT_DRAWINGS_POS_CURRENT),MEAN(credit_card_balance.AMT_INST_MIN_REGULARITY),MEAN(credit_card_balance.AMT_PAYMENT_CURRENT),MEAN(credit_card_balance.AMT_PAYMENT_TOTAL_CURRENT),MEAN(credit_card_balance.AMT_RECEIVABLE_PRINCIPAL),MEAN(credit_card_balance.AMT_RECIVABLE),MEAN(credit_card_balance.AMT_TOTAL_RECEIVABLE),MEAN(credit_card_balance.CNT_DRAWINGS_ATM_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_OTHER_CURRENT),MEAN(credit_card_balance.CNT_DRAWINGS_POS_CURRENT),MEAN(credit_card_balance.CNT_INSTALMENT_MATURE_CUM),MEAN(credit_card_balance.SK_DPD),MEAN(credit_card_balance.SK_DPD_DEF),SUM(credit_card_balance.MONTHS_BALANCE),SUM(credit_card_balance.AMT_BALANCE),SUM(credit_card_balance.AMT_CREDIT_LIMIT_ACTUAL),SUM(credit_card_balance.AMT_DRAWINGS_ATM_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_OTHER_CURRENT),SUM(credit_card_balance.AMT_DRAWINGS_POS_CURRENT),SUM(credit_card_balance.AMT_INST_MIN_REGULARITY),SUM(credit_card_balance.AMT_PAYMENT_CURRENT),SUM(credit_card_balance.AMT_PAYMENT_TOTAL_CURRENT),SUM(credit_card_balance.AMT_RECEIVABLE_PRINCIPAL),SUM(credit_card_balance.AMT_RECIVABLE),SUM(credit_card_balance.AMT_TOTAL_RECEIVABLE),SUM(credit_card_balance.CNT_DRAWINGS_ATM_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_OTHER_CURRENT),SUM(credit_card_balance.CNT_DRAWINGS_POS_CURRENT),SUM(credit_card_balance.CNT_INSTALMENT_MATURE_CUM),SUM(credit_card_balance.SK_DPD),SUM(credit_card_balance.SK_DPD_DEF),MODE(credit_card_balance.NAME_CONTRACT_STATUS),MEAN(installments_payments.NUM_INSTALMENT_VERSION),MEAN(installments_payments.NUM_INSTALMENT_NUMBER),MEAN(installments_payments.DAYS_INSTALMENT),MEAN(installments_payments.DAYS_ENTRY_PAYMENT),MEAN(installments_payments.AMT_INSTALMENT),MEAN(installments_payments.AMT_PAYMENT),SUM(installments_payments.NUM_INSTALMENT_VERSION),SUM(installments_payments.NUM_INSTALMENT_NUMBER),SUM(installments_payments.DAYS_INSTALMENT),SUM(installments_payments.DAYS_ENTRY_PAYMENT),SUM(installments_payments.AMT_INSTALMENT),SUM(installments_payments.AMT_PAYMENT)
count,1000,1000,999,1000,1000,1000,887,887,887,887,887,887,501,501,501,1000,1000,,1000,1000,1000,1000,1000,1000,1000,,509,509,509,580,1000,835,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,,,1000,1000,515,515,515,1000,,1000,1000,504,504,504,,,,,,,1000,1000,,,1000,1000,1000,1000,1000,1000,1000,0,524,,,520,520,520,1000,877,877,865,777,877,877,854,795,877,877,877,877,877,877,877,877,877,877,877,877,,,,877,877,,877,877,877,,6,7,7,6,7,7,7,7,6,4,4,4,4,4,4,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,,,,,,,,,,,,,,,,,7,7,7,7,7,7,7,7,7,7,,7,7,7,5,7,5,5,7,5,7,7,7,7,5,7,5,5,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,,20,20,20,20,20,20,20,20,20,20,20,20
mean,1424.51,103466,28673.9,500326,446808,170785,0.0011274,0.00338219,0.00676437,0.529876,0.0011274,1.95265,0.117108,0.117827,0.115145,0.439,2.209,,-15819.8,64526.7,-2965.32,-1036.08,-4979.52,0.166,0.116,,0.146517,0.146056,0.142601,0.496241,0.515728,0.494265,0.999,0,0.002,0,0,0,0,0,0,0.001,0,0,0,0,0.802,0,0.014,0.084,0,0.083,0.004,0.161,0.818,1,,,0.258,0.209,0.2242,0.223512,0.219831,11.884,,0.171,0.031,0.10429,0.105685,0.104227,,,,,,,1.517,1.498,,,0.0206269,2.074,2.055,0.078,0.221,0.025,0.045,,0.101518,,,0.979711,0.979715,0.979482,1,-1064.34,1.40397,799.501,-920.72,0.0004561,388300,163793,6702.57,3.39961,-504.601,-6569.52,6.28848,3894.85,-3650.93,0.00342075,2.15631e+06,686508,18723.3,68.1856,-3226.17,,,,-21.5296,-5810.86,,-17.2794,-925.85,-106.654,,26880.2,706060,677454,823737,13.4286,1,-1101.86,6006.57,37.6667,365243,-1518,-483,-1045.5,-1041.25,0.25,23040.1,706060,677454,706060,13.4286,1,-1101.86,6006.57,32.2857,208710,-867.429,-276,-597.429,-595,0.142857,,,,,,,,,,,,,,,,,-18.2857,14.2857,10.2857,0,0,-18.2857,14.2857,10.2857,0,0,,-16.7143,26503,61071.4,450,321.429,0,0,1285.71,2093.65,1451.57,25538.2,26493.4,26493.4,0.2,0.142857,0,0,21.8571,0,0,-16.7143,26503,61071.4,321.429,321.429,0,0,1285.71,1495.47,1451.57,25538.2,26493.4,26493.4,0.142857,0.142857,0,0,21.8571,0,0,,0.9,30,-891.5,-901.35,15808.5,15065.8,0.9,30,-891.5,-901.35,15808.5,15065.8
std,442.378,1984.3,15527.7,348833,322985,90814.4,0.0335767,0.0580909,0.0820134,0.692558,0.0335767,1.78216,0.114398,0.115289,0.115688,0.743527,0.917693,,4392.97,141931,1588.54,851.176,3532.02,0.482366,0.390764,,0.109228,0.109469,0.110763,0.202233,0.18304,0.183508,0.0316228,0,0.044699,0,0,0,0,0,0,0.0316228,0,0,0,0,0.398692,0,0.117549,0.277527,0,0.27602,0.0631505,0.367715,0.386038,0,,,0.437753,0.406798,0.144957,0.144231,0.143159,3.28075,,0.376697,0.173404,0.111886,0.113736,0.114032,,,,,,,2.47302,2.44663,,,0.0137548,0.508707,0.504211,0.268306,0.415128,0.156203,0.207408,,0.108354,,,0.0437848,0.0437929,0.0437919,0,530.183,26.3353,3499.97,506.109,0.00826347,560917,410888,26434.4,55.2187,403.767,6049.68,115.627,14902.7,4152.94,0.0584204,3.0363e+06,1.30487e+06,68332.6,1758.74,3552.45,,,,10.0841,6390.29,,8.69614,783.023,98.5137,,18760.3,804814,794042,812988,2.82,0,1001.45,15008.1,24.9292,0,1114.97,1400.09,999.291,998.978,0.5,19912.6,804814,794042,804814,2.82,0,1001.45,15008.1,26.8435,195231,1131.35,1023.12,900.887,899.306,0.377964,,,,,,,,,,,,,,,,,10.9957,15.2503,12.3655,0,0,10.9957,15.2503,12.3655,0,0,,16.1216,70120.5,78711.7,1006.23,850.42,0,0,3401.68,3888.84,3356.55,67567.7,70095,70095,0.447214,0.377964,0,0,24.2791,0,0,16.1216,70120.5,78711.7,850.42,850.42,0,0,3401.68,3335.53,3356.55,67567.7,70095,70095,0.377964,0.377964,0,0,24.2791,0,0,,0.91191,42.5849,731.366,731.699,18807.6,19110.3,0.91191,42.5849,731.366,731.699,18807.6,19110.3
min,0,100001,4509,45000,45000,36000,0,0,0,0,0,0,0.001,0.001,0.0011,0,1,,-24975,-14880,-6091,-3887,-17043,0,0,,0,0,0,0.0378966,0.0029755,0.000527265,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,,,0,0,0,0,0,2,,0,0,0,0,0,,,,,,,0,0,,,0.001276,1,1,0,0,0,0,,0.0009,,,0,0,0,1,-2921,0,-2624,-2618,0,0,0,0,0,-2618,-43985,0,-26762,-30343,0,0,0,0,0,-26711,,,,-47.5,-40512,,-47.5,-4560,-715.5,,3506.31,0,0,43425,8,1,-2702,-1,10,365243,-2671,-2401,-2491,-2487,0,0,0,0,0,8,1,-2702,-1,0,0,-2671,-2401,-2491,-2487,0,,,,,,,,,,,,,,,,,-42,4,0,0,0,-42,4,0,0,0,,-43,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-43,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,0,2,-2622,-2634,68.31,68.31,0,2,-2622,-2634,68.31,68.31
25%,1249.75,101681,17790.8,257391,225000,112500,0,0,0,0,0,0,0.0536,0.0541,0.0504,0,2,,-19464,-2806.75,-4387.25,-1685.75,-7455.75,0,0,,0.069,0.069,0.069,0.340655,0.404166,0.359782,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,0,0,0.1667,0.1667,0.1667,10,,0,0,0.04415,0.044475,0.041725,,,,,,,0,0,,,0.010006,2,2,0,0,0,0,,0.0401,,,0.9767,0.9767,0.9762,1,-1407,0,-619,-1226.67,0,106012,1331.1,0,0,-731.25,-9226,0,-2497,-5098,0,393016,0,0,0,-4611,,,,-29.1841,-8042,,-22.9,-1331.12,-149.5,,17804.3,107866,86274,241731,12.5,1,-1647,-1,15,365243,-2341.75,-946.75,-1216.75,-1210.5,0,9628.88,107866,86274,107866,12.5,1,-1647,-1,11,0,-1544,-231,-749,-743.5,0,,,,,,,,,,,,,,,,,-18,6,2,0,0,-18,6,2,0,0,,-25,0,0,0,0,0,0,0,69.39,0,0,0,0,0,0,0,0,0,0,0,-25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,0,6,-1403,-1409.75,6830.23,3645.07,0,6,-1403,-1409.75,6830.23,3645.07
50%,1499.5,103479,25488,446031,366750,157500,0,0,0,0,0,2,0.0918,0.0916,0.084,0,2,,-15450.5,-1325,-3102,-846.5,-4570,0,0,,0.1379,0.1379,0.1379,0.50112,0.56591,0.513694,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,0,0,0.1667,0.1667,0.1667,12,,0,0,0.07585,0.0775,0.0754,,,,,,,0,0,,,0.01885,2,2,0,0,0,0,,0.0712,,,0.9821,0.9821,0.9816,1,-1023.33,0,-86,-870,0,211208,51309,0,0,-446.333,-4887,0,-209,-2290,0,1.15461e+06,225000,0,0,-2085,,,,-21.9291,-3782,,-16.6818,-768.4,-79,,25325.4,450000,491580,675000,14,1,-887,-1,42,365243,-1544,-222.5,-749,-743.5,0,23962.9,450000,491580,450000,14,1,-887,-1,24,365243,-313,0,-193,-191,0,,,,,,,,,,,,,,,,,-17,12,9,0,0,-17,12,9,0,0,,-12,0,0,0,0,0,0,0,237.87,0,0,0,0,0,0,0,0,28,0,0,-12,0,0,0,0,0,0,0,69.39,0,0,0,0,0,0,0,0,28,0,0,,1,10,-794,-801.5,11224.2,9391.3,1,10,-794,-801.5,11224.2,9391.3
75%,1749.25,105196,35685,644222,585000,202500,0,0,0,1,0,3,0.1464,0.1478,0.1439,1,3,,-12131.2,-311.5,-1625.25,-358.75,-1966.25,0,0,,0.2069,0.2069,0.2069,0.660101,0.651456,0.634706,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,,,1,0,0.3333,0.3333,0.3333,14,,0,0,0.123,0.1252,0.12465,,,,,,,2,2,,,0.028663,2,2,0,0,0,0,,0.121625,,,0.9866,0.9866,0.9866,1,-683.6,0,719.5,-549.5,0,450900,168535,0,0,-174.25,-2132,0,1865,-726,0,2.56723e+06,838976,0,0,-610,,,,-13.8103,-1131,,-11,-318,-34.5,,30685.1,1.01334e+06,914026,1.07002e+06,15.5,1,-324.5,1025,60,365243,-720.25,241.25,-577.75,-574.25,0.25,29352.7,1.01334e+06,914026,1.01334e+06,15.5,1,-324.5,1025,60,365243,0,8.5,0,0,0,,,,,,,,,,,,,,,,,-11.5,12,11.5,0,0,-11.5,12,11.5,0,0,,-5,0,123750,0,0,0,0,0,1161,580.5,0,0,0,0,0,0,0,29.5,0,0,-5,0,123750,0,0,0,0,0,699.435,580.5,0,0,0,0,0,0,0,29.5,0,0,,1,26.5,-313.75,-322.5,15494.8,15494.8,1,26.5,-313.75,-322.5,15494.8,15494.8
max,1999,106861,103455,2.1564e+06,1.8e+06,1.35e+06,1,1,1,5,1,9,1,1,1,8,10,,-7779,365243,-1,0,-5,4,4,,1,1,1,0.903545,0.855,0.843544,1,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,1,1,0,1,1,1,1,1,,,1,1,0.875,0.875,0.875,23,,1,1,1,1,1,,,,,,,23,23,,,0.072508,3,3,1,1,1,1,,1,,,0.9995,0.9995,0.9995,1,-17,619,30909,-6,0.2,6.26104e+06,5.63903e+06,271746,1527.62,-1,-17,2476,112067,0,1,3.60384e+07,1.50118e+07,670500,51939,-1,,,,0,0,,0,0,0,,59355,2.25e+06,2.25e+06,2.25e+06,16,1,-181,40000,60,365243,-313,914,-193,-191,1,59355,2.25e+06,2.25e+06,2.25e+06,16,1,-181,40000,60,365243,0,914,0,0,1,,,,,,,,,,,,,,,,,-10,48,36,0,0,-10,48,36,0,0,,-2,185521,180000,2250,2250,0,0,9000,9000,9000,178767,185454,185454,1,1,0,0,66,0,0,-2,185521,180000,2250,2250,0,0,9000,9000,9000,178767,185454,185454,1,1,0,0,66,0,0,,3,153,-143,-161,83637.7,83637.7,3,153,-143,-161,83637.7,83637.7
counts,1000,1000,999,1000,1000,1000,887,887,887,887,887,887,501,501,501,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,532,509,509,509,580,1000,835,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,515,515,515,1000,504,1000,1000,504,504,504,1000,1000,1000,1000,1000,984,1000,1000,682,1000,1000,1000,1000,1000,1000,1000,1000,0,524,503,1000,520,520,520,1000,877,877,865,777,877,877,854,795,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,877,6,7,7,6,7,7,7,7,6,4,4,4,4,4,4,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,5,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,5,7,5,5,7,5,7,7,7,7,5,7,5,5,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,20,20,20,20,20,20,20,20,20,20,20,20
uniques,1000,1000,744,421,168,85,2,2,2,6,2,10,211,200,190,6,7,2,978,744,913,733,936,5,5,2,39,24,18,580,990,373,2,1,2,1,1,1,1,1,1,2,1,1,1,1,2,1,2,2,1,2,2,2,2,1,2,2,2,2,35,22,18,21,3,2,2,446,447,444,2,4,5,6,4,7,17,19,18,45,77,3,3,2,2,2,2,0,459,7,7,74,75,75,1,856,12,846,744,3,842,645,168,13,818,845,11,836,737,2,840,645,165,13,799,2,1,6,797,778,3,543,787,422,4,6,7,7,6,6,1,7,4,4,1,4,4,4,4,2,7,7,7,7,6,1,7,4,5,2,5,5,5,5,2,2,6,1,2,3,2,2,3,2,3,4,3,4,4,4,7,6,4,6,1,1,6,4,6,1,1,2,6,2,4,2,2,1,1,2,5,3,2,2,2,2,2,1,1,5,1,1,6,2,4,2,2,1,1,2,5,3,2,2,2,2,2,1,1,5,1,1,1,4,13,20,20,20,20,4,13,20,20,20,20
