# Home Credit Feature Transformation

In [7]:
import numpy as np
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
from scipy.stats import iqr, randint, uniform
import lightgbm as lgb
from sklearn.tree import DecisionTreeClassifier
from sklearn.ensemble import RandomForestClassifier
from sklearn.linear_model import LogisticRegressionCV, LogisticRegression
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
from sklearn.random_projection import GaussianRandomProjection
from sklearn.svm import LinearSVC
from sklearn.naive_bayes import GaussianNB
from sklearn.decomposition import PCA, FastICA
from sklearn.preprocessing import Imputer, StandardScaler, RobustScaler, QuantileTransformer
from sklearn.model_selection import RandomizedSearchCV, GridSearchCV, train_test_split, cross_val_score, StratifiedKFold
from sklearn.cluster import KMeans
from sklearn.metrics import roc_auc_score
from sklearn.feature_selection import SelectKBest, f_classif
from skopt import gp_minimize
from skopt.plots import plot_convergence, plot_objective
from IPython.display import display
import warnings
import pickle
import gc

%load_ext autotime

pd.options.display.max_columns = None
warnings.filterwarnings("ignore")
gc.enable()
np.random.seed(123)

path = "/Users/dsaxton/home_credit_default/"

impute = Imputer(strategy="median")
quant = QuantileTransformer(output_distribution="normal")
scale = StandardScaler()

The autotime extension is already loaded. To reload it, use:
  %reload_ext autotime
time: 8.83 ms


# Ridge Regression

## Bureau Aggregate Synthetic Target

In [2]:
frame = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"])
bureau_agg = pd.read_csv(path + "bureau_agg.csv", usecols=lambda c: ("AGG_SYNTH" not in c) and ("AGG_COMP" not in c))

df = pd.merge(frame, bureau_agg, how="left", on="SK_ID_CURR")
del frame
gc.collect()
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")

time: 21.1 s


In [3]:
df.head()

Unnamed: 0,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY
0,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,inf,inf,0.0,inf,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0
1,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0
2,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0
3,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-783.0,-783.0,-783.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1149.0,0.00087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-783.0,0.0,0.0,186.781609,146250.0,0.0,0.0,0.0,0.0


time: 91.6 ms


In [4]:
df = pd.DataFrame(scale.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan))), columns=df.columns)
df.head()

Unnamed: 0,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY
0,-0.017451,-0.36644,-0.368052,-0.149244,-0.179554,-0.010895,-0.010504,0.255989,0.223639,0.021481,-0.321577,-0.030216,-0.006791,0.001623,-0.001839,-0.21453,-0.21453,-0.153187,-0.292629,-6.091449,-0.433453,-0.172159,-0.578847,-0.625365,0.070782,0.598159,-5.934009,5.934009,5.104959,0.147871,-0.187341,1.167564,0.933341,-0.23016,-0.059154,0.228243,0.241201,2.426528,0.463551,0.808018,-0.206464,-0.378366,-0.085887,-0.085887,0.644639,-0.002689,-0.358515,-0.363513,-0.034576,0.651059,-0.029349,-0.034083,-0.033543,-0.049551,-0.049444,-0.715526,0.192498,0.054073,0.048104,-0.002021,0.006226,-0.151294,-0.045053,-0.215155,-0.008199,-0.006899,-0.005464,0.00598,0.357777,0.150541,0.073218,-0.027026,-0.248757,1.962993,-0.237459,-0.210096,-0.052514
1,-0.054782,-0.36644,-0.368052,-0.149244,-0.179554,-0.017304,-0.016913,-0.427915,-0.445819,-0.604823,-0.278515,-0.030216,-0.006791,0.001623,-0.001839,-0.397412,-0.397412,-0.153187,-0.136725,0.188252,-0.1471,-0.113857,-0.004981,-0.19817,-0.025517,-0.405341,0.190887,-0.190887,-0.243705,-0.155099,-0.119283,-0.101983,-0.11499,-0.091846,-0.04564,-0.059392,-0.057311,-0.209887,-0.176998,-0.154519,-0.133278,-0.353425,-0.16972,-0.16972,-0.010943,-0.56201,-0.30846,-0.370704,-0.635596,-0.327136,-0.633562,-0.034083,-0.033543,-0.049551,-0.049444,0.28645,-0.397029,-0.087456,-0.092504,-0.019744,-0.023189,-0.151294,-0.23545,-0.376695,-0.008581,-0.007198,-0.005464,0.00598,0.247248,1.022249,0.82989,-0.22562,-0.2088,0.529455,-0.237459,-0.210096,-0.052514
2,-0.054782,-0.36644,-0.368052,-0.149244,-0.179554,-0.007339,-0.007151,-1.111819,-1.115277,-1.231127,-0.398615,-0.030216,-0.006791,0.001623,-0.001839,-0.397412,-0.397412,-0.153187,-0.136725,0.188252,-0.1471,-0.113857,-0.004981,-0.19817,-0.025517,-0.405341,0.190887,-0.190887,-0.243705,-0.155099,-0.119283,-0.101983,-0.11499,-0.091846,-0.04564,-0.059392,-0.057311,-0.209887,-0.176998,-0.154519,-0.478407,-0.458367,-0.16972,-0.16972,-0.010943,0.193196,-0.491919,-0.267889,-1.236616,-0.816233,-1.237774,-0.034083,-0.033543,-0.049551,-0.049444,-0.107966,-0.428317,-0.087456,-0.092504,-0.019744,-0.023189,-0.151294,-0.23545,-0.376695,-0.008199,-0.006899,-0.005464,0.00598,-0.793568,-0.690515,-0.414052,-0.299935,-0.426062,-0.904082,-0.237459,-0.210096,-0.052514
3,-0.028147,-0.36644,-0.368052,-0.149244,-0.179554,-0.007339,-0.007151,-0.427915,-0.445819,0.021481,-0.317725,-0.030216,-0.006791,0.001623,-0.001839,-0.288425,-0.288425,-0.153187,-0.136725,0.188252,-0.1471,-0.113857,-0.004981,-0.19817,-0.025517,-0.405341,0.190887,-0.190887,-0.243705,-0.155099,-0.119283,-0.101983,-0.11499,-0.091846,-0.04564,-0.059392,-0.057311,-0.209887,-0.176998,-0.154519,-0.291682,-0.360243,-0.16972,-0.16972,-0.010943,-0.083179,-0.343705,-0.216953,-0.034576,-0.327136,-0.029349,-0.034083,-0.033543,-0.049551,-0.049444,-0.323102,-0.220406,-0.087456,-0.092504,-0.019744,-0.023189,-0.151294,-0.195289,-0.265607,-0.008199,-0.006899,-0.005464,0.00598,0.320934,-0.11193,-0.011117,-0.204876,-0.223408,-0.187314,-0.237459,-0.210096,-0.052514
4,-0.054782,-0.36644,-0.368052,-0.149244,-0.179554,-0.007339,-0.007151,-1.111819,-1.115277,-1.231127,-0.398615,-0.030216,-0.006791,0.001623,-0.001839,-0.397412,-0.397412,-0.153187,-0.136725,0.188252,-0.1471,-0.113857,-0.004981,-0.19817,-0.025517,-0.405341,0.190887,-0.190887,-0.243705,-0.155099,-0.119283,-0.101983,-0.11499,-0.091846,-0.04564,-0.059392,-0.057311,-0.209887,-0.176998,-0.154519,-0.478407,-0.458367,-0.16972,-0.16972,-0.010943,0.115992,-0.537956,-0.251282,-1.236616,-1.060782,-1.237774,-0.034083,-0.033543,-0.049551,-0.049444,1.368105,-0.527937,-0.087456,-0.092504,-0.019744,-0.023189,-0.151294,-0.23545,-0.376695,-0.008199,-0.006899,-0.005464,0.00598,-2.02474,-0.977891,-1.489323,-0.300722,-0.437285,-0.904082,-0.237459,-0.210096,-0.052514


time: 11 s


#### Get out of fold predictions

In [5]:
kfold = StratifiedKFold(n_splits=3)
scores = pd.DataFrame({"SK_ID_CURR": [], "BUREAU_AGG_SYNTHETIC_TARGET": []})

time: 2.74 ms


In [6]:
for train_indx, test_indx in kfold.split(df.values, y.values):
    print("Determining lambda and fitting...")
    clf = LogisticRegressionCV(Cs=10, 
                               penalty="l2", 
                               fit_intercept=False, 
                               scoring="roc_auc", 
                               cv=kfold)
    clf.fit(df.iloc[train_indx], y.iloc[train_indx])
    print("Scoring...")
    fold_scores = pd.DataFrame({"SK_ID_CURR": sk_id_curr.iloc[test_indx], "BUREAU_AGG_SYNTHETIC_TARGET": clf.predict_proba(df.iloc[test_indx])[:,1]})
    scores = pd.concat([scores, fold_scores], axis=0)
    
scores.head()

Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...


Unnamed: 0,SK_ID_CURR,BUREAU_AGG_SYNTHETIC_TARGET
0,100002.0,0.526688
1,100003.0,0.459155
2,100004.0,0.484266
3,100006.0,0.501675
4,100007.0,0.493031


time: 4min 2s


#### Append

In [7]:
bureau_agg = bureau_agg.merge(scores, how="left", on="SK_ID_CURR")
bureau_agg.head()

Unnamed: 0,SK_ID_CURR,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET
0,100001,603.706712,0.0,0.0,1.0,1.0,0.987405,0.987405,3.0,3.0,3.0,3091.0,0.0,,,,596686.5,596686.5,0.0,8.857143,0.983871,1.774194,0.007155,47.5,0.5,47.0,61.0,0.992481,0.007519,0.052632,0.349547,0.021053,0.000835,0.005848,120775.784672,1800.0,282.105263,1974.736842,0.142857,0.111111,0.015873,884025.0,3091.0,19.0,19.0,-51.0,-1329.0,1778.0,577.0,3.0,7.0,3.0,0.0,0.0,0.0,0.0,49.0,0.029363,,0.0,,0.0,0.0,53216.5875,596686.5,inf,inf,0.0,,-6.0,149.0,1523.0,100412.66129,1453365.0,0.0,0.0,0.0,24817.5,
1,100002,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,inf,inf,0.0,inf,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0,0.526688
2,100003,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0,0.459155
3,100004,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0,0.484266
4,100005,617.739835,0.0,0.0,0.0,0.0,0.954794,0.954794,2.0,2.0,2.0,1446.0,0.0,,,,568408.5,568408.5,0.0,5.333333,1.0,0.3125,0.086957,8.5,1.0,7.5,16.0,1.0,0.0,0.0,0.539216,0.117647,0.0,0.0,107036.117647,6882.352941,0.0,0.0,0.0,0.0,0.0,598626.0,1446.0,8.0,8.0,-12.0,-128.0,1324.0,1318.0,2.0,3.0,2.0,0.0,0.0,0.0,0.0,62.0,0.026109,0.0,0.0,0.0,0.0,0.0,50188.368035,568408.5,inf,inf,0.0,0.0,-11.0,110.0,311.0,53154.691016,657126.0,1.0,0.0,0.0,4261.5,


time: 570 ms


#### Fill in test set cases

Fit model on full training data and predict TARGET for the test cases

In [8]:
clf = LogisticRegressionCV(Cs=10, 
                           penalty="l2", 
                           fit_intercept=False, 
                           scoring="roc_auc", 
                           cv=kfold)
clf.fit(df, y)

LogisticRegressionCV(Cs=10, class_weight=None,
           cv=StratifiedKFold(n_splits=3, random_state=None, shuffle=False),
           dual=False, fit_intercept=False, intercept_scaling=1.0,
           max_iter=100, multi_class='ovr', n_jobs=1, penalty='l2',
           random_state=None, refit=True, scoring='roc_auc',
           solver='lbfgs', tol=0.0001, verbose=0)

time: 2min 11s


In [9]:
null_id = bureau_agg["BUREAU_AGG_SYNTHETIC_TARGET"].isnull()
temp_frame = bureau_agg[null_id].drop(["SK_ID_CURR", "BUREAU_AGG_SYNTHETIC_TARGET"], axis=1).replace([-np.inf, np.inf], np.nan)
arr = scale.fit_transform(impute.fit_transform(temp_frame))
bureau_agg.loc[null_id, "BUREAU_AGG_SYNTHETIC_TARGET"] = clf.predict_proba(pd.DataFrame(arr, columns=temp_frame.columns))[:,1]

time: 1.63 s


#### Reappend principal components if necessary

In [10]:
prin_comp = pd.read_csv(path + "bureau_agg.csv", usecols=lambda c: (c == "SK_ID_CURR") or ("AGG_COMP" in c))
bureau_agg = bureau_agg.merge(prin_comp, how="left", on="SK_ID_CURR")
del prin_comp
bureau_agg.head()

Unnamed: 0,SK_ID_CURR,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7
0,100001,603.706712,0.0,0.0,1.0,1.0,0.987405,0.987405,3.0,3.0,3.0,3091.0,0.0,,,,596686.5,596686.5,0.0,8.857143,0.983871,1.774194,0.007155,47.5,0.5,47.0,61.0,0.992481,0.007519,0.052632,0.349547,0.021053,0.000835,0.005848,120775.784672,1800.0,282.105263,1974.736842,0.142857,0.111111,0.015873,884025.0,3091.0,19.0,19.0,-51.0,-1329.0,1778.0,577.0,3.0,7.0,3.0,0.0,0.0,0.0,0.0,49.0,0.029363,,0.0,,0.0,0.0,53216.5875,596686.5,inf,inf,0.0,,-6.0,149.0,1523.0,100412.66129,1453365.0,0.0,0.0,0.0,24817.5,0.525046,1.10057,1.523734,1.496514,-0.660367,-1.992638,0.017996,0.257508
1,100002,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,inf,inf,0.0,inf,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0,0.526688,1.038894,7.601345,0.534316,-0.817806,-0.592501,-0.290651,0.111304
2,100003,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0,0.459155,-1.386349,-0.52014,-0.831323,-0.242488,-0.712057,0.070022,0.154299
3,100004,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0,0.484266,-3.20874,-0.155941,-0.524505,0.269582,0.094367,-0.046783,0.032632
4,100005,617.739835,0.0,0.0,0.0,0.0,0.954794,0.954794,2.0,2.0,2.0,1446.0,0.0,,,,568408.5,568408.5,0.0,5.333333,1.0,0.3125,0.086957,8.5,1.0,7.5,16.0,1.0,0.0,0.0,0.539216,0.117647,0.0,0.0,107036.117647,6882.352941,0.0,0.0,0.0,0.0,0.0,598626.0,1446.0,8.0,8.0,-12.0,-128.0,1324.0,1318.0,2.0,3.0,2.0,0.0,0.0,0.0,0.0,62.0,0.026109,0.0,0.0,0.0,0.0,0.0,50188.368035,568408.5,inf,inf,0.0,0.0,-11.0,110.0,311.0,53154.691016,657126.0,1.0,0.0,0.0,4261.5,0.546448,-1.948244,-0.867605,4.826918,-0.613374,-1.4752,0.188919,0.200762


time: 3.83 s


In [11]:
bureau_agg.shape

(305811, 86)

time: 4.96 ms


### AUC

In [12]:
temp = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"]).merge(bureau_agg[["SK_ID_CURR", "BUREAU_AGG_SYNTHETIC_TARGET"]], how="left", on="SK_ID_CURR").dropna()
print(round(roc_auc_score(temp["TARGET"], temp["BUREAU_AGG_SYNTHETIC_TARGET"]), 4))
del temp
gc.collect()

0.64


49

time: 13 s


In [13]:
bureau_agg.to_csv(path + "bureau_agg.csv", index=False, header=True)

time: 53.8 s


## Previous Application Aggregate Synthetic Target

In [65]:
frame = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"])
previous_agg = pd.read_csv(path + "previous_agg.csv", usecols=lambda c: ("AGG_SYNTH" not in c) and ("AGG_COMP" not in c))

df = pd.merge(frame, previous_agg, how="left", on="SK_ID_CURR")
del frame
gc.collect()
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")

time: 13.4 s


In [66]:
df.head()

Unnamed: 0,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M
0,,9251.775,,,1.0,,1.0,1.0,-17.0,-17.0,-17.0,0.0,179055.0,179055.0,179055.0,295.470297,295.470297,295.470297,19.353584,19.353584,19.353584,0.031937,0.031937,0.031937,9251.775,9251.775,9251.775,15.266955,15.266955,15.266955,-606.0,-606.0,0.0,0.0,0.0,295.470297,295.470297,179055.0,179055.0,0.0,0.00165,0.00165,0.0,1.0,1.0,1.0,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.00165,0.00165,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,
1,,,,,,,,3.0,-1976.0,-527.0,-1047.333333,1449.0,68053.5,1035882.0,484191.0,29.070269,1388.581769,612.90394,5.399568,10.531859,8.677472,0.004315,0.014118,0.008318,6737.31,98356.995,56553.99,2.877962,131.845838,70.901357,-2341.0,-746.0,1595.0,0.0,0.0,547.812073,1206.434316,435436.5,900000.0,2.1e-05,0.001071,0.001543,0.05003,1.057664,1.15098,0.989013,,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,0.0,0.0,1.0,2.0,3.0,0.002975,0.00134,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,
2,,,,,,,,1.0,-714.0,-714.0,-714.0,0.0,20106.0,20106.0,20106.0,24.669939,24.669939,24.669939,3.753045,3.753045,3.753045,0.004605,0.004605,0.004605,5357.25,5357.25,5357.25,6.573313,6.573313,6.573313,-815.0,-815.0,0.0,0.0,0.0,29.793865,29.793865,24282.0,24282.0,0.00026,0.001016,0.001016,0.212008,0.828021,0.828021,0.828021,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.001227,0.001227,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,
3,13500.0,2482.92,0.799989,1.029197,1.012684,1.316797,1.316797,9.0,-416.0,365243.0,182481.75,365659.0,0.0,906615.0,291695.5,0.0,5008.922652,1358.887335,9.230206,27.839644,17.767287,0.015809,0.15381,0.081751,2482.92,39954.51,23651.175,4.024182,180.641436,96.293912,-617.0,-181.0,436.0,5.0,0.555556,1242.561634,3803.867403,272203.26,688500.0,0.000439,0.004129,0.007275,0.163412,1.012684,1.316797,0.799989,,0.0,0.0,0.0,1.0,1.0,3.0,5.0,0.0,0.0,0.0,2.0,2.0,1.0,4.0,0.015886,0.005525,2.0,,,1.0,1.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,,,,,,,
4,,16037.64,,,1.108236,,1.108236,6.0,-2041.0,365243.0,72143.8,367284.0,14616.0,284400.0,166638.75,6.201103,733.391711,248.03877,7.968206,21.858453,12.644075,0.003381,0.045729,0.016725,1834.29,22678.785,12278.805,0.778231,42.88139,16.715844,-2357.0,-374.0,1983.0,1.0,0.166667,222.881532,661.764706,150530.25,247500.0,7.5e-05,0.001244,0.002963,0.159516,1.046356,1.264,0.85093,,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,1.0,3.0,0.0,3.0,5.0,0.005724,0.002674,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,


time: 68.8 ms


In [67]:
df = pd.DataFrame(scale.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan))), columns=df.columns)
df.head()

Unnamed: 0,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M
0,-0.200503,-0.280145,-0.088223,-0.037291,-0.490707,-0.042666,-0.605926,-0.943576,-0.269426,-1.092069,-0.793686,-0.843603,1.397768,-0.502523,0.072989,0.181463,-0.131681,-0.096781,2.797175,0.143591,1.413703,0.220685,-0.154585,-0.081738,0.206274,-0.757469,-0.527428,0.016193,-0.166969,-0.14672,1.107695,-0.255939,-1.202719,-0.645423,-1.025872,-0.092151,-0.131084,0.18471,-0.451843,-0.172878,-0.159318,-0.196333,-0.94826,-0.16202,-0.59716,0.523521,-0.000927,-0.115808,-0.174476,-0.149492,-0.247045,-0.449611,-0.513724,-0.987931,-0.353334,-0.758034,-0.389068,-0.767641,-0.136381,-1.017007,-0.888998,-0.269736,-0.174889,-0.108617,-0.003902,0.015476,-0.299862,-0.279748,-0.257643,-0.367522,-0.358671,-0.068583,-0.389234,-0.562503,-0.224113,-0.134388,-0.187858,-0.074248,-0.057687,-0.031403,-0.174179,-0.171899
1,-0.200503,-0.261967,-0.088223,-0.037291,0.016602,-0.042666,-0.032036,-0.448425,-0.289847,-1.094869,-0.803285,-0.835563,0.219641,1.413659,1.960317,-0.044303,-0.079282,-0.032474,-0.638947,-0.80446,-0.752372,-0.087796,-0.183878,-0.190546,-0.138355,4.011806,4.325895,-0.078317,-0.0253,0.04532,-0.954705,-0.52153,0.623775,-0.645423,-1.025872,-0.036182,-0.082892,1.899396,1.296445,-0.144258,-0.21471,-0.200199,-0.356741,0.447405,0.327368,0.443085,-0.000927,-0.115808,-0.174476,-0.149492,-0.247045,-0.449611,-0.513724,-0.020339,-0.353334,0.804858,-0.389068,-0.767641,-0.136381,0.504613,0.153448,-0.198209,-0.193144,-0.108617,-0.003902,0.015476,-0.299862,-0.279748,-0.257643,-0.367522,-0.358671,-0.068583,-0.389234,-0.562503,-0.224113,-0.134388,-0.187858,-0.074248,-0.057687,-0.031403,-0.174179,-0.171899
2,-0.200503,-0.261967,-0.088223,-0.037291,0.016602,-0.042666,-0.032036,-0.943576,-0.276692,-1.095896,-0.80018,-0.843603,-0.289255,-0.857992,-0.910143,-0.048032,-0.144662,-0.151642,-1.044397,-1.532965,-1.751488,-0.084556,-0.199516,-0.207651,-0.327505,-0.96592,-0.927016,-0.050127,-0.177534,-0.176729,0.859256,-0.652429,-1.202719,-0.645423,-1.025872,-0.151078,-0.145138,-0.850416,-0.827167,0.175486,-0.21997,-0.219182,1.558353,-1.97958,-1.650276,-0.735555,-0.000927,-0.115808,-0.174476,-0.149492,-0.247045,-0.449611,-0.513724,-0.987931,-0.353334,-0.758034,-0.389068,-0.767641,-0.808324,-1.017007,-0.888998,-0.292576,-0.199834,-0.108617,-0.003902,0.015476,-0.299862,-0.279748,-0.257643,-0.367522,-0.358671,-0.068583,-0.389234,-0.562503,-0.224113,-0.134388,-0.187858,-0.074248,-0.057687,-0.031403,-0.174179,-0.171899
3,0.140593,-0.869836,-2.405221,-0.168226,-0.365712,2.257922,1.459821,1.037028,-0.273585,0.913158,0.906647,1.185336,-0.502652,1.12457,0.769693,-0.068939,0.09426,0.118653,0.304333,1.055569,1.091859,0.040573,0.045766,0.147751,-0.721457,0.885866,0.949986,-0.069573,0.033998,0.13297,1.09462,0.550322,-0.703439,1.072794,1.094097,0.117912,0.054517,0.807688,0.783559,0.4144,0.077758,0.00633,0.983798,-0.027969,1.342752,-0.940777,-0.000927,-0.115808,-0.174476,-0.149492,1.343164,0.11382,1.313,0.947253,-0.353334,-0.758034,-0.389068,0.696217,0.535562,-0.256197,0.67467,0.498623,0.053515,0.655183,-0.003902,0.015476,0.634041,2.574449,-0.257643,-0.367522,-0.358671,-0.068583,-0.389234,2.271847,-0.224113,-0.134388,-0.187858,-0.074248,-0.057687,-0.031403,-0.174179,-0.171899
4,-0.200503,0.311028,-0.088223,-0.037291,0.575907,-0.042666,0.099853,0.294302,-0.290525,0.913158,-0.121367,1.194353,-0.347524,-0.266933,-0.003808,-0.063684,-0.110689,-0.10639,-0.00643,0.412784,0.052412,-0.098229,-0.13191,-0.151818,-0.810357,-0.038801,-0.216848,-0.094335,-0.133411,-0.141719,-0.973724,0.184185,1.068089,-0.30178,-0.389882,-0.108251,-0.111706,-0.006064,-0.285864,-0.072768,-0.198204,-0.149026,0.937738,0.327892,1.019447,-0.567834,-0.000927,-0.115808,-0.174476,-0.149492,-0.247045,-0.449611,-0.513724,1.431049,-0.353334,1.586305,0.543789,1.428146,-0.808324,1.265423,1.195893,-0.04986,-0.114549,-0.108617,-0.003902,0.015476,-0.299862,-0.279748,-0.257643,-0.367522,-0.358671,-0.068583,-0.389234,-0.562503,-0.224113,-0.134388,-0.187858,-0.074248,-0.057687,-0.031403,-0.174179,-0.171899


time: 7.35 s


In [68]:
df.shape

(307511, 82)

time: 6.6 ms


#### Get out of fold predictions

In [69]:
kfold = StratifiedKFold(n_splits=3)
scores = pd.DataFrame({"SK_ID_CURR": [], "PREVIOUS_AGG_SYNTHETIC_TARGET": []})

time: 3.79 ms


In [70]:
for train_indx, test_indx in kfold.split(df.values, y.values):
    print("Determining lambda and fitting...")
    clf = LogisticRegressionCV(Cs=10, 
                               penalty="l2", 
                               fit_intercept=False, 
                               scoring="roc_auc", 
                               cv=kfold)
    clf.fit(df.iloc[train_indx], y.iloc[train_indx])
    print("Scoring...")
    fold_scores = pd.DataFrame({"SK_ID_CURR": sk_id_curr.iloc[test_indx], "PREVIOUS_AGG_SYNTHETIC_TARGET": clf.predict_proba(df.iloc[test_indx])[:,1]})
    scores = pd.concat([scores, fold_scores], axis=0)
    
scores.head()

Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...


Unnamed: 0,SK_ID_CURR,PREVIOUS_AGG_SYNTHETIC_TARGET
0,100002.0,0.487067
1,100003.0,0.42019
2,100004.0,0.506853
3,100006.0,0.505468
4,100007.0,0.492233


time: 1min 21s


#### Append

In [71]:
previous_agg = previous_agg.merge(scores, how="left", on="SK_ID_CURR")
previous_agg.head()

Unnamed: 0,SK_ID_CURR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET
0,100001,,,,,,,,1.0,-1612.0,-1612.0,-1612.0,0.0,23787.0,23787.0,23787.0,13.67069,13.67069,13.67069,6.020501,6.020501,6.020501,0.00346,0.00346,0.00346,3951.0,3951.0,3951.0,2.27069,2.27069,2.27069,-1740.0,-1740.0,0.0,0.0,0.0,14.273276,14.273276,24835.5,24835.5,6e-05,0.00055,0.00055,0.104326,0.957782,0.957782,0.957782,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.000575,0.000575,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,
1,100002,,9251.775,,,1.0,,1.0,1.0,-17.0,-17.0,-17.0,0.0,179055.0,179055.0,179055.0,295.470297,295.470297,295.470297,19.353584,19.353584,19.353584,0.031937,0.031937,0.031937,9251.775,9251.775,9251.775,15.266955,15.266955,15.266955,-606.0,-606.0,0.0,0.0,0.0,295.470297,295.470297,179055.0,179055.0,0.0,0.00165,0.00165,0.0,1.0,1.0,1.0,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.00165,0.00165,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.487067
2,100003,,,,,,,,3.0,-1976.0,-527.0,-1047.333333,1449.0,68053.5,1035882.0,484191.0,29.070269,1388.581769,612.90394,5.399568,10.531859,8.677472,0.004315,0.014118,0.008318,6737.31,98356.995,56553.99,2.877962,131.845838,70.901357,-2341.0,-746.0,1595.0,0.0,0.0,547.812073,1206.434316,435436.5,900000.0,2.1e-05,0.001071,0.001543,0.05003,1.057664,1.15098,0.989013,,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,0.0,0.0,1.0,2.0,3.0,0.002975,0.00134,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.42019
3,100004,,,,,,,,1.0,-714.0,-714.0,-714.0,0.0,20106.0,20106.0,20106.0,24.669939,24.669939,24.669939,3.753045,3.753045,3.753045,0.004605,0.004605,0.004605,5357.25,5357.25,5357.25,6.573313,6.573313,6.573313,-815.0,-815.0,0.0,0.0,0.0,29.793865,29.793865,24282.0,24282.0,0.00026,0.001016,0.001016,0.212008,0.828021,0.828021,0.828021,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.001227,0.001227,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506853
4,100005,,,,,,,,2.0,-460.0,-460.0,-460.0,0.0,0.0,40153.5,20076.75,0.0,53.042933,26.521466,8.342371,8.342371,8.342371,0.01102,0.01102,0.01102,4813.2,4813.2,4813.2,6.358256,6.358256,6.358256,-757.0,-315.0,442.0,1.0,0.5,29.469947,58.939894,22308.75,44617.5,0.000144,0.001189,0.001189,0.108964,0.89995,0.89995,0.89995,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.001321,0.001321,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,


time: 363 ms


#### Fill in test set cases

Fit model on full training data and predict TARGET for the test cases

In [72]:
clf = LogisticRegressionCV(Cs=10, 
                           penalty="l2", 
                           fit_intercept=False, 
                           scoring="roc_auc", 
                           cv=kfold)
clf.fit(df, y)

LogisticRegressionCV(Cs=10, class_weight=None,
           cv=StratifiedKFold(n_splits=3, random_state=None, shuffle=False),
           dual=False, fit_intercept=False, intercept_scaling=1.0,
           max_iter=100, multi_class='ovr', n_jobs=1, penalty='l2',
           random_state=None, refit=True, scoring='roc_auc',
           solver='lbfgs', tol=0.0001, verbose=0)

time: 39.2 s


In [73]:
null_id = previous_agg["PREVIOUS_AGG_SYNTHETIC_TARGET"].isnull()
temp_frame = previous_agg[null_id].drop(["SK_ID_CURR", "PREVIOUS_AGG_SYNTHETIC_TARGET"], axis=1).replace([-np.inf, np.inf], np.nan)
arr = scale.fit_transform(impute.fit_transform(temp_frame))
previous_agg.loc[null_id, "PREVIOUS_AGG_SYNTHETIC_TARGET"] = clf.predict_proba(pd.DataFrame(arr, columns=temp_frame.columns))[:,1]

time: 958 ms


In [74]:
previous_agg.shape

(338857, 84)

time: 2.51 ms


#### Reappend principal components if necessary

In [None]:
prin_comp = pd.read_csv(path + "previous_agg.csv", usecols=lambda c: (c == "SK_ID_CURR") or ("AGG_COMP" in c))
previous_agg = previous_agg.merge(prin_comp, how="left", on="SK_ID_CURR")
del prin_comp
previous_agg.head()

In [75]:
previous_agg.shape

(338857, 84)

time: 3.63 ms


### AUC

In [76]:
temp = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"]).merge(previous_agg[["SK_ID_CURR", "PREVIOUS_AGG_SYNTHETIC_TARGET"]], how="left", on="SK_ID_CURR").dropna()
print(round(roc_auc_score(temp["TARGET"], temp["PREVIOUS_AGG_SYNTHETIC_TARGET"]), 4))
del temp
gc.collect()

0.6464


70

time: 5.93 s


## Credit Card Aggregate Synthetic Target

In [299]:
frame = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"])
credit_card_agg = pd.read_csv(path + "credit_card_agg.csv", usecols=lambda c: ("AGG_SYNTH" not in c) and ("AGG_COMP" not in c))

df = pd.merge(frame, credit_card_agg, how="left", on="SK_ID_CURR")
del frame
gc.collect()
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")

time: 6.34 s


In [300]:
df.head()

Unnamed: 0,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M
0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,
4,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


time: 34.5 ms


In [301]:
df = pd.DataFrame(scale.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan))), columns=df.columns)
df.head()

Unnamed: 0,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M
0,-0.045109,-0.048419,-0.203562,-0.245929,-0.268081,-0.282665,-0.171615,-0.19488,-0.149137,-0.080697,-0.250955,-0.307676,-0.205706,-0.141115,-0.221606,-0.229496,-0.326393,-0.235721,-0.117844,0.305828,-0.231616,-0.246752,-0.232725,-0.252816,-0.293747,-0.041852,-0.005999,-0.167533,-0.182542,-0.182952,-0.152257,-0.19792,-0.128588,-0.006867,-0.002019,-0.002097,-0.185024,-0.162354,-0.168614,-0.196211,-0.003362,-0.324033,-0.311702,-0.028594,-0.027655
1,-0.045109,-0.048419,-0.203562,-0.245929,-0.268081,-0.282665,-0.171615,-0.19488,-0.149137,-0.080697,-0.250955,-0.307676,-0.205706,-0.141115,-0.221606,-0.229496,-0.326393,-0.235721,-0.117844,0.305828,-0.231616,-0.246752,-0.232725,-0.252816,-0.293747,-0.041852,-0.005999,-0.167533,-0.182542,-0.182952,-0.152257,-0.19792,-0.128588,-0.006867,-0.002019,-0.002097,-0.185024,-0.162354,-0.168614,-0.196211,-0.003362,-0.324033,-0.311702,-0.028594,-0.027655
2,-0.045109,-0.048419,-0.203562,-0.245929,-0.268081,-0.282665,-0.171615,-0.19488,-0.149137,-0.080697,-0.250955,-0.307676,-0.205706,-0.141115,-0.221606,-0.229496,-0.326393,-0.235721,-0.117844,0.305828,-0.231616,-0.246752,-0.232725,-0.252816,-0.293747,-0.041852,-0.005999,-0.167533,-0.182542,-0.182952,-0.152257,-0.19792,-0.128588,-0.006867,-0.002019,-0.002097,-0.185024,-0.162354,-0.168614,-0.196211,-0.003362,-0.324033,-0.311702,-0.028594,-0.027655
3,-0.045109,-0.048419,-0.203562,-0.245929,-0.268081,-0.282665,-0.171615,-0.19488,-0.149137,-0.080697,-0.250955,-0.309062,-0.642337,-1.174465,-0.619479,-1.063212,-0.326393,-1.013479,-1.561794,-2.947945,-0.278867,-0.283795,-0.409247,-0.37944,-0.386429,-0.041852,-0.005999,-0.480582,-0.28791,-0.693545,-0.754986,-0.430944,-1.176035,-0.006867,-0.002019,-0.002097,-0.185024,-0.162354,-0.168614,-0.196211,-0.003362,-0.327419,-0.311702,-0.028594,-0.027655
4,-0.045109,-0.048419,-0.203562,-0.245929,-0.268081,-0.282665,-0.171615,-0.19488,-0.149137,-0.080697,-0.250955,-0.307676,-0.205706,-0.141115,-0.221606,-0.229496,-0.326393,-0.235721,-0.117844,0.305828,-0.231616,-0.246752,-0.232725,-0.252816,-0.293747,-0.041852,-0.005999,-0.167533,-0.182542,-0.182952,-0.152257,-0.19792,-0.128588,-0.006867,-0.002019,-0.002097,-0.185024,-0.162354,-0.168614,-0.196211,-0.003362,-0.324033,-0.311702,-0.028594,-0.027655


time: 2.14 s


#### Get out of fold predictions

In [302]:
kfold = StratifiedKFold(n_splits=3)
scores = pd.DataFrame({"SK_ID_CURR": [], "CREDIT_CARD_AGG_SYNTHETIC_TARGET": []})

time: 2.11 ms


In [303]:
for train_indx, test_indx in kfold.split(df.values, y.values):
    print("Determining lambda and fitting...")
    clf = LogisticRegressionCV(Cs=10, 
                               penalty="l2", 
                               fit_intercept=False, 
                               scoring="roc_auc", 
                               cv=kfold)
    clf.fit(df.iloc[train_indx], y.iloc[train_indx])
    print("Scoring...")
    fold_scores = pd.DataFrame({"SK_ID_CURR": sk_id_curr.iloc[test_indx], "CREDIT_CARD_AGG_SYNTHETIC_TARGET": clf.predict_proba(df.iloc[test_indx])[:,1]})
    scores = pd.concat([scores, fold_scores], axis=0)
    
scores.head()

Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...


Unnamed: 0,SK_ID_CURR,CREDIT_CARD_AGG_SYNTHETIC_TARGET
0,100002.0,0.497157
1,100003.0,0.497157
2,100004.0,0.497157
3,100006.0,0.471819
4,100007.0,0.497157


time: 1min 29s


#### Append

In [304]:
credit_card_agg = credit_card_agg.merge(scores, how="left", on="SK_ID_CURR")
credit_card_agg.head()

Unnamed: 0,SK_ID_CURR,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET
0,100006,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.471819
1,100011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,54482.111149,189000.0,4031676.225,75.0,2.0,73.0,0.302678,1.05,891.528045,2520.0,65973.075311,0.004953,0.014,0.0,0.0,4.0,0.054054,4.0,180000.0,2432.432432,180000.0,1.0,inf,inf,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.483568
2,100013,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18159.919219,161420.22,1743352.245,96.0,1.0,95.0,0.115301,1.02489,230.066978,1944.407308,22086.429911,0.001461,0.012345,0.014493,0.014493,23.0,0.239583,7.0,571500.0,5953.125,157500.0,0.0,inf,inf,0.0,0.0,0.0,0.0,,0.0,0.0,,,
3,100021,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18.0,2.0,16.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.474393
4,100023,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11.0,4.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,,,,0.487986


time: 359 ms


#### Fill in test set cases

Fit model on full training data and predict TARGET for the test cases

In [305]:
clf = LogisticRegressionCV(Cs=10, 
                           penalty="l2", 
                           fit_intercept=False, 
                           scoring="roc_auc", 
                           cv=kfold)
clf.fit(df, y)

LogisticRegressionCV(Cs=10, class_weight=None,
           cv=StratifiedKFold(n_splits=3, random_state=None, shuffle=False),
           dual=False, fit_intercept=False, intercept_scaling=1.0,
           max_iter=100, multi_class='ovr', n_jobs=1, penalty='l2',
           random_state=None, refit=True, scoring='roc_auc',
           solver='lbfgs', tol=0.0001, verbose=0)

time: 58.8 s


In [306]:
null_id = credit_card_agg["CREDIT_CARD_AGG_SYNTHETIC_TARGET"].isnull()
temp_frame = credit_card_agg[null_id].drop(["SK_ID_CURR", "CREDIT_CARD_AGG_SYNTHETIC_TARGET"], axis=1).replace([-np.inf, np.inf], np.nan)
arr = scale.fit_transform(impute.fit_transform(temp_frame))
credit_card_agg.loc[null_id, "CREDIT_CARD_AGG_SYNTHETIC_TARGET"] = clf.predict_proba(pd.DataFrame(arr, columns=temp_frame.columns))[:,1]

time: 247 ms


#### Reappend principal components if necessary

In [307]:
prin_comp = pd.read_csv(path + "credit_card_agg.csv", usecols=lambda c: (c == "SK_ID_CURR") or ("AGG_COMP" in c))
credit_card_agg = credit_card_agg.merge(prin_comp, how="left", on="SK_ID_CURR")
del prin_comp
credit_card_agg.head()

Unnamed: 0,SK_ID_CURR,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7
0,100006,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.471819,-2.996367,0.956185,-1.143641,0.37796,0.322572,0.12285,-0.890276
1,100011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,54482.111149,189000.0,4031676.225,75.0,2.0,73.0,0.302678,1.05,891.528045,2520.0,65973.075311,0.004953,0.014,0.0,0.0,4.0,0.054054,4.0,180000.0,2432.432432,180000.0,1.0,inf,inf,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.483568,-1.91423,-1.336225,0.97039,-0.360336,-1.157258,-0.099205,0.683874
2,100013,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18159.919219,161420.22,1743352.245,96.0,1.0,95.0,0.115301,1.02489,230.066978,1944.407308,22086.429911,0.001461,0.012345,0.014493,0.014493,23.0,0.239583,7.0,571500.0,5953.125,157500.0,0.0,inf,inf,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.481502,-1.995274,-1.079984,1.425906,-0.458675,-1.500304,-0.189693,1.339213
3,100021,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18.0,2.0,16.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.474393,-3.130604,0.815268,-0.953739,0.421427,0.156045,0.118608,-0.890236
4,100023,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11.0,4.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,,,,0.487986,-3.290014,1.021466,-1.043096,0.623813,0.148561,0.201433,-1.532772


time: 1.21 s


In [308]:
credit_card_agg.shape

(103558, 54)

time: 2.71 ms


### AUC

In [309]:
temp = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"]).merge(credit_card_agg[["SK_ID_CURR", "CREDIT_CARD_AGG_SYNTHETIC_TARGET"]], how="left", on="SK_ID_CURR").dropna()
print(round(roc_auc_score(temp["TARGET"], temp["CREDIT_CARD_AGG_SYNTHETIC_TARGET"]), 4))
del temp
gc.collect()

0.6549


76

time: 5.76 s


In [None]:
credit_card_agg.to_csv(path + "credit_card_agg.csv", index=False, header=True)

## Installments Aggregate Synthetic Target

In [311]:
frame = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"])
installment_agg = pd.read_csv(path + "installment_agg.csv", usecols=lambda c: ("AGG_SYNTH" not in c) and ("AGG_COMP" not in c))

df = pd.merge(frame, installment_agg, how="left", on="SK_ID_CURR")
del frame
gc.collect()
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")

time: 8.28 s


In [312]:
df.head()

Unnamed: 0,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M
0,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0
1,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0
2,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0
3,0.0,0.0,691786.89,691786.89,29027.52,545.0,0.0,0.0,0.0,0.0,543.096731,62947.088438,3975.786724,691786.89,4.318122,2482.92,8689.547693,1007153.415,0.0,-12.0,-575.0,563.0,0.0,0.0,865952.01,749841.93,691786.89,29027.52,-1.0,-77.0
4,0.0,0.0,16037.64,16037.64,16037.64,2326.0,3.0,29857.365,25.402727,22655.655,49.833434,12214.060227,1145.545714,22678.785,0.000125,0.18,3289.00667,806127.975,16.0,-14.0,-2318.0,2304.0,0.0,0.0,96225.84,0.0,16037.64,16037.64,12.0,-31.0


time: 23.2 ms


In [313]:
df = pd.DataFrame(scale.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan))), columns=df.columns)
df.head()

Unnamed: 0,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M
0,0.087124,0.057306,0.062455,-0.156028,-0.055344,-1.143503,-0.461146,0.03512,0.059059,-0.429348,0.025055,-0.280018,0.034783,-0.3293,0.008828,0.298862,-0.161664,-0.491631,-0.525024,0.504291,1.134204,-0.783105,-0.200594,-0.277533,-0.030966,0.231387,0.067885,-0.081803,-0.253549,0.229909
1,0.087124,0.057306,-0.213935,-0.303097,-0.113491,0.81744,-0.461146,0.03512,0.059059,-0.429348,0.036434,1.891991,0.017093,1.76566,-0.020582,0.114758,-0.019108,1.070434,-0.525024,-0.43673,-0.820883,0.566571,-0.200594,-0.277533,-0.455841,0.107633,-0.212541,-0.107967,-0.151926,0.831629
2,0.087124,0.057306,-0.213935,-0.303097,-0.113491,-0.897402,-0.461146,0.03512,0.059059,-0.429348,-0.15791,-0.46225,-0.324733,-0.504738,-0.011802,0.021902,-0.52192,-0.713049,-0.525024,-0.784623,0.900089,-1.293852,-0.200594,-0.277533,-0.455841,0.107633,-0.212541,-0.107967,-0.170403,0.937814
3,0.087124,0.057306,5.210003,3.270694,0.403188,-1.165978,-0.461146,0.03512,0.059059,-0.429348,0.977269,1.818189,1.007471,2.305971,-0.017337,-0.182507,1.225909,0.387539,-0.525024,0.57463,1.147711,-0.755937,-0.200594,-0.277533,3.627602,2.790347,5.254689,0.381197,-0.151926,-1.398273
4,0.087124,0.057306,-0.236199,-0.354842,0.101997,0.83542,0.291053,0.210329,0.083116,1.095966,-0.071976,-0.253282,0.055634,-0.454793,-0.02721,-0.359067,0.136086,0.163121,2.033883,0.570828,-0.814129,1.135999,-0.200594,-0.277533,-0.002083,0.107633,-0.233046,0.077071,-0.031826,0.229909


time: 1.81 s


#### Get out of fold predictions

In [314]:
kfold = StratifiedKFold(n_splits=3)
scores = pd.DataFrame({"SK_ID_CURR": [], "INSTALLMENT_AGG_SYNTHETIC_TARGET": []})

time: 2.36 ms


In [315]:
for train_indx, test_indx in kfold.split(df.values, y.values):
    print("Determining lambda and fitting...")
    clf = LogisticRegressionCV(Cs=10, 
                               penalty="l2", 
                               fit_intercept=False, 
                               scoring="roc_auc", 
                               cv=kfold)
    clf.fit(df.iloc[train_indx], y.iloc[train_indx])
    print("Scoring...")
    fold_scores = pd.DataFrame({"SK_ID_CURR": sk_id_curr.iloc[test_indx], "INSTALLMENT_AGG_SYNTHETIC_TARGET": clf.predict_proba(df.iloc[test_indx])[:,1]})
    scores = pd.concat([scores, fold_scores], axis=0)
    
scores.head()

Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...


Unnamed: 0,SK_ID_CURR,INSTALLMENT_AGG_SYNTHETIC_TARGET
0,100002.0,0.514141
1,100003.0,0.47399
2,100004.0,0.525224
3,100006.0,0.561795
4,100007.0,0.501933


time: 26.3 s


#### Append

In [316]:
installment_agg = installment_agg.merge(scores, how="left", on="SK_ID_CURR")
installment_agg.head()

Unnamed: 0,SK_ID_CURR,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET
0,100001,0.0,0.0,,,,2916.0,0.0,0.0,0.0,0.0,3.116986,5885.132143,10.686671,17397.9,1.365586,3951.0,21.8189,41195.925,1.0,-1628.0,-2916.0,1288.0,,,0.0,0.0,,,11.0,-36.0,
1,100002,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0,0.514141
2,100003,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0,0.47399
3,100004,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0,0.525224
4,100005,0.0,0.0,,,,706.0,0.0,0.0,0.0,0.0,11.09417,6240.205,37.566479,17656.245,6.539674,4813.2,99.847528,56161.845,1.0,-470.0,-736.0,266.0,,,0.0,0.0,,,1.0,-37.0,


time: 213 ms


#### Fill in test set cases

Fit model on full training data and predict TARGET for the test cases

In [317]:
clf = LogisticRegressionCV(Cs=10, 
                           penalty="l2", 
                           fit_intercept=False, 
                           scoring="roc_auc", 
                           cv=kfold)
clf.fit(df, y)

LogisticRegressionCV(Cs=10, class_weight=None,
           cv=StratifiedKFold(n_splits=3, random_state=None, shuffle=False),
           dual=False, fit_intercept=False, intercept_scaling=1.0,
           max_iter=100, multi_class='ovr', n_jobs=1, penalty='l2',
           random_state=None, refit=True, scoring='roc_auc',
           solver='lbfgs', tol=0.0001, verbose=0)

time: 14.4 s


In [318]:
null_id = installment_agg["INSTALLMENT_AGG_SYNTHETIC_TARGET"].isnull()
temp_frame = installment_agg[null_id].drop(["SK_ID_CURR", "INSTALLMENT_AGG_SYNTHETIC_TARGET"], axis=1).replace([-np.inf, np.inf], np.nan)
arr = scale.fit_transform(impute.fit_transform(temp_frame))
installment_agg.loc[null_id, "INSTALLMENT_AGG_SYNTHETIC_TARGET"] = clf.predict_proba(pd.DataFrame(arr, columns=temp_frame.columns))[:,1]

time: 407 ms


#### Reappend principal components if necessary

In [319]:
prin_comp = pd.read_csv(path + "installment_agg.csv", usecols=lambda c: (c == "SK_ID_CURR") or ("AGG_COMP" in c))
installment_agg = installment_agg.merge(prin_comp, how="left", on="SK_ID_CURR")
del prin_comp
installment_agg.head()

Unnamed: 0,SK_ID_CURR,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7
0,100001,0.0,0.0,,,,2916.0,0.0,0.0,0.0,0.0,3.116986,5885.132143,10.686671,17397.9,1.365586,3951.0,21.8189,41195.925,1.0,-1628.0,-2916.0,1288.0,,,0.0,0.0,,,11.0,-36.0,0.485121,-1.311336,-0.289649,-1.265137,0.259213,1.925718,0.03656,1.028292
1,100002,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0,0.514141,-0.752288,1.616157,0.754784,-0.702447,-0.535793,0.056893,0.006947
2,100003,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0,0.47399,0.659627,-0.035899,-0.624043,1.42402,0.239304,-0.727819,1.224179
3,100004,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0,0.525224,-1.700891,1.634542,0.456757,-0.633019,-0.255442,-0.037613,0.026482
4,100005,0.0,0.0,,,,706.0,0.0,0.0,0.0,0.0,11.09417,6240.205,37.566479,17656.245,6.539674,4813.2,99.847528,56161.845,1.0,-470.0,-736.0,266.0,,,0.0,0.0,,,1.0,-37.0,0.525405,-1.571981,1.428804,0.404391,-0.61607,-0.355109,-0.043216,-0.162738


time: 1.65 s


In [320]:
installment_agg.shape

(339587, 39)

time: 2.52 ms


### AUC

In [321]:
temp = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"]).merge(installment_agg[["SK_ID_CURR", "INSTALLMENT_AGG_SYNTHETIC_TARGET"]], how="left", on="SK_ID_CURR").dropna()
print(round(roc_auc_score(temp["TARGET"], temp["INSTALLMENT_AGG_SYNTHETIC_TARGET"]), 4))
del temp
gc.collect()

0.6228


70

time: 6.67 s


In [None]:
installment_agg.to_csv(path + "installment_agg.csv", index=False, header=True)

## Point of Sale Aggregate Synthetic Target

In [87]:
frame = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"])
pos_cash_agg = pd.read_csv(path + "pos_cash_agg.csv", usecols=lambda c: ("AGG_SYNTH" not in c) and ("AGG_COMP" not in c))

df = pd.merge(frame, pos_cash_agg, how="left", on="SK_ID_CURR")
del frame
gc.collect()
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")

time: 6.76 s


In [88]:
df.head()

Unnamed: 0,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M
0,0.0,0.0,1.0,6.0,11.0,0.0
1,0.0,0.0,3.0,,,
2,0.0,0.0,1.0,,,
3,0.0,0.0,3.0,0.0,48.0,0.0
4,0.0,0.0,5.0,13.0,18.0,0.0


time: 11.2 ms


In [89]:
df = pd.DataFrame(scale.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan))), columns=df.columns)
df.head()

Unnamed: 0,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M
0,-0.099399,-0.046552,-0.899183,0.16206,-0.159063,-0.054276
1,-0.099399,-0.046552,0.146297,-0.309552,-0.255013,-0.054276
2,-0.099399,-0.046552,-0.899183,-0.309552,-0.255013,-0.054276
3,-0.099399,-0.046552,0.146297,-0.545357,3.391078,-0.054276
4,-0.099399,-0.046552,1.191777,0.98738,0.512585,-0.054276


time: 461 ms


#### Get out of fold predictions

In [90]:
kfold = StratifiedKFold(n_splits=3)
scores = pd.DataFrame({"SK_ID_CURR": [], "POS_AGG_SYNTHETIC_TARGET": []})

time: 8.96 ms


In [91]:
for train_indx, test_indx in kfold.split(df.values, y.values):
    print("Determining lambda and fitting...")
    clf = LogisticRegressionCV(Cs=10, 
                               penalty="l2", 
                               fit_intercept=False, 
                               scoring="roc_auc", 
                               cv=kfold)
    clf.fit(df.iloc[train_indx], y.iloc[train_indx])
    print("Scoring...")
    fold_scores = pd.DataFrame({"SK_ID_CURR": sk_id_curr.iloc[test_indx], "POS_AGG_SYNTHETIC_TARGET": clf.predict_proba(df.iloc[test_indx])[:,1]})
    scores = pd.concat([scores, fold_scores], axis=0)
    
scores.head()

Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...
Determining lambda and fitting...
Scoring...


Unnamed: 0,SK_ID_CURR,POS_AGG_SYNTHETIC_TARGET
0,100002.0,0.510127
1,100003.0,0.495285
2,100004.0,0.509493
3,100006.0,0.523314
4,100007.0,0.48669


time: 5.57 s


#### Append

In [92]:
pos_cash_agg = pos_cash_agg.merge(scores, how="left", on="SK_ID_CURR")
pos_cash_agg.head()

Unnamed: 0,SK_ID_CURR,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET
0,100001,7,7,2,,,,
1,100002,0,0,1,6.0,11.0,0.0,0.510127
2,100003,0,0,3,,,,0.495285
3,100004,0,0,1,,,,0.509493
4,100005,0,0,1,,,,


time: 201 ms


#### Fill in test set cases

Fit model on full training data and predict TARGET for the test cases

In [93]:
clf = LogisticRegressionCV(Cs=10, 
                           penalty="l2", 
                           fit_intercept=False, 
                           scoring="roc_auc", 
                           cv=kfold)
clf.fit(df, y)

LogisticRegressionCV(Cs=10, class_weight=None,
           cv=StratifiedKFold(n_splits=3, random_state=None, shuffle=False),
           dual=False, fit_intercept=False, intercept_scaling=1.0,
           max_iter=100, multi_class='ovr', n_jobs=1, penalty='l2',
           random_state=None, refit=True, scoring='roc_auc',
           solver='lbfgs', tol=0.0001, verbose=0)

time: 3.04 s


In [94]:
null_id = pos_cash_agg["POS_AGG_SYNTHETIC_TARGET"].isnull()
temp_frame = pos_cash_agg[null_id].drop(["SK_ID_CURR", "POS_AGG_SYNTHETIC_TARGET"], axis=1).replace([-np.inf, np.inf], np.nan)
arr = scale.fit_transform(impute.fit_transform(temp_frame))
pos_cash_agg.loc[null_id, "POS_AGG_SYNTHETIC_TARGET"] = clf.predict_proba(pd.DataFrame(arr, columns=temp_frame.columns))[:,1]

time: 162 ms


#### Reappend principal components if necessary

In [332]:
pos_cash_agg.shape

(337252, 8)

time: 2.47 ms


### AUC

In [96]:
temp = pd.read_csv(path + "train.csv", usecols=["SK_ID_CURR", "TARGET"]).merge(pos_cash_agg[["SK_ID_CURR", "POS_AGG_SYNTHETIC_TARGET"]], how="left", on="SK_ID_CURR").dropna()
print(round(roc_auc_score(temp["TARGET"], temp["POS_AGG_SYNTHETIC_TARGET"]), 4))
del temp
gc.collect()

0.5658


111

time: 5.84 s


# Principal Components

## Credit Card

In [3]:
credit_card_agg = pd.read_csv(path + "credit_card_agg.csv")
frame = credit_card_agg.drop(["SK_ID_CURR", "CREDIT_CARD_AGG_SYNTHETIC_TARGET"], axis=1)
frame = pd.DataFrame(scale.fit_transform(impute.fit_transform(frame.replace([-np.inf, np.inf], np.nan))), columns=frame.columns)
frame.head()

Unnamed: 0,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M
0,-0.083113,-0.088853,-0.398413,-0.499736,-0.55513,-0.592882,-0.334658,-0.384997,-0.286135,-0.146678,-0.51241,-0.658542,-0.650688,-0.830574,-0.661302,-0.944723,-0.706254,-0.928712,-0.990213,-1.301943,-0.494588,-0.525476,-0.568979,-0.590138,-0.676992,-0.076963,-0.012305,-0.489621,-0.414114,-0.637581,-0.604955,-0.513358,-0.80724,-0.01321,-0.003539,-0.003716,-0.355897,-0.308925,-0.321915,-0.380391,-0.00585,-0.707062,-0.671476,-0.045806,-0.051199
1,-0.083113,-0.088853,-0.398413,-0.499736,-0.55513,-0.592882,-0.334658,-0.384997,-0.286135,-0.146678,-0.51241,-0.658542,-0.144053,0.272594,0.571896,1.122404,0.654635,1.10744,-0.050815,0.88148,-0.462704,-0.506566,-0.409983,-0.536243,-0.63955,-0.076963,-0.012305,-0.414512,-0.399325,-0.259663,-0.209929,-0.421317,0.669207,0.001945,-0.003539,-0.003716,-0.355897,-0.308925,-0.321915,-0.380391,-0.00585,-0.707062,-0.671476,-0.045806,-0.051199
2,-0.083113,-0.088853,-0.398413,-0.499736,-0.55513,-0.592882,-0.334658,-0.384997,-0.286135,-0.146678,-0.51241,-0.658542,-0.481817,0.111614,-0.12805,1.75153,-0.706254,1.766195,-0.632363,0.829266,-0.48636,-0.510885,-0.515751,-0.574243,-0.643975,-0.076766,-0.011492,-0.057743,-0.348563,0.023775,0.649253,-0.288096,0.484651,-0.015844,-0.003539,-0.003716,-0.355897,-0.308925,-0.321915,-0.380391,-0.00585,-0.707062,-0.671476,-0.045806,-0.051199
3,-0.083113,-0.088853,-0.398413,-0.499736,-0.55513,-0.592882,-0.334658,-0.384997,-0.286135,-0.146678,-0.51241,-0.658542,-0.650688,-0.830574,-0.661302,-0.585223,0.654635,-0.599334,-0.990213,-1.301943,-0.494588,-0.525476,-0.568979,-0.590138,-0.676992,-0.076963,-0.012305,-0.489621,-0.414114,-0.637581,-0.604955,-0.513358,-0.80724,-0.01321,-0.003539,-0.003716,-0.355897,-0.308925,-0.321915,-0.380391,-0.00585,-0.707062,-0.671476,-0.045806,-0.051199
4,-0.083113,-0.088853,-0.398413,-0.499736,-0.55513,-0.592882,-0.334658,-0.384997,-0.286135,-0.146678,-0.51241,-0.658542,-0.650688,-0.830574,-0.661302,-0.794931,3.376414,-0.868825,-0.990213,-1.301943,-0.494588,-0.525476,-0.568979,-0.590138,-0.676992,-0.076963,-0.012305,-0.489621,-0.414114,-0.637581,-0.604955,-0.513358,-0.80724,-0.01321,-0.003539,-0.003716,-0.355897,-0.308925,-0.321915,-0.380391,-0.00585,-0.707062,-0.671476,-0.045806,-0.051199


time: 1.89 s


In [4]:
num_comp = 7
pca = PCA(n_components=num_comp)
pca.fit(frame)
princomp = pd.DataFrame(np.dot(frame, pca.components_.T), columns=["CREDIT_CARD_AGG_COMP" + str(i+1) for i in range(num_comp)])
credit_card_agg = pd.concat([credit_card_agg, princomp], axis=1)
credit_card_agg.head()

Unnamed: 0,SK_ID_CURR,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7
0,100006,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.055377,-2.996367,0.956185,-1.143641,0.37796,0.322572,0.12285,-0.890276
1,100011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,54482.111149,189000.0,4031676.225,75.0,2.0,73.0,0.302678,1.05,891.528045,2520.0,65973.075311,0.004953,0.014,0.0,0.0,4.0,0.054054,4.0,180000.0,2432.432432,180000.0,1.0,inf,inf,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.068132,-1.91423,-1.336225,0.97039,-0.360336,-1.157258,-0.099205,0.683874
2,100013,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18159.919219,161420.22,1743352.245,96.0,1.0,95.0,0.115301,1.02489,230.066978,1944.407308,22086.429911,0.001461,0.012345,0.014493,0.014493,23.0,0.239583,7.0,571500.0,5953.125,157500.0,0.0,inf,inf,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.067048,-1.995274,-1.079984,1.425906,-0.458675,-1.500304,-0.189693,1.339213
3,100021,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18.0,2.0,16.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.056155,-3.130604,0.815268,-0.953739,0.421427,0.156045,0.118608,-0.890236
4,100023,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11.0,4.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,,,,0.065454,-3.290014,1.021466,-1.043096,0.623813,0.148561,0.201433,-1.532772


time: 748 ms


In [5]:
credit_card_agg.shape

(103558, 54)

time: 2.29 ms


## Previous Application

In [80]:
previous_agg = pd.read_csv(path + "previous_agg.csv", usecols=lambda c: "AGG_COMP" not in c)
frame = previous_agg.drop(["SK_ID_CURR", "PREVIOUS_AGG_SYNTHETIC_TARGET"], axis=1)
frame = pd.DataFrame(scale.fit_transform(impute.fit_transform(frame.replace([-np.inf, np.inf], np.nan))), columns=frame.columns)
frame.head()

Unnamed: 0,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M
0,-0.20337,-0.269348,-0.091275,-0.038181,0.010188,-0.043361,-0.031073,-0.930878,-0.290102,-1.046355,-0.806661,-0.888488,-0.253118,-0.859038,-0.888254,-0.061548,-0.146919,-0.15241,-0.48176,-1.247146,-1.274387,-0.102814,-0.203811,-0.215664,-0.521022,-1.038093,-1.060894,-0.088357,-0.183755,-0.191317,-0.228004,-2.343923,-1.182417,-0.652054,-1.015875,-0.152471,-0.147753,-0.849415,-0.835933,-0.097335,-0.264047,-0.235391,0.274481,-0.598271,-0.830647,0.220864,0.000575,-0.119362,-0.180841,-0.15509,-0.253959,-0.468607,-0.54178,-0.964522,-0.369597,-0.740713,-0.405002,-0.030494,-0.798083,-1.002924,-0.890906,-0.324769,-0.236958,-0.120713,-0.00144,0.014483,-0.309833,-0.286025,-0.265768,-0.373496,-0.364695,-0.068306,-0.39633,-0.584399,-0.226737,-0.134695,-0.190281,-0.083524,-0.065043,-0.030225,-0.17607,-0.174794
1,-0.20337,-0.283452,-0.091275,-0.038181,-0.471055,-0.043361,-0.601476,-0.930878,-0.273684,-1.037628,-0.792062,-0.888488,1.356782,-0.519619,0.052874,0.18822,-0.13332,-0.095998,2.722014,0.144542,1.363771,0.228852,-0.156504,-0.082367,0.176605,-0.762751,-0.535396,0.014917,-0.168238,-0.147301,1.082426,-0.231896,-1.182417,-0.652054,-1.015875,-0.091135,-0.132774,0.161104,-0.47043,-0.178424,-0.15959,-0.196526,-0.925028,-0.161182,-0.580702,0.522011,0.000575,-0.119362,-0.180841,-0.15509,-0.253959,-0.468607,-0.54178,-0.964522,-0.369597,-0.740713,-0.405002,-0.744408,-0.14507,-1.002924,-0.890906,-0.268249,-0.174918,-0.120713,-0.00144,0.014483,-0.309833,-0.286025,-0.265768,-0.373496,-0.364695,-0.068306,-0.39633,-0.584399,-0.226737,-0.134695,-0.190281,-0.083524,-0.065043,-0.030225,-0.17607,-0.174794
2,-0.20337,-0.269348,-0.091275,-0.038181,0.010188,-0.043361,-0.031073,-0.457024,-0.293849,-1.040419,-0.801492,-0.880512,0.20586,1.353425,1.902399,-0.047899,-0.08057,-0.032452,-0.630963,-0.776257,-0.748664,-0.092859,-0.186106,-0.192924,-0.15432,3.8657,4.153957,-0.083532,-0.029048,0.041124,-0.922508,-0.49264,0.594767,-0.652054,-1.015875,-0.036092,-0.084246,1.841035,1.238222,-0.149521,-0.214605,-0.200318,-0.349796,0.435829,0.313158,0.44364,0.000575,-0.119362,-0.180841,-0.15509,-0.253959,-0.468607,-0.54178,-0.02793,-0.369597,0.773034,-0.405002,-0.744408,-0.14507,0.472577,0.122849,-0.198602,-0.192782,-0.120713,-0.00144,0.014483,-0.309833,-0.286025,-0.265768,-0.373496,-0.364695,-0.068306,-0.39633,-0.584399,-0.226737,-0.134695,-0.190281,-0.083524,-0.065043,-0.030225,-0.17607,-0.174794
3,-0.20337,-0.269348,-0.091275,-0.038181,0.010188,-0.043361,-0.031073,-0.930878,-0.280858,-1.041442,-0.798441,-0.888488,-0.291285,-0.867085,-0.910566,-0.051799,-0.146388,-0.150208,-1.026602,-1.483819,-1.723039,-0.08948,-0.201909,-0.210304,-0.335947,-0.965047,-0.921484,-0.054167,-0.178618,-0.176745,0.840909,-0.621149,-1.182417,-0.652054,-1.015875,-0.149086,-0.146926,-0.853041,-0.837245,0.173388,-0.219829,-0.218939,1.512567,-1.941717,-1.598884,-0.704748,0.000575,-0.119362,-0.180841,-0.15509,-0.253959,-0.468607,-0.54178,-0.964522,-0.369597,-0.740713,-0.405002,-0.744408,-0.798083,-1.002924,-0.890906,-0.290488,-0.199329,-0.120713,-0.00144,0.014483,-0.309833,-0.286025,-0.265768,-0.373496,-0.364695,-0.068306,-0.39633,-0.584399,-0.226737,-0.134695,-0.190281,-0.083524,-0.065043,-0.030225,-0.17607,-0.174794
4,-0.20337,-0.269348,-0.091275,-0.038181,0.010188,-0.043361,-0.031073,-0.693951,-0.278244,-1.040052,-0.796117,-0.888488,-0.499755,-0.823261,-0.910743,-0.073665,-0.145019,-0.149837,0.076156,-1.004792,-0.814969,-0.01476,-0.191251,-0.180275,-0.407549,-0.993307,-0.975419,-0.055876,-0.178875,-0.177473,0.907933,0.31008,-0.689931,-0.323775,0.835001,-0.149157,-0.145374,-0.865971,-0.78905,0.016248,-0.20341,-0.21283,0.327805,-1.197024,-1.173038,-0.191667,0.000575,-0.119362,-0.180841,-0.15509,-0.253959,-0.468607,0.038602,-0.964522,-0.369597,-0.740713,-0.405002,-0.030494,-0.798083,-1.002924,-0.890906,-0.285548,-0.193906,-0.120713,-0.00144,0.014483,-0.309833,-0.286025,-0.265768,-0.373496,-0.364695,-0.068306,-0.39633,-0.180272,-0.226737,-0.134695,-0.190281,-0.083524,-0.065043,-0.030225,-0.17607,-0.174794


time: 12.5 s


In [81]:
previous_agg.shape

(338857, 84)

time: 2.71 ms


In [82]:
num_comp = 7
pca = PCA(n_components=num_comp)
pca.fit(frame)
princomp = pd.DataFrame(np.dot(frame, pca.components_.T), columns=["PREVIOUS_AGG_COMP" + str(i+1) for i in range(num_comp)])
previous_agg = pd.concat([previous_agg, princomp], axis=1)
previous_agg.head()

Unnamed: 0,SK_ID_CURR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7
0,100001,,,,,,,,1.0,-1612.0,-1612.0,-1612.0,0.0,23787.0,23787.0,23787.0,13.67069,13.67069,13.67069,6.020501,6.020501,6.020501,0.00346,0.00346,0.00346,3951.0,3951.0,3951.0,2.27069,2.27069,2.27069,-1740.0,-1740.0,0.0,0.0,0.0,14.273276,14.273276,24835.5,24835.5,6e-05,0.00055,0.00055,0.104326,0.957782,0.957782,0.957782,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.000575,0.000575,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.513661,-3.921423,0.977275,-0.190697,1.345474,-0.545294,1.929032,1.411176
1,100002,,9251.775,,,1.0,,1.0,1.0,-17.0,-17.0,-17.0,0.0,179055.0,179055.0,179055.0,295.470297,295.470297,295.470297,19.353584,19.353584,19.353584,0.031937,0.031937,0.031937,9251.775,9251.775,9251.775,15.266955,15.266955,15.266955,-606.0,-606.0,0.0,0.0,0.0,295.470297,295.470297,179055.0,179055.0,0.0,0.00165,0.00165,0.0,1.0,1.0,1.0,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.00165,0.00165,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.487067,-2.72488,1.59177,2.395666,0.118051,-0.42582,-0.376677,0.405732
2,100003,,,,,,,,3.0,-1976.0,-527.0,-1047.333333,1449.0,68053.5,1035882.0,484191.0,29.070269,1388.581769,612.90394,5.399568,10.531859,8.677472,0.004315,0.014118,0.008318,6737.31,98356.995,56553.99,2.877962,131.845838,70.901357,-2341.0,-746.0,1595.0,0.0,0.0,547.812073,1206.434316,435436.5,900000.0,2.1e-05,0.001071,0.001543,0.05003,1.057664,1.15098,0.989013,,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,0.0,0.0,1.0,2.0,3.0,0.002975,0.00134,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.42019,0.428183,-0.535911,2.110056,-4.18119,1.337309,1.599647,0.545277
3,100004,,,,,,,,1.0,-714.0,-714.0,-714.0,0.0,20106.0,20106.0,20106.0,24.669939,24.669939,24.669939,3.753045,3.753045,3.753045,0.004605,0.004605,0.004605,5357.25,5357.25,5357.25,6.573313,6.573313,6.573313,-815.0,-815.0,0.0,0.0,0.0,29.793865,29.793865,24282.0,24282.0,0.00026,0.001016,0.001016,0.212008,0.828021,0.828021,0.828021,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.001227,0.001227,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506853,-4.125854,1.233849,-0.810943,0.819096,-1.583013,1.885414,1.163706
4,100005,,,,,,,,2.0,-460.0,-460.0,-460.0,0.0,0.0,40153.5,20076.75,0.0,53.042933,26.521466,8.342371,8.342371,8.342371,0.01102,0.01102,0.01102,4813.2,4813.2,4813.2,6.358256,6.358256,6.358256,-757.0,-315.0,442.0,1.0,0.5,29.469947,58.939894,22308.75,44617.5,0.000144,0.001189,0.001189,0.108964,0.89995,0.89995,0.89995,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.001321,0.001321,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,0.529786,-3.004413,0.852979,-0.301994,1.40546,-1.294547,0.780261,1.127595


time: 4.13 s


In [86]:
previous_agg.shape

(338857, 91)

time: 2.45 ms


## Bureau

In [21]:
bureau_agg = pd.read_csv(path + "bureau_agg.csv")
frame = bureau_agg.drop(["SK_ID_CURR", "BUREAU_AGG_SYNTHETIC_TARGET"], axis=1)
frame = pd.DataFrame(scale.fit_transform(impute.fit_transform(frame.replace([-np.inf, np.inf], np.nan))), columns=frame.columns)
frame.head()

Unnamed: 0,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7
0,0.008409,-0.404347,-0.408288,2.979738,2.395456,-0.007603,-0.007255,0.794515,0.745754,0.597533,-0.142532,-0.03202,-0.007135,0.001625,-0.001846,-0.007685,-0.007685,-0.156358,-0.736477,-0.070091,0.426421,-0.151689,-0.03988,-0.716668,0.510476,0.268297,0.085164,-0.085164,0.169495,2.141916,-0.134742,-0.028612,0.073509,0.698633,-0.050086,-0.026582,0.001562,0.187357,1.026268,0.318205,-0.148818,-0.242212,-0.488278,-0.488278,0.355103,-0.113884,-0.287609,-0.166321,0.515261,0.313134,0.523474,-0.036308,-0.035193,-0.051846,-0.051706,-0.828339,0.579231,-0.097297,-0.102979,-0.021913,-0.025746,-0.154452,0.012633,-0.03488,-0.009142,-0.007649,-0.005878,0.005976,0.386648,-0.81578,0.271683,0.047063,-0.129411,-0.869386,-0.2578,-0.229794,-0.00076,0.346875,0.575874,0.662495,-0.323353,-1.129956,0.010354,0.152581
1,-0.022963,-0.404347,-0.408288,-0.198581,-0.235108,-0.011793,-0.011446,0.159632,0.123802,0.019504,-0.353989,-0.03202,-0.007135,0.001625,-0.001846,-0.247348,-0.247348,-0.156358,-0.475448,-5.494959,-0.424205,-0.190473,-0.435191,-0.611796,0.080166,0.255364,-5.329139,5.329139,4.20728,0.088639,-0.210269,1.034886,0.792557,-0.235326,-0.069023,0.174253,0.186197,2.101018,0.352518,0.693025,-0.24541,-0.41464,-0.424878,-0.424878,0.572956,-0.01542,-0.393909,-0.376646,-0.040002,0.53885,-0.034649,-0.036308,-0.035193,-0.051846,-0.051706,-0.727126,0.136671,0.03372,0.027172,-0.004304,0.003479,-0.154452,-0.075583,-0.248757,-0.009142,-0.007649,-0.005878,0.005976,0.383748,0.131473,0.065945,-0.063256,-0.270634,1.774782,-0.2578,-0.229794,-0.056204,0.327436,2.872822,0.236537,-0.400444,-0.335987,-0.167222,0.065951
2,-0.057216,-0.404347,-0.408288,-0.198581,-0.235108,-0.01698,-0.016633,-0.47525,-0.49815,-0.558524,-0.314095,-0.03202,-0.007135,0.001625,-0.001846,-0.415213,-0.415213,-0.156358,-0.16822,0.227302,-0.169636,-0.138085,-0.011643,-0.244743,-0.027412,-0.520616,0.23292,-0.23292,-0.305538,-0.185166,-0.143995,-0.120773,-0.138937,-0.113569,-0.056812,-0.068996,-0.070805,-0.262917,-0.224982,-0.191658,-0.177909,-0.391612,-0.171278,-0.171278,-0.02614,-0.537241,-0.34747,-0.383261,-0.595264,-0.364014,-0.592771,-0.036308,-0.035193,-0.051846,-0.051706,0.215654,-0.390123,-0.097297,-0.102979,-0.021913,-0.025746,-0.154452,-0.246663,-0.398561,-0.009577,-0.007983,-0.005878,0.005976,0.279337,0.96918,0.769155,-0.242179,-0.234064,0.452698,-0.2578,-0.229794,-0.056204,-0.436946,-0.196579,-0.36802,-0.118736,-0.403783,0.040286,0.091427
3,-0.057216,-0.404347,-0.408288,-0.198581,-0.235108,-0.008937,-0.008752,-1.110132,-1.120102,-1.136553,-0.425359,-0.03202,-0.007135,0.001625,-0.001846,-0.415213,-0.415213,-0.156358,-0.16822,0.227302,-0.169636,-0.138085,-0.011643,-0.244743,-0.027412,-0.520616,0.23292,-0.23292,-0.305538,-0.185166,-0.143995,-0.120773,-0.138937,-0.113569,-0.056812,-0.068996,-0.070805,-0.262917,-0.224982,-0.191658,-0.496225,-0.488503,-0.171278,-0.171278,-0.02614,0.167333,-0.517677,-0.288689,-1.150527,-0.815446,-1.150894,-0.036308,-0.035193,-0.051846,-0.051706,-0.155461,-0.418082,-0.097297,-0.102979,-0.021913,-0.025746,-0.154452,-0.246663,-0.398561,-0.009142,-0.007649,-0.005878,0.005976,-0.70386,-0.676776,-0.386897,-0.309133,-0.432911,-0.869386,-0.2578,-0.229794,-0.056204,-1.011322,-0.058936,-0.232194,0.132002,0.053512,-0.026916,0.019336
4,0.009934,-0.404347,-0.408288,-0.198581,-0.235108,-0.007912,-0.007565,0.159632,0.123802,0.019504,-0.29305,-0.03202,-0.007135,0.001625,-0.001846,-0.026999,-0.026999,-0.156358,-1.192315,0.227302,-0.397087,0.743468,-2.242331,-0.664232,-1.614183,-0.313688,0.23292,-0.23292,-0.305538,3.763111,0.915982,-0.120773,-0.138937,0.587925,0.00338,-0.068996,-0.070805,-0.262917,-0.224982,-0.191658,-0.260975,-0.373286,-1.18568,-1.18568,2.479168,0.346254,-0.335966,-0.107972,-0.040002,-0.58973,-0.034649,-0.036308,-0.035193,-0.051846,-0.051706,-0.803973,0.455183,-0.097297,-0.102979,-0.021913,-0.025746,-0.154452,-0.002122,-0.052116,-0.009142,-0.007649,-0.005878,0.005976,0.372147,-0.851682,-1.047653,-0.121223,-0.320547,-0.208344,-0.2578,-0.229794,-0.046684,-0.614042,-0.327899,2.136838,-0.300343,-0.836535,0.108691,0.118957


time: 10.6 s


In [22]:
num_comp = 7
pca = PCA(n_components=num_comp)
pca.fit(frame)
princomp = pd.DataFrame(np.dot(frame, pca.components_.T), columns=["BUREAU_AGG_COMP" + str(i+1) for i in range(num_comp)])
bureau_agg = pd.concat([bureau_agg, princomp], axis=1)
bureau_agg.head()

Unnamed: 0,SK_ID_CURR,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,BUREAU_AGG_COMP1.1,BUREAU_AGG_COMP2.1,BUREAU_AGG_COMP3.1,BUREAU_AGG_COMP4.1,BUREAU_AGG_COMP5.1,BUREAU_AGG_COMP6.1,BUREAU_AGG_COMP7.1
0,100001,603.706712,0.0,0.0,1.0,1.0,0.987405,0.987405,3.0,3.0,3.0,3091.0,0.0,,,,596686.5,596686.5,0.0,8.857143,0.983871,1.774194,0.007155,47.5,0.5,47.0,61.0,0.992481,0.007519,0.052632,0.349547,0.021053,0.000835,0.005848,120775.784672,1800.0,282.105263,1974.736842,0.142857,0.111111,0.015873,884025.0,3091.0,19.0,19.0,-51.0,-1329.0,1778.0,577.0,3.0,7.0,3.0,0.0,0.0,0.0,0.0,49.0,0.029363,,0.0,,0.0,0.0,53216.5875,596686.5,inf,inf,0.0,,-6.0,149.0,1523.0,100412.66129,1453365.0,0.0,0.0,0.0,24817.5,0.102038,1.10057,1.523734,1.496514,-0.660367,-1.992638,0.017996,0.257508,1.153939,1.628928,1.6366,-0.735256,-2.289269,0.020571,0.297415
1,100002,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,inf,inf,0.0,inf,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0,0.110174,1.038894,7.601345,0.534316,-0.817806,-0.592501,-0.290651,0.111304,1.089273,8.126102,0.584333,-0.910594,-0.682808,-0.335013,0.132145
2,100003,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0,0.051376,-1.386349,-0.52014,-0.831323,-0.242488,-0.712057,0.070022,0.154299,-1.453577,-0.556047,-0.909142,-0.270006,-0.818596,0.080747,0.179907
3,100004,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0,0.06984,-3.20874,-0.155941,-0.524505,0.269582,0.094367,-0.046783,0.032632,-3.36434,-0.166707,-0.573602,0.300168,0.108468,-0.053954,0.037803
4,100005,617.739835,0.0,0.0,0.0,0.0,0.954794,0.954794,2.0,2.0,2.0,1446.0,0.0,,,,568408.5,568408.5,0.0,5.333333,1.0,0.3125,0.086957,8.5,1.0,7.5,16.0,1.0,0.0,0.0,0.539216,0.117647,0.0,0.0,107036.117647,6882.352941,0.0,0.0,0.0,0.0,0.0,598626.0,1446.0,8.0,8.0,-12.0,-128.0,1324.0,1318.0,2.0,3.0,2.0,0.0,0.0,0.0,0.0,62.0,0.026109,0.0,0.0,0.0,0.0,0.0,50188.368035,568408.5,inf,inf,0.0,0.0,-11.0,110.0,311.0,53154.691016,657126.0,1.0,0.0,0.0,4261.5,0.130488,-1.948244,-0.867605,4.826918,-0.613374,-1.4752,0.188919,0.200762,-2.042719,-0.9275,5.278753,-0.682956,-1.69583,0.217995,0.233441


time: 3.7 s


## Installments

In [25]:
installment_agg = pd.read_csv(path + "installment_agg.csv")
frame = installment_agg.drop(["SK_ID_CURR", "INSTALLMENT_AGG_SYNTHETIC_TARGET"], axis=1)
frame = pd.DataFrame(scale.fit_transform(impute.fit_transform(frame.replace([-np.inf, np.inf], np.nan))), columns=frame.columns)
frame.head()

Unnamed: 0,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M
0,0.091688,0.060134,-0.217287,-0.310109,-0.116706,1.450319,-0.474592,0.042166,0.063254,-0.444175,-0.181221,-0.519936,-0.333909,-0.491256,-0.02592,-0.091849,-0.533982,-0.697498,-0.372866,-2.418434,-1.439745,0.016456,-0.20703,-0.280256,-0.461958,0.11574,-0.215724,-0.110836,-0.043183,0.067345
1,0.091688,0.060134,0.059417,-0.164289,-0.059087,-1.119002,-0.474592,0.042166,0.063254,-0.444175,0.022495,-0.295049,0.025893,-0.348274,0.008641,0.27376,-0.175815,-0.505823,-0.529753,0.519997,1.109948,-0.77654,-0.20703,-0.280256,-0.040331,0.237362,0.064922,-0.084646,-0.254742,0.240574
2,0.091688,0.060134,-0.217287,-0.310109,-0.116706,0.788044,-0.474592,0.042166,0.063254,-0.444175,0.034298,1.813283,0.008253,1.685522,-0.022239,0.095203,-0.034598,0.997287,-0.529753,-0.40117,-0.791648,0.536661,-0.20703,-0.280256,-0.461958,0.11574,-0.215724,-0.110836,-0.153562,0.829552
3,0.091688,0.060134,-0.217287,-0.310109,-0.116706,-0.879665,-0.474592,0.042166,0.063254,-0.444175,-0.167281,-0.471938,-0.332615,-0.51859,-0.013021,0.005144,-0.532685,-0.718883,-0.529753,-0.741723,0.882238,-1.273484,-0.20703,-0.280256,-0.461958,0.11574,-0.215724,-0.110836,-0.171958,0.933489
4,0.091688,0.060134,-0.217287,-0.310109,-0.116706,-0.964908,-0.474592,0.042166,0.063254,-0.444175,-0.16362,-0.505863,-0.324894,-0.490221,-0.013498,-0.032381,-0.518384,-0.681421,-0.372866,-0.26346,0.946829,-1.064133,-0.20703,-0.280256,-0.461958,0.11574,-0.215724,-0.110836,-0.135165,0.032699


time: 4.56 s


In [26]:
num_comp = 7
pca = PCA(n_components=num_comp)
pca.fit(frame)
princomp = pd.DataFrame(np.dot(frame, pca.components_.T), columns=["INSTALLMENT_AGG_COMP" + str(i+1) for i in range(num_comp)])
installment_agg = pd.concat([installment_agg, princomp], axis=1)
installment_agg.head()

Unnamed: 0,SK_ID_CURR,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7
0,100001,0.0,0.0,,,,2916.0,0.0,0.0,0.0,0.0,3.116986,5885.132143,10.686671,17397.9,1.365586,3951.0,21.8189,41195.925,1.0,-1628.0,-2916.0,1288.0,,,0.0,0.0,,,11.0,-36.0,0.06575,-1.311336,-0.289649,-1.265137,0.259213,1.925718,0.03656,1.028292
1,100002,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0,0.087013,-0.752288,1.616157,0.754784,-0.702447,-0.535793,0.056893,0.006947
2,100003,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0,0.050903,0.659627,-0.035899,-0.624043,1.42402,0.239304,-0.727819,1.224179
3,100004,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0,0.111008,-1.700891,1.634542,0.456757,-0.633019,-0.255442,-0.037613,0.026482
4,100005,0.0,0.0,,,,706.0,0.0,0.0,0.0,0.0,11.09417,6240.205,37.566479,17656.245,6.539674,4813.2,99.847528,56161.845,1.0,-470.0,-736.0,266.0,,,0.0,0.0,,,1.0,-37.0,0.114271,-1.571981,1.428804,0.404391,-0.61607,-0.355109,-0.043216,-0.162738


time: 1.96 s


In [27]:
installment_agg.shape

(339587, 39)

time: 2.53 ms


# Linear Discriminant Analysis

In [None]:
df = pd.read_csv(path + "train.csv")
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")
df.drop("LDA_SCORE", axis=1, inplace=True)
df.head()

In [None]:
scaled_df = pd.DataFrame(scale.fit_transform(quant.fit_transform(impute.fit_transform(df))), 
                        columns=df.columns, 
                        index=df.index)
del df
gc.collect()

In [7]:
lda_score = pd.Series(np.empty(len(y)), 
                     index=scaled_df.index, 
                     name="LDA_SCORE")

time: 1.46 ms


In [8]:
kfold = StratifiedKFold(n_splits=3)

time: 716 µs


In [9]:
for train_indx, test_indx in kfold.split(scaled_df.values, y.values):
    print("Fitting...")
    clf = LinearDiscriminantAnalysis()
    clf.fit(scaled_df.iloc[train_indx], y.iloc[train_indx])
    print("Scoring...")
    lda_score.iloc[test_indx] = clf.predict_proba(scaled_df.iloc[test_indx])[:,1]

Fitting...
Scoring...
Fitting...
Scoring...
Fitting...
Scoring...
time: 1min 9s


In [10]:
roc_auc_score(y, lda_score)

0.776766596344993

time: 94.2 ms


In [12]:
del scaled_df
gc.collect()

134

time: 163 ms


#### Write to train.csv

In [21]:
df = pd.read_csv(path + "train.csv")
df.join(lda_score).to_csv(path + "train.csv", index=False, header=True)
del df
gc.collect()

35

time: 2min 19s


#### Refit and score test set

In [3]:
df = pd.read_csv(path + "train.csv", usecols=lambda c: c != "LDA_SCORE")
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")
df.head()

Unnamed: 0,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,0,1,0,202500.0,406597.5,24700.5,351000.0,0.018801,-9461,-637.0,-3648.0,-2120,,1,1,0,1,1,0,1.0,2,2,10,0,0,0,0,0,0,42,0.083037,0.262949,0.139376,0.0247,0.0369,0.9722,0.6192,0.0143,0.0,0.069,0.0833,0.125,0.0369,0.0202,0.019,0.0,0.0,0.0252,0.0383,0.9722,0.6341,0.0144,0.0,0.069,0.0833,0.125,0.0377,0.022,0.0198,0.0,0.0,0.025,0.0369,0.9722,0.6243,0.0144,0.0,0.069,0.0833,0.125,0.0375,0.0205,0.0193,0.0,0.0,0.0149,2.0,2.0,2.0,2.0,-1134.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,1.0,,9251.775,,,1.0,,1.0,1.0,-17.0,-17.0,-17.0,0.0,179055.0,179055.0,179055.0,295.470297,295.470297,295.470297,19.353584,19.353584,19.353584,0.031937,0.031937,0.031937,9251.775,9251.775,9251.775,15.266955,15.266955,15.266955,-606.0,-606.0,0.0,0.0,0.0,295.470297,295.470297,179055.0,179055.0,0.0,0.00165,0.00165,0.0,1.0,1.0,1.0,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.00165,0.00165,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.487067,-2.72488,1.59177,2.395666,0.118051,-0.42582,-0.376677,0.405732,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,,,0.0,,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0,0.527927,1.038894,7.601345,0.534316,-0.817806,-0.592501,-0.290651,0.111304,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0,0.514141,-0.752288,1.616157,0.754784,-0.702447,-0.535793,0.056893,0.006947,0.0,0.0,1.0,6.0,11.0,0.0,0.510127,-413.11154,688.495146,-0.059719,2.007889,609097.5,1.158397,1.85132,1.733333,16.461104,2.270797,2.270797,0.003043,0.067329,-5419.0,0.057083,0.028429,0.467976,-5768.0,0.0,,0.440374,-21.403657,-6902.0,1.0,0.0,0.0,,0.0,4.0,,2.530201,,-2.610771,-38.776295,-15734218.5,1.720755,3.216931,0.037602,0,2.0207,2.041,2.0274,1,-0.0,0.0,0.018801,53.18866,,-9e-06,-785.612748,0.509815,2.039261,0.527927,0.487067,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0
1,0,0,0,270000.0,1293502.5,35698.5,1129500.0,0.003541,-16765,-1188.0,-1186.0,-291,,1,1,0,1,1,0,2.0,1,1,11,0,0,0,0,0,0,13,0.311267,0.622246,,0.0959,0.0529,0.9851,0.796,0.0605,0.08,0.0345,0.2917,0.3333,0.013,0.0773,0.0549,0.0039,0.0098,0.0924,0.0538,0.9851,0.804,0.0497,0.0806,0.0345,0.2917,0.3333,0.0128,0.079,0.0554,0.0,0.0,0.0968,0.0529,0.9851,0.7987,0.0608,0.08,0.0345,0.2917,0.3333,0.0132,0.0787,0.0558,0.0039,0.01,0.0714,1.0,0.0,1.0,0.0,-828.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,3.0,-1976.0,-527.0,-1047.333333,1449.0,68053.5,1035882.0,484191.0,29.070269,1388.581769,612.90394,5.399568,10.531859,8.677472,0.004315,0.014118,0.008318,6737.31,98356.995,56553.99,2.877962,131.845838,70.901357,-2341.0,-746.0,1595.0,0.0,0.0,547.812073,1206.434316,435436.5,900000.0,2.1e-05,0.001071,0.001543,0.05003,1.057664,1.15098,0.989013,,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,0.0,0.0,1.0,2.0,3.0,0.002975,0.00134,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.42019,0.428183,-0.535911,2.110056,-4.18119,1.337309,1.599647,0.545277,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0,0.459588,-1.386349,-0.52014,-0.831323,-0.242488,-0.712057,0.070022,0.154299,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0,0.47399,0.659627,-0.035899,-0.624043,1.42402,0.239304,-0.727819,1.224179,0.0,0.0,3.0,,,,0.495285,-467.126033,666.118421,-0.137787,4.79075,1563502.5,1.145199,0.799018,4.183333,36.234085,2.970588,1.437225,,0.070862,-3202.0,0.239832,0.050061,1.81393,-1477.0,0.0,,0.695785,-16.104981,-2305.0,0.0,0.0,0.0,,,0.0,,0.179272,,-2.129347,-30.049242,-42409818.0,4.075601,1.432367,0.003541,0,2.8888,2.8723,2.8954,1,-0.0,0.0,0.0,0.0,,-1.9e-05,-5218.396475,0.462263,1.849054,0.495285,0.42019,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0
2,1,1,0,67500.0,135000.0,6750.0,135000.0,0.010032,-19046,-225.0,-4260.0,-2531,26.0,1,1,1,1,1,0,1.0,2,2,9,0,0,0,0,0,0,22,,0.555912,0.729567,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-815.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,1.0,-714.0,-714.0,-714.0,0.0,20106.0,20106.0,20106.0,24.669939,24.669939,24.669939,3.753045,3.753045,3.753045,0.004605,0.004605,0.004605,5357.25,5357.25,5357.25,6.573313,6.573313,6.573313,-815.0,-815.0,0.0,0.0,0.0,29.793865,29.793865,24282.0,24282.0,0.00026,0.001016,0.001016,0.212008,0.828021,0.828021,0.828021,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.001227,0.001227,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506853,-4.125854,1.233849,-0.810943,0.819096,-1.583013,1.885414,1.163706,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0,0.484335,-3.20874,-0.155941,-0.524505,0.269582,0.094367,-0.046783,0.032632,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0,0.525224,-1.700891,1.634542,0.456757,-0.633019,-0.255442,-0.037613,0.026482,0.0,0.0,1.0,,,,0.509493,-193.488025,,-0.041163,2.0,202500.0,1.0,6.341462,2.0,20.0,5.559674,5.559674,,0.011814,-5300.0,0.105128,0.052564,1.051282,-6791.0,0.0,,0.179867,-3.544051,-7606.0,0.0,0.0,0.0,,,0.0,-0.001365,,-19020.0,-0.354405,-30.0,-1518750.0,1.683129,5.226994,0.020064,0,,,,0,-0.0,0.0,0.010032,99.681021,0.038462,,,0.506476,2.025905,0.525224,0.484335,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
3,0,1,0,135000.0,312682.5,29686.5,297000.0,0.008019,-19005,-3039.0,-9833.0,-2437,,1,1,0,1,0,0,2.0,2,2,17,0,0,0,0,0,0,42,,0.650442,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,0.0,2.0,0.0,-617.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,,,,,13500.0,2482.92,0.799989,1.029197,1.012684,1.316797,1.316797,9.0,-416.0,365243.0,182481.75,365659.0,0.0,906615.0,291695.5,0.0,5008.922652,1358.887335,9.230206,27.839644,17.767287,0.015809,0.15381,0.081751,2482.92,39954.51,23651.175,4.024182,180.641436,96.293912,-617.0,-181.0,436.0,5.0,0.555556,1242.561634,3803.867403,272203.26,688500.0,0.000439,0.004129,0.007275,0.163412,1.012684,1.316797,0.799989,,0.0,0.0,0.0,1.0,1.0,3.0,5.0,0.0,0.0,0.0,2.0,2.0,1.0,4.0,0.015886,0.005525,2.0,,,1.0,1.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,,,,,,,,0.505468,2.847059,-1.193277,-0.546901,-0.548065,0.197115,-2.467181,-0.502496,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.471819,-2.996367,0.956185,-1.143641,0.37796,0.322572,0.12285,-0.890276,0.0,0.0,691786.89,691786.89,29027.52,545.0,0.0,0.0,0.0,0.0,543.096731,62947.088438,3975.786724,691786.89,4.318122,2482.92,8689.547693,1007153.415,0.0,-12.0,-575.0,563.0,0.0,0.0,865952.01,749841.93,691786.89,29027.52,-1.0,-77.0,0.561795,7.1613,2.248679,2.477131,-3.866771,0.665976,-0.403882,2.419674,0.0,0.0,3.0,0.0,48.0,0.0,0.523314,,,-0.028677,2.316167,447682.5,1.052803,0.310462,2.2,10.532818,1.14871,0.45415,,0.159905,-13489.0,0.466275,0.201313,2.120394,-12270.0,0.2,,2.201914,-7.103394,-12887.0,,,,,,0.0,,,,-1.562036,-9.768509,-90217273.5,4.034879,15.936791,0.016038,0,,,,1,-0.0,0.0,0.008019,124.703828,,,,0.515599,2.062397,0.561795,0.471819,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
4,0,1,0,121500.0,513000.0,21865.5,513000.0,0.028663,-19932,-3038.0,-4311.0,-3458,,1,1,0,1,0,0,1.0,2,2,11,0,0,0,0,1,1,12,,0.322738,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-1106.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,16037.64,,,1.108236,,1.108236,6.0,-2041.0,365243.0,72143.8,367284.0,14616.0,284400.0,166638.75,6.201103,733.391711,248.03877,7.968206,21.858453,12.644075,0.003381,0.045729,0.016725,1834.29,22678.785,12278.805,0.778231,42.88139,16.715844,-2357.0,-374.0,1983.0,1.0,0.166667,222.881532,661.764706,150530.25,247500.0,7.5e-05,0.001244,0.002963,0.159516,1.046356,1.264,0.85093,,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,1.0,3.0,0.0,3.0,5.0,0.005724,0.002674,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.492233,0.206872,-1.706155,-1.707714,-0.435966,2.093007,1.031252,-1.305981,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-783.0,-783.0,-783.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1149.0,0.00087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-783.0,0.0,0.0,186.781609,146250.0,0.0,0.0,0.0,0.0,0.49316,-3.843688,0.002791,-0.603251,0.532176,0.838862,-0.111817,-0.095342,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,16037.64,16037.64,16037.64,2326.0,3.0,29857.365,25.402727,22655.655,49.833434,12214.060227,1145.545714,22678.785,0.000125,0.18,3289.00667,806127.975,16.0,-14.0,-2318.0,2304.0,0.0,0.0,96225.84,0.0,16037.64,16037.64,12.0,-31.0,0.501933,0.056196,-1.978048,-0.43754,0.186092,0.663907,0.565579,-0.741146,0.0,0.0,5.0,13.0,18.0,0.0,0.48669,-186.781609,,-0.116697,4.222222,634500.0,1.0,0.636375,4.222222,23.461618,3.407953,2.072727,,0.152418,-8455.0,0.100527,0.023809,0.5586,-7769.0,0.0,,0.482456,-6.095725,-8875.0,0.0,0.0,0.0,,,0.0,,,,-1.097005,-7.197334,-66427389.0,1.246674,3.89783,0.057326,2,,,,1,-0.0,0.0,0.028663,34.888183,,,,0.493504,1.974017,0.501933,0.48669,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1


time: 27.6 s


In [4]:
scaled_df = pd.DataFrame(scale.fit_transform(quant.fit_transform(impute.fit_transform(df))), 
                        columns=df.columns, 
                        index=df.index)
del df
gc.collect()

7

time: 1min 16s


In [5]:
clf = LinearDiscriminantAnalysis()
clf.fit(scaled_df, y)

LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,
              solver='svd', store_covariance=False, tol=0.0001)

time: 36.2 s


In [6]:
del scaled_df
gc.collect()

0

time: 187 ms


In [7]:
df_test = pd.read_csv(path + "test.csv")
df_test.head()

Unnamed: 0,SK_ID_CURR,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,100001,0,1,0,135000.0,568800.0,20560.5,450000.0,0.01885,-19241,-2329.0,-5170.0,-812,,1,1,0,1,0,1,2.0,2,2,18,0,0,0,0,0,0,24,0.752614,0.789654,0.15952,0.066,0.059,0.9732,,,,0.1379,0.125,,,,0.0505,,,0.0672,0.0612,0.9732,,,,0.1379,0.125,,,,0.0526,,,0.0666,0.059,0.9732,,,,0.1379,0.125,,,,0.0514,,,0.0392,0.0,0.0,0.0,0.0,-1740.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,1.0,-1612.0,-1612.0,-1612.0,0.0,23787.0,23787.0,23787.0,13.67069,13.67069,13.67069,6.020501,6.020501,6.020501,0.00346,0.00346,0.00346,3951.0,3951.0,3951.0,2.27069,2.27069,2.27069,-1740.0,-1740.0,0.0,0.0,0.0,14.273276,14.273276,24835.5,24835.5,6e-05,0.00055,0.00055,0.104326,0.957782,0.957782,0.957782,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.000575,0.000575,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.513661,-3.921423,0.977275,-0.190697,1.345474,-0.545294,1.929032,1.411176,603.706712,0.0,0.0,1.0,1.0,0.987405,0.987405,3.0,3.0,3.0,3091.0,0.0,,,,596686.5,596686.5,0.0,8.857143,0.983871,1.774194,0.007155,47.5,0.5,47.0,61.0,0.992481,0.007519,0.052632,0.349547,0.021053,0.000835,0.005848,120775.784672,1800.0,282.105263,1974.736842,0.142857,0.111111,0.015873,884025.0,3091.0,19.0,19.0,-51.0,-1329.0,1778.0,577.0,3.0,7.0,3.0,0.0,0.0,0.0,0.0,49.0,0.029363,,0.0,,0.0,0.0,53216.5875,596686.5,,,0.0,,-6.0,149.0,1523.0,100412.66129,1453365.0,0.0,0.0,0.0,24817.5,0.525061,1.10057,1.523734,1.496514,-0.660367,-1.992638,0.017996,0.257508,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,2916.0,0.0,0.0,0.0,0.0,3.116986,5885.132143,10.686671,17397.9,1.365586,3951.0,21.8189,41195.925,1.0,-1628.0,-2916.0,1288.0,,,0.0,0.0,,,11.0,-36.0,0.485121,-1.311336,-0.289649,-1.265137,0.259213,1.925718,0.03656,1.028292,7.0,7.0,2.0,,,,0.503134,2518.830156,285.999676,-0.151551,4.213333,703800.0,1.264,13.807191,3.333333,27.664697,22.9027,22.9027,0.094803,0.121044,-9239.0,0.043594,0.010347,0.286235,-5982.0,0.0,,0.043663,-7.016267,-7722.0,0.0,0.0,0.0,,,0.0,,,,-1.068578,-8.828038,-47885404.5,6.366995,2.971264,0.0377,0,,,,1,-0.0,0.0,0.01885,53.050398,,-3.9e-05,-14481.055414,0.506744,2.026977,0.525061,0.485121,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0
1,100005,0,1,0,99000.0,222768.0,17370.0,180000.0,0.035792,-18064,-4469.0,-9118.0,-1623,,1,1,0,1,0,0,2.0,2,2,9,0,0,0,0,0,0,46,0.56499,0.291656,0.432962,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,3.0,,,,,,,,2.0,-460.0,-460.0,-460.0,0.0,0.0,40153.5,20076.75,0.0,53.042933,26.521466,8.342371,8.342371,8.342371,0.01102,0.01102,0.01102,4813.2,4813.2,4813.2,6.358256,6.358256,6.358256,-757.0,-315.0,442.0,1.0,0.5,29.469947,58.939894,22308.75,44617.5,0.000144,0.001189,0.001189,0.108964,0.89995,0.89995,0.89995,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.001321,0.001321,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,0.529786,-3.004413,0.852979,-0.301994,1.40546,-1.294547,0.780261,1.127595,617.739835,0.0,0.0,0.0,0.0,0.954794,0.954794,2.0,2.0,2.0,1446.0,0.0,,,,568408.5,568408.5,0.0,5.333333,1.0,0.3125,0.086957,8.5,1.0,7.5,16.0,1.0,0.0,0.0,0.539216,0.117647,0.0,0.0,107036.117647,6882.352941,0.0,0.0,0.0,0.0,0.0,598626.0,1446.0,8.0,8.0,-12.0,-128.0,1324.0,1318.0,2.0,3.0,2.0,0.0,0.0,0.0,0.0,62.0,0.026109,0.0,0.0,0.0,0.0,0.0,50188.368035,568408.5,,,0.0,0.0,-11.0,110.0,311.0,53154.691016,657126.0,1.0,0.0,0.0,4261.5,0.54662,-1.948244,-0.867605,4.826918,-0.613374,-1.4752,0.188919,0.200762,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,706.0,0.0,0.0,0.0,0.0,11.09417,6240.205,37.566479,17656.245,6.539674,4813.2,99.847528,56161.845,1.0,-470.0,-736.0,266.0,,,0.0,0.0,,,1.0,-37.0,0.525405,-1.571981,1.428804,0.404391,-0.61607,-0.355109,-0.043216,-0.162738,0.0,0.0,1.0,,,,0.508932,498.578149,413.987552,-0.039083,2.250182,321768.0,1.2376,3.966536,1.818182,12.82487,9.985678,4.992839,0.071345,0.247398,-13587.0,0.063032,0.028012,0.359252,-10741.0,0.0,,0.200287,-5.480514,-10741.0,3.0,0.0,0.0,,0.0,0.0,,,,-0.961581,-3.886776,-77626530.0,5.617991,,0.071584,0,,,,1,-0.0,0.0,0.035792,27.939204,,-3.1e-05,-10205.983005,0.527686,2.110743,0.54662,0.508932,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
2,100013,1,1,0,202500.0,663264.0,69777.0,630000.0,0.019101,-20038,-4458.0,-2175.0,-3503,5.0,1,1,0,1,0,0,2.0,2,2,14,0,0,0,0,0,0,57,,0.699787,0.610991,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-856.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,1.0,4.0,4742.415,4742.415,1.079158,1.079158,1.079158,1.079158,1.079158,4.0,-1702.0,-85.0,-710.333333,1617.0,0.0,512370.0,146134.125,0.0,598.563084,177.826452,5.109738,22.128804,11.523312,0.003668,0.025851,0.016079,4742.415,23153.985,11478.195,3.270728,27.049048,15.897086,-1999.0,-222.0,1777.0,1.0,0.25,158.370361,525.700935,130871.25,450000.0,3.4e-05,0.001918,0.003953,0.067217,1.052363,1.1386,0.93933,,0.0,0.0,0.0,0.0,0.0,1.0,3.0,0.0,1.0,0.0,1.0,0.0,1.0,3.0,0.005331,0.003663,2.0,,,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,,,,,,,,0.499304,-0.690857,-0.565602,-0.438265,0.496767,0.94185,0.88094,0.138659,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,0.0,31.75,0.944882,0.811024,0.005744,54.5,19.5,35.0,120.0,0.934538,0.065462,0.136364,0.027611,0.015847,0.001329,0.002502,11763.832141,1358.464615,935.629196,1895.27027,0.75,0.027778,0.016119,0.0,0.0,40.0,40.0,-68.0,-1707.0,-567.0,-4272.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,1210.0,0.002409,14.471514,14.471514,19305.0,19305.0,0.0,0.0,0.0,,,,,-4.0,1330.0,860.0,9516.034492,2072280.06,0.0,2.0,0.0,0.0,0.450764,-1.855564,2.735181,-2.778506,1.382593,1.031266,-0.318153,-0.061797,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18159.919219,161420.22,1743352.245,96.0,1.0,95.0,0.115301,1.02489,230.066978,1944.407308,22086.429911,0.001461,0.012345,0.014493,0.014493,23.0,0.239583,7.0,571500.0,5953.125,157500.0,0.0,,,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.481502,-1.995274,-1.079984,1.425906,-0.458675,-1.500304,-0.189693,1.339213,9484.83,9484.83,4741.245,357347.745,23.58,2705.0,10.0,179437.725,381.708698,23147.82,14.445926,9740.235774,1029.820591,357347.745,0.01181,6.165,2239.118537,1509736.545,11.0,-14.0,-2705.0,2691.0,4718.835,4718.835,15871.995,-357348.915,4742.415,274.32,21.0,-38.0,0.500121,0.701369,-3.623967,-0.465886,1.219061,-0.284452,-0.394729,-0.151084,18.0,0.0,3.0,0.0,3.0,36.0,0.509721,-485.084284,,-0.134994,3.275378,865764.0,1.0528,0.439324,3.111111,9.505482,5.068065,1.47392,,0.222477,-7489.0,0.0481,0.014685,0.139591,-5678.0,0.0,8.888818,0.678463,-10.105799,-6534.0,5.0,1.0,0.0,0.0,0.2,0.0,-0.00025,,-20033.0,-3.482234,-15.652086,-311065866.0,0.620896,2.540888,0.038202,0,,,,1,-0.0,0.0,0.019101,52.35328,0.2,,,0.488282,2.441412,0.509721,0.450764,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
3,100028,0,1,2,315000.0,1575000.0,49018.5,1575000.0,0.026392,-13976,-1866.0,-2000.0,-4208,,1,1,0,1,1,0,4.0,2,2,11,0,0,0,0,0,0,42,0.525734,0.509677,0.612704,0.3052,0.1974,0.997,0.9592,0.1165,0.32,0.2759,0.375,0.0417,0.2042,0.2404,0.3673,0.0386,0.08,0.3109,0.2049,0.997,0.9608,0.1176,0.3222,0.2759,0.375,0.0417,0.2089,0.2626,0.3827,0.0389,0.0847,0.3081,0.1974,0.997,0.9597,0.1173,0.32,0.2759,0.375,0.0417,0.2078,0.2446,0.3739,0.0388,0.0817,0.37,0.0,0.0,0.0,0.0,-1805.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,3.0,,,,,,,,5.0,-1081.0,365243.0,121182.666667,366324.0,0.0,225000.0,92920.5,0.0,151.006711,69.509847,8.507039,21.692944,16.733328,0.010674,0.013423,0.012038,6028.02,11250.0,8091.585,3.339623,8.778839,6.556266,-1805.0,-531.0,1274.0,2.0,0.4,40.92331,82.75596,49207.5,130765.5,7.2e-05,,,0.057708,,,0.902436,,0.0,0.0,0.0,0.0,0.0,1.0,3.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,0.001809,0.001255,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506871,-1.06098,-0.298669,-0.388277,0.796905,0.387967,-0.199159,-1.206917,161.513904,178591.5,178591.5,0.0,0.0,0.838975,0.838975,4.0,4.0,4.0,31491.0,0.0,,,,178591.5,178591.5,0.0,24.75,1.0,0.885522,0.002466,65.5,4.0,61.5,297.0,1.0,0.0,0.0,0.064056,0.015267,0.0,0.0,9514.816939,0.0,0.0,0.0,0.0,0.0,0.0,735750.0,32596.0,60.0,60.0,-69.0,-1862.0,30885.0,23877.0,5.0,12.0,5.0,0.0,0.0,0.0,0.0,269.0,0.013641,0.0,0.0,0.0,0.0,0.0,2458.279889,186304.5,,,0.0,0.0,-20.0,1544.0,1836.0,14667.35831,1520875.08,5.0,0.0,0.0,21084.075,0.505237,5.622416,-1.250694,-1.959916,-3.17416,2.3044,-0.75604,-0.057765,0.0,0.0,22823.55,22823.55,11250.0,11250.0,9.0,12.0,9029.385,5495.775,13711.305,0.060939,8085.058163,37335.915,396167.85,49.0,1.0,48.0,0.035934,0.165937,1461.966014,37335.915,71636.334672,0.006498,0.165937,0.0,0.0,117.0,2.387755,12.0,301663.62,6156.400408,22823.55,0.565555,,,0.0,0.0,0.0,0.0,1.019568,0.165937,0.165937,,,0.474385,-0.824511,1.474199,0.817147,-1.033729,-0.138804,0.003143,-0.12993,16360.11,0.0,11250.0,11250.0,1.17,1773.0,10.0,70348.23,131.908966,8505.0,11.108996,4356.731549,387.931034,38988.54,0.001572,1.17,1255.316553,492310.665,12.0,-29.0,-1785.0,1756.0,0.0,8505.0,22503.51,-23583.33,11250.0,1.17,7.0,-19.0,0.518258,-0.789362,-1.863631,0.100024,-0.152822,-0.011525,0.885663,-1.055896,0.0,0.0,2.0,,,,0.50267,63.696238,22.571788,-0.12686,5.0,1890000.0,1.0,3.199199,5.0,32.130726,32.007316,12.044461,0.164177,0.133515,-5671.0,0.013831,0.002766,0.088879,-6208.0,0.0,4.617891,0.083026,-22.538638,-8013.0,3.0,0.0,0.0,,0.0,0.0,,0.564595,,-3.507334,-26.269293,-91468521.0,0.475285,1.108033,0.052784,0,4.5184,4.5838,4.5389,1,-0.000143,75.78054,0.026392,37.89027,,-3.8e-05,-7347.658072,0.501484,2.50742,0.518258,0.474385,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0
4,100038,1,0,1,180000.0,625500.0,32067.0,625500.0,0.010032,-13040,-2191.0,-4000.0,-4262,16.0,1,1,1,1,0,0,3.0,2,2,5,0,0,0,0,1,1,42,0.202145,0.425687,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-821.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,,,,,24463.71,24463.71,1.118802,1.118802,1.118802,1.118802,1.118802,2.0,-449.0,-449.0,-449.0,0.0,92605.5,508495.5,300550.5,112.795981,4581.040541,2346.918261,8.342387,20.785707,14.564047,0.010161,0.187259,0.09871,11100.6,24463.71,17782.155,13.520828,220.393784,116.957306,-821.0,-111.0,710.0,1.0,0.5,2096.599977,4094.594595,267727.5,454500.0,0.000107,0.005736,0.010079,0.087554,1.131358,1.143913,1.118802,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,1.0,0.001218,0.001218,0.0,,,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,1.0,20.785707,20.785707,20.785707,1.118802,1.118802,532959.21,532959.21,0.568242,1.571133,2.179596,4.183057,1.353692,-0.953153,2.186798,-0.578805,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,787.0,0.0,0.0,0.0,0.0,18.007955,11100.3375,23.81427,11100.6,13.841147,11097.45,216.095461,133204.05,0.0,-466.0,-802.0,336.0,,,0.0,0.0,,,-9.0,-18.0,0.515418,-1.508894,1.59145,0.517567,-0.392059,-0.30697,-0.006584,-0.016673,0.0,0.0,1.0,,,,0.508932,,,-0.060353,3.475,805500.0,1.0,4.695803,3.475,19.506034,2.336331,1.376238,,0.168021,-7012.0,0.061669,0.017746,0.346161,-8262.0,0.0,,0.726619,-13.803681,-9083.0,,,,,,0.0,-0.001227,,-13024.0,-2.459126,-14.635783,-70258797.0,0.938527,4.872107,0.020064,2,,,,1,-7.7e-05,99.681021,0.0,0.0,0.0625,-1.6e-05,-2635.970697,0.530864,1.592592,0.568242,0.508932,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1


time: 4.13 s


In [8]:
scaled_test = pd.DataFrame(scale.fit_transform(quant.fit_transform(impute.fit_transform(df_test.drop("SK_ID_CURR", axis=1)))), 
                           columns=df_test.drop("SK_ID_CURR", axis=1).columns, 
                           index=df_test.drop("SK_ID_CURR", axis=1).index)
scaled_test.head()

Unnamed: 0,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,-0.713154,0.669488,-0.634477,-0.327293,0.442758,-0.47087,0.182072,-0.07231,-0.600125,-0.467686,-0.186955,1.22214,0.003463,0.004529,0.484762,-0.507337,0.040035,-0.597571,2.268994,0.322223,-0.07775,-0.274939,1.838144,-0.138545,-0.241633,-0.209477,-0.289777,-0.538296,-0.459316,-0.338079,1.492102,2.463098,-1.720596,-1.021122,-0.654545,-1.515519,0.016429,0.061891,-0.509043,0.029244,-1.372581,0.181521,0.121422,-0.010129,-1.112121,-0.394114,0.32689,-0.950124,-0.570835,-1.493762,-0.004706,0.079445,-0.486656,0.065865,-1.403609,-0.001833,-0.122124,-0.000714,-1.034928,-0.365184,0.360688,-0.995847,-0.644311,-1.513773,0.009558,0.070766,-0.500443,0.026728,-1.280339,-0.007223,0.121902,-0.001779,-1.105066,-0.383628,0.341915,-1.20786,-0.925335,-0.356783,-0.921032,-0.302701,-0.550231,0.0,0.520828,-0.010129,-0.122358,-0.309618,-0.006406,-0.311524,-0.06718,0.0,-0.034216,0.0,0.0,0.0,0.0,0.0,0.0,-0.039517,0.0,0.0,0.0,-0.042754,-0.037818,-0.048796,-0.085504,-0.800238,-1.803005,0.012202,0.013295,-0.139128,-0.002663,-0.001147,0.006553,-0.004527,-2.139774,-0.366226,-1.329569,-1.09813,-1.604627,0.717943,-2.241946,-1.976103,0.723693,-2.293924,-2.147694,-0.180542,-1.543365,-1.482638,-0.515307,-1.937237,-1.834875,-0.50705,-2.01004,-1.862892,-0.700259,-2.140521,-2.060776,-0.18604,-1.685017,-1.995981,-1.324352,-1.318171,-2.038821,-2.21225,-1.859456,-2.18433,0.591359,-1.577024,-1.699165,0.667322,-0.933068,-1.437689,-0.072248,-0.163429,-0.137597,-0.2343,-0.188537,-0.325085,-0.760191,-0.898662,-1.214271,-0.593903,-1.138649,-0.59826,0.76736,-1.348681,-1.568169,-1.040815,-1.520501,-1.355283,0.517035,0.000802,-2.858318,-0.424559,-0.294184,-0.288547,-0.458341,-0.448857,-0.060523,-0.471279,-0.904821,-0.22423,0.000241,-0.000535,0.000291,-0.001177,-0.001496,-8.4e-05,0.000777,0.434694,-1.831114,0.729047,-0.109248,0.870954,-0.570382,1.273648,1.000857,0.434215,-0.662203,-0.694003,2.6222,2.184215,0.834354,0.811192,0.700407,0.672925,0.653807,0.819757,-0.08524,-0.042718,2e-06,-0.011034,0.680516,0.680516,-0.077069,-1.134083,-1.233632,0.695264,-0.310582,0.213164,-1.312741,0.466328,-0.418575,-1.156663,1.15665,1.168079,1.722682,-0.006224,1.247226,1.288074,1.474345,0.452336,1.311805,1.34489,1.173281,1.416505,1.31172,0.505764,0.576746,-0.797456,-0.797456,0.370067,-0.200524,0.767916,0.464685,0.623192,0.527493,0.624693,-0.098297,-0.098297,-0.098262,-0.098288,-1.601799,1.407474,-0.502004,-0.502005,-0.502065,-0.502066,-0.077068,0.725627,0.63304,0.056355,0.559972,-0.083023,-0.216943,1.046053,-0.256595,0.397261,0.792576,0.344242,-1.510721,-0.265702,-0.234708,0.530505,0.898046,0.39478,0.842274,0.805728,-0.731664,-1.582766,0.840512,1.008365,-0.08941,-0.106755,-0.349622,-0.405391,-0.375876,-0.399792,-0.298528,-0.332987,-0.285307,-0.056997,-0.37552,-0.373743,-0.009096,0.230886,-0.015814,-0.101987,-0.401912,-0.071692,-0.003585,0.05705,-0.024414,0.230782,-0.005383,-0.015388,0.224705,-0.24549,-0.216477,0.231959,0.233886,0.240817,-0.015978,-0.015972,0.230762,0.181094,-0.080439,0.000205,-0.265116,-0.265118,-0.265124,-0.265127,-0.00086,-0.373755,-0.362356,0.012941,0.015751,-0.028912,-8.7e-05,0.000203,-0.447095,1.5e-05,3e-05,-0.01058,1.8e-05,-0.133375,-0.123619,0.000284,0.000286,0.009079,1.845663,-0.831478,-0.300019,-0.302775,-0.752363,-1.695241,-1.160315,-1.454559,-0.64126,-0.116184,0.217211,-2.086825,-1.777221,0.726524,-1.63161,-1.793556,0.159327,-0.295543,-0.409893,-1.210143,0.202441,0.000239,0.000664,0.865795,-0.295717,-0.577999,-0.760481,-0.300007,-1.113885,0.388857,1.993265,0.138447,1.396688,2.136877,2.664472,0.373913,0.332483,0.120719,-0.171727,0.278397,1.576245,-0.574487,-0.706487,0.740925,0.291746,1.212617,1.911469,0.547144,1.345876,1.959827,2.301501,-0.885651,0.188408,-0.543861,-0.923382,-1.319581,-0.804173,0.384118,-0.756613,-6e-05,-2.202012,0.687218,0.2193,-2.326335,-0.811248,-0.111766,-0.110447,0.351672,-0.356713,-0.005427,0.132971,0.000222,0.712172,0.166532,-0.267408,1.288975,-0.369304,-0.096199,-0.577455,-3.2e-05,-5.1e-05,-9e-05,0.124754,0.633865,-0.633861,0.55633,0.621486,-0.028669,-0.928697,-1.592889,0.345784,-0.032529,0.128419,0.378675,0.095331,-0.095331,0.0,0.701175,-0.701175,0.0,-0.091874,-0.370411,-0.031722,-0.047341,-0.065936,-0.174973,0.476418,-0.138005,-0.004529,-0.552576,-0.484698,-0.279501,-0.006406,-0.004529,0.993416,0.0,-0.029014,1.701333,-0.191482,-0.0992,-1.517674,0.0,-0.309499,0.714071,-0.254038,-0.410727,-0.217875,0.0,-0.050297,0.341803,-0.185234,-0.091761,-0.122271,-0.219164,0.0,-0.185884,-0.116798,-0.136687,-0.313462,-0.245603,-0.04624,-0.198845,-0.040798,-0.464645,-0.07491,-0.281289,-0.166575,-0.097069,-0.053284,-0.340791,-0.066249,-0.138314,-0.06054,1.457263,-0.418,-0.456497,-0.322923,-0.199124,-0.45689,1.999718,-0.458169,0.0,-0.138159,-0.138698,-0.575392,-0.206309,0.697304,0.988293,-0.073512,-0.064828,-0.969567,-0.173724,-0.085409,-0.077229,-0.076554,-0.548368,1.916155,-0.128681,-0.980536,0.928413,-0.085774,-0.914861
1,-0.713154,0.669488,-0.634477,-1.008893,-0.963265,-0.744739,-0.947508,0.871109,-0.396059,-1.170486,-1.047169,0.714316,0.003463,0.004529,0.484762,-0.507337,0.040035,-0.597571,-0.440724,0.322223,-0.07775,-0.274939,-0.965484,-0.138545,-0.241633,-0.209477,-0.289777,-0.538296,-0.459316,1.126647,0.730913,-1.085004,-0.542178,0.023494,0.103115,0.001084,0.016429,0.061891,-0.509043,0.029244,-1.285477,0.181521,0.121422,-0.010129,-0.000999,-0.394114,0.32689,0.001848,0.112872,0.020162,-0.004706,0.079445,-0.486656,0.065865,-0.19441,-0.001833,-0.122124,-0.000714,0.001429,-0.365184,0.360688,0.015482,0.106162,0.002287,0.009558,0.070766,-0.500443,0.026728,-1.192521,-0.007223,0.121902,-0.001779,0.000644,-0.383628,0.341915,0.001728,-0.925335,-0.356783,-0.921032,-0.302701,2.489258,0.0,0.520828,-0.010129,-0.122358,-0.309618,-0.006406,-0.311524,-0.06718,0.0,-0.034216,0.0,0.0,0.0,0.0,0.0,0.0,-0.039517,0.0,0.0,0.0,-0.042754,-0.037818,-0.048796,-0.085504,-0.800238,0.668567,0.012202,0.013295,-0.139128,-0.002663,-0.001147,0.006553,-0.004527,-0.059395,0.285027,-1.059827,-0.412078,-1.604627,-1.066226,-1.703145,-2.174438,-1.066217,-1.498099,-1.709315,0.234012,-1.291363,-0.915215,0.550832,-1.096984,-0.775794,-0.247983,-1.759623,-1.559103,0.205652,-1.45377,-1.271681,0.668201,0.069545,0.114988,0.487987,0.727235,-1.586582,-1.407309,-1.974909,-1.603414,0.795014,-0.728862,-1.117767,0.748485,-1.430824,-1.780546,-0.546778,-0.163429,-0.137597,-0.2343,-0.188537,-0.325085,-0.760191,0.927099,-1.214271,-0.593903,-1.138649,-0.59826,0.76736,-1.348681,-1.568169,-1.040815,-0.925107,-0.532542,0.517035,0.000802,-2.858318,-0.424559,-0.294184,-0.288547,-0.458341,-0.448857,-0.060523,-0.471279,0.905798,-0.22423,0.000241,-0.000535,0.000291,-0.001177,-0.001496,-8.4e-05,0.000777,0.854781,-1.03462,0.633608,-0.167724,0.918818,-1.030042,0.466991,0.716007,0.446392,-0.662203,-0.694003,-0.378465,-0.451509,0.700812,0.687889,0.493872,0.383997,0.363917,0.388915,-0.08524,-0.042718,2e-06,-0.011034,0.651874,0.651874,-0.077069,-1.710123,0.743081,-0.097408,1.521496,-1.523073,-1.077753,-0.261382,-1.275611,0.743081,-0.74308,-0.742482,2.08238,1.527091,-0.743055,-0.742791,1.397845,0.752162,-0.73278,-0.732775,-0.742521,-0.743034,-0.743044,0.427305,0.404947,-1.557314,-1.557314,1.639516,1.138995,0.435649,0.634365,0.330904,-0.115074,0.332062,-0.098297,-0.098297,-0.098262,-0.098288,-1.478138,1.318815,-0.502004,-0.502005,-0.502065,-0.502066,-0.077068,0.713037,0.622221,0.056355,0.559972,-0.083023,-0.216943,0.537047,-0.286184,-0.26226,0.440455,-0.443436,0.447526,-0.265702,-0.234708,0.165618,1.400583,-0.728003,-1.178205,1.737606,-0.695334,-1.184926,1.448889,0.776711,-0.08941,-0.106755,-0.349622,-0.405391,-0.375876,-0.399792,-0.298528,-0.332987,-0.285307,-0.056997,-0.37552,-0.373743,-0.009096,0.230886,-0.015814,-0.101987,-0.401912,-0.071692,-0.003585,0.05705,-0.024414,0.230782,-0.005383,-0.015388,0.224705,-0.24549,-0.216477,0.231959,0.233886,0.240817,-0.015978,-0.015972,0.230762,0.181094,-0.080439,0.000205,-0.265116,-0.265118,-0.265124,-0.265127,-0.00086,-0.373755,-0.362356,0.012941,0.015751,-0.028912,-8.7e-05,0.000203,-0.447095,1.5e-05,3e-05,-0.01058,1.8e-05,-0.133375,-0.123619,0.000284,0.000286,0.009079,-0.70282,-0.831478,-0.300019,-0.302775,-0.752363,-0.971197,-1.077906,-0.975082,-0.629267,0.520726,0.335187,-1.289544,-1.503162,0.726524,-0.801997,0.697951,-0.969949,-0.295543,-0.409893,-1.210143,0.202441,0.000239,0.000664,0.028512,-0.350019,1.004356,-1.441735,0.700543,0.344162,-1.001589,-0.201375,-0.305846,-0.319363,-0.451815,-0.375942,-1.520329,0.332483,0.120719,-0.171727,0.883239,0.887701,-0.405678,0.958071,-0.260275,-1.091878,0.936443,0.901397,-0.39274,-0.441221,1.111128,0.891448,-1.08115,0.923302,-1.297735,-0.458144,-0.227433,-0.526989,-0.671311,-0.756613,-6e-05,-0.866788,1.110248,-0.426889,0.479361,-0.811248,-0.111766,-0.110447,-1.269448,-0.356713,-0.005427,0.132971,0.000222,0.868528,0.624779,-0.629585,1.208643,0.000622,1.133571,-0.577455,-3.2e-05,-5.1e-05,-9e-05,0.124754,0.633865,-0.633861,0.932713,0.356188,-0.028669,0.685917,-0.978394,1.369625,0.399322,0.799449,1.747892,0.095331,-0.095331,0.0,-1.426178,1.426178,0.0,-0.091874,-0.370411,-0.031722,-0.047341,-0.065936,-0.174973,0.476418,-0.138005,-0.004529,-0.552576,-0.484698,-0.279501,-0.006406,-0.004529,0.993416,0.0,-0.029014,-0.587774,-0.191482,-0.0992,0.658903,0.0,-0.309499,0.714071,-0.254038,-0.410727,-0.217875,0.0,-0.050297,0.341803,-0.185234,-0.091761,-0.122271,-0.219164,0.0,-0.185884,-0.116798,-0.136687,-0.313462,-0.245603,-0.04624,-0.198845,-0.040798,-0.464645,13.349378,-0.281289,-0.166575,-0.097069,-0.053284,-0.340791,-0.066249,-0.138314,-0.06054,-0.686218,2.392344,-0.456497,-0.322923,-0.199124,-0.45689,-0.500071,-0.458169,0.0,-0.138159,-0.138698,-0.575392,-0.206309,0.697304,-1.011846,-0.073512,-0.064828,1.031388,-0.173724,-0.085409,-0.077229,-0.076554,-0.548368,-0.521878,-0.128681,1.019851,-1.077107,-0.085774,1.093063
2,1.402222,0.669488,-0.634477,0.551409,0.63473,2.096256,0.664487,-0.0182,-0.757262,-1.167363,0.596034,-0.100493,-1.439758,0.004529,0.484762,-0.507337,0.040035,-0.597571,-0.440724,0.322223,-0.07775,-0.274939,0.584445,-0.138545,-0.241633,-0.209477,-0.289777,-0.538296,-0.459316,5.145368,0.000123,1.057149,0.602999,0.023494,0.103115,0.001084,0.016429,0.061891,-0.509043,0.029244,-1.285477,0.181521,0.121422,-0.010129,-0.000999,-0.394114,0.32689,0.001848,0.112872,0.020162,-0.004706,0.079445,-0.486656,0.065865,-0.19441,-0.001833,-0.122124,-0.000714,0.001429,-0.365184,0.360688,0.015482,0.106162,0.002287,0.009558,0.070766,-0.500443,0.026728,-1.192521,-0.007223,0.121902,-0.001779,0.000644,-0.383628,0.341915,0.001728,-0.925335,-0.356783,-0.921032,-0.302701,-0.215507,0.0,-1.920019,-0.010129,-0.122358,-0.309618,-0.006406,3.210026,-0.06718,0.0,-0.034216,0.0,0.0,0.0,0.0,0.0,0.0,-0.039517,0.0,0.0,0.0,-0.042754,-0.037818,-0.048796,-0.085504,1.168445,0.835517,-1.393015,-0.824438,1.364156,1.045556,0.669283,0.860645,-0.41527,0.267479,-0.40491,-0.854295,-0.558899,0.364643,-1.066226,0.553471,0.229528,-1.066217,0.02577,-0.296193,-0.680719,0.665045,-0.090989,-0.414114,-0.387264,-0.355017,-0.265265,0.211349,-0.198016,-0.384871,-0.412406,-0.417596,-0.36178,0.45102,0.579731,0.487987,0.462337,-0.314872,-0.04679,0.217581,0.51048,0.391265,0.284928,0.600254,0.503517,0.512221,0.537934,-0.196895,-0.163429,-0.137597,-0.2343,-0.188537,-0.325085,-0.760191,0.927099,0.161224,-0.593903,0.705404,-0.59826,0.76736,-1.348681,0.392825,0.353254,0.480312,0.732267,0.778191,0.000802,-2.858318,-0.424559,3.329413,-0.288547,-0.458341,-0.448857,-0.060523,-0.471279,1.034088,-0.22423,0.000241,-0.000535,0.000291,-0.001177,-0.001496,-8.4e-05,0.000777,0.038943,0.033968,-0.289869,-0.240611,0.239087,0.585969,0.539516,-0.077721,-1.029792,-0.662203,-0.694003,-0.378465,-0.451509,-2.704602,-2.386376,-1.99277,-2.062858,-2.109177,-1.065884,-0.08524,-0.042718,2e-06,-0.011034,-1.146404,-1.146404,-0.077069,1.174712,-1.426178,0.350222,-0.498563,0.40485,1.010594,0.127412,0.477598,-1.443941,1.443926,1.298055,-1.406093,-0.559568,1.297917,1.193292,-0.527562,0.384976,1.431406,1.340935,1.549156,1.167795,1.314361,-1.943116,-2.007573,0.317857,0.317857,-0.369335,-0.495402,-1.391954,-1.08606,-2.185929,0.029565,-2.185755,-0.098297,-0.098297,-0.098262,-0.098288,1.418355,-1.051886,1.870476,1.865747,2.087075,2.043367,-0.077068,-1.694583,-1.694531,0.056355,0.559972,-0.083023,-0.216943,1.415166,0.508355,-0.029632,-0.54867,0.583835,-1.510721,4.066629,-0.234708,-1.656535,-1.673877,-0.698001,1.132502,-0.782843,1.221125,0.726946,-0.441239,-0.549107,-0.08941,-0.106755,-0.349622,-0.405391,-0.375876,-0.399792,-0.298528,-0.332987,-0.285307,-0.056997,-0.37552,-0.373743,1.063255,0.866908,1.397079,3.724669,-0.401912,4.175199,-1.168355,0.908564,-1.272748,-0.279259,-1.100451,-1.278916,-0.325339,3.88949,4.457512,0.906889,0.767393,0.923878,1.919927,1.227276,1.006963,-3.019464,-0.080439,0.000205,-0.265116,-0.265118,-0.265124,-0.265127,-0.00086,-0.373755,-0.362356,0.012941,0.015751,-1.388791,1.084397,-1.503996,1.928722,-1.362086,-2.142302,-1.7806,1.817804,1.508743,2.21531,-1.631459,1.615975,-1.725174,0.828695,1.434877,1.906195,1.771538,1.546255,-0.817022,-0.459636,0.730928,1.13677,-0.988786,-1.093769,0.401315,1.034162,1.153272,1.185806,-0.845048,1.118529,2.449781,1.616006,0.543573,-1.63116,-1.629593,-1.186371,1.225044,-0.402643,-0.135718,0.84146,-1.712478,-0.337195,1.347803,-0.130661,-1.051174,-0.299212,2.310265,-0.375942,0.584087,-1.896663,-1.004677,5.794645,1.384764,-0.875545,0.026543,-0.482338,0.317905,0.673424,-0.462956,-0.626379,0.431086,-1.251965,0.407226,-0.11262,0.000267,0.800014,-0.236283,-0.797818,-0.934608,-1.680002,0.470073,-0.756613,2.532592,0.114755,0.051537,0.510884,0.880932,1.148195,-0.111766,-0.110447,0.351672,-0.356713,1.607076,0.132971,-1.842609,-1.203967,-0.245153,-2.001902,-0.764466,-0.494173,-0.04209,-0.577455,-3.2e-05,-5.1e-05,-9e-05,0.124754,0.633865,-0.633861,0.575142,0.599902,1.258992,-0.00013,-0.180574,-0.590499,0.81973,-0.501063,-0.970483,0.095331,-0.095331,0.0,-1.426178,1.426178,0.0,-0.091874,-0.370411,-0.031722,-0.047341,-0.065936,-0.174973,-2.098997,7.246105,-0.004529,-0.552576,-0.484698,-0.279501,-0.006406,-0.004529,0.993416,0.0,-0.029014,1.701333,-0.191482,-0.0992,-1.517674,0.0,-0.309499,0.714071,-0.254038,-0.410727,-0.217875,0.0,-0.050297,0.341803,-0.185234,-0.091761,-0.122271,-0.219164,0.0,-0.185884,-0.116798,-0.136687,-0.313462,4.071618,-0.04624,-0.198845,-0.040798,-0.464645,-0.07491,-0.281289,-0.166575,-0.097069,-0.053284,-0.340791,-0.066249,-0.138314,-0.06054,-0.686218,-0.418,2.190597,-0.322923,-0.199124,-0.45689,-0.500071,-0.458169,0.0,-0.138159,-0.138698,-0.575392,-0.206309,0.697304,-1.011846,-0.073512,-0.064828,1.031388,-0.173724,-0.085409,-0.077229,-0.076554,-0.548368,-0.521878,-0.128681,1.019851,-1.077107,-0.085774,1.093063
3,-0.713154,0.669488,1.725368,1.498615,1.946503,1.179208,1.936555,0.361919,0.358865,-0.286933,0.645248,-0.405176,0.003463,0.004529,0.484762,-0.507337,0.040035,1.673441,-0.440724,1.051154,-0.07775,-0.274939,-0.237929,-0.138545,-0.241633,-0.209477,-0.289777,-0.538296,-0.459316,0.405052,0.622075,-0.253647,0.611986,1.876319,1.456832,2.125957,2.365829,1.645731,2.117751,1.803787,1.503366,-1.628368,1.535004,2.134663,2.078681,2.815802,1.048993,1.88522,1.435281,2.119557,2.414812,1.642729,2.206241,1.83964,1.530456,-1.900165,1.499069,2.152051,2.104386,3.020499,1.067609,1.87602,1.455059,2.11241,2.41459,1.655335,2.149583,1.821006,1.623461,-1.935399,1.526066,2.132143,2.085839,2.88824,1.052526,2.118855,-0.925335,-0.356783,-0.921032,-0.302701,-0.611835,0.0,0.520828,-0.010129,-0.122358,-0.309618,-0.006406,-0.311524,-0.06718,0.0,-0.034216,0.0,0.0,0.0,0.0,0.0,0.0,-0.039517,0.0,0.0,0.0,-0.042754,-0.037818,-0.048796,-0.085504,-0.800238,0.668567,0.012202,0.013295,-0.139128,-0.002663,-0.001147,0.006553,-0.004527,0.393516,-0.092752,0.931263,0.213173,0.665043,-1.066226,-0.128165,-0.351979,-1.066217,-0.874261,-1.071843,0.30726,0.566852,0.895702,0.525901,-0.955787,-0.684364,0.059872,-0.699463,-0.755707,-0.368213,-1.240593,-1.246513,-0.247457,-0.555714,0.427985,0.640842,0.619788,-1.371359,-1.209939,-1.063507,-0.516066,0.634687,-5.6e-05,-0.00079,0.482469,-8.5e-05,-0.001616,-0.277676,-0.163429,-0.137597,-0.2343,-0.188537,-0.325085,-0.760191,0.927099,0.161224,-0.593903,-1.138649,-0.59826,-1.070642,0.536756,0.678807,-0.197529,-0.593326,-0.612711,0.517035,0.000802,-2.858318,-0.424559,-0.294184,-0.288547,-0.458341,-0.448857,-0.060523,-0.471279,-0.904821,-0.22423,0.000241,-0.000535,0.000291,-0.001177,-0.001496,-8.4e-05,0.000777,0.251318,-0.142984,-0.129331,-0.216126,0.448824,0.172444,-0.21107,-0.729017,-0.377514,1.453501,1.385889,-0.378465,-0.451509,0.418148,0.429617,0.882306,0.858185,0.840219,1.710438,-0.08524,-0.042718,2e-06,-0.011034,0.154976,0.154976,-0.077069,0.739122,0.743081,0.383939,-1.431121,0.709261,-0.315523,0.669059,1.571569,0.743081,-0.74308,-0.742482,-0.396778,-0.619227,-0.743055,-0.742791,-0.666256,-2.196418,-0.73278,-0.732775,-0.742521,-0.743034,-0.743044,0.469355,1.037923,0.935555,0.935555,-0.392042,-0.622098,1.595404,1.31865,0.98096,0.929868,0.984533,-0.098297,-0.098297,-0.098262,-0.098288,-0.365256,0.704253,-0.502004,-0.502005,-0.502065,-0.502066,-0.077068,0.206993,0.30522,0.056355,0.559972,-0.083023,-0.216943,-0.292264,0.606008,0.522019,-0.411814,0.373913,1.150804,-0.265702,-0.234708,0.494231,0.384992,1.369826,-1.656786,-0.501368,-2.050657,1.170737,-1.324787,-0.537826,-0.08941,-0.106755,2.738138,2.299607,2.664073,2.495082,3.35683,3.022773,1.688535,2.068387,2.46444,2.467709,-1.141549,-0.339448,-1.135422,0.894473,-0.401912,1.046077,-1.270905,-0.375803,0.997021,0.894956,1.246224,1.152527,0.88881,-0.24549,-0.216477,1.350101,1.077508,1.063845,1.498185,1.234428,-0.343591,0.95719,-0.080439,0.000205,-0.265116,-0.265118,-0.265124,-0.265127,-3.063321,2.466559,2.548177,0.012941,0.015751,-2.328587,1.267856,2.064,1.473944,-1.770551,-1.200593,-1.168851,1.149486,1.688835,-0.123619,-0.932529,-0.991722,-2.53193,0.152339,1.434877,1.375326,1.30672,0.666823,-0.970437,-1.596063,0.111039,-0.084983,-1.524715,-1.657969,0.029693,0.219644,1.175452,0.501459,-0.165215,0.422916,-0.295543,1.821567,0.561795,-0.545094,-0.92807,-2.633308,0.655053,0.967678,0.58549,-0.111166,-1.108547,0.088076,-0.237176,0.13305,1.554754,-1.432668,-0.451815,-0.375942,0.373913,0.332483,0.120719,-0.171727,0.089475,0.488512,-1.312664,-0.365658,1.021806,1.960281,-1.088324,0.748316,1.200691,2.073505,2.305468,1.68974,0.991332,0.27606,0.100159,-2.261688,-2.627443,-2.157396,0.326962,-0.756613,2.063088,-1.641199,-1.421728,0.153244,0.479361,-0.811248,-0.111766,-0.110447,-1.269448,-0.356713,-0.005427,-0.467335,0.000222,-1.217684,-0.640439,-0.77012,-0.924952,-1.088787,0.359211,-0.577455,2.332853,2.39342,2.341535,0.124754,-1.682045,1.529698,0.716937,0.477731,-0.028669,-0.832098,-0.578701,0.078511,1.122377,-0.159979,-0.103877,0.095331,-0.095331,0.0,0.701175,-0.701175,0.0,-0.091874,-0.370411,-0.031722,-0.047341,-0.065936,-0.174973,0.476418,-0.138005,-0.004529,-0.552576,-0.484698,-0.279501,-0.006406,-0.004529,0.993416,0.0,-0.029014,-0.587774,-0.191482,-0.0992,0.658903,0.0,-0.309499,0.714071,-0.254038,-0.410727,-0.217875,0.0,-0.050297,0.341803,-0.185234,-0.091761,-0.122271,-0.219164,0.0,-0.185884,-0.116798,-0.136687,-0.313462,-0.245603,-0.04624,-0.198845,-0.040798,-0.464645,-0.07491,-0.281289,-0.166575,-0.097069,-0.053284,2.93435,-0.066249,-0.138314,-0.06054,-0.686218,-0.418,-0.456497,-0.322923,-0.199124,-0.45689,-0.500071,2.182601,0.0,-0.138159,-0.138698,1.737946,-0.206309,-1.434094,0.988293,-0.073512,-0.064828,-0.969567,-0.173724,-0.085409,-0.077229,-0.076554,1.823594,-0.521878,-0.128681,-0.980536,0.928413,-0.085774,-0.914861
4,1.402222,-1.493678,1.468296,0.312208,0.579309,0.403222,0.643756,-0.567963,0.557425,-0.419868,0.12538,-0.46818,1.60376,0.004529,0.484762,1.971078,0.040035,-0.597571,-0.440724,0.751925,-0.07775,-0.274939,-2.113402,-0.138545,-0.241633,-0.209477,-0.289777,1.857714,2.177152,0.405052,-1.675049,-0.609047,0.002494,0.023494,0.103115,0.001084,0.016429,0.061891,-0.509043,0.029244,-0.18081,-0.677575,-0.141086,-0.010129,0.007954,-0.394114,0.342009,0.001848,0.112872,0.020162,-0.004706,0.079445,-0.486656,0.065865,-0.19441,-0.001833,0.126835,-0.000714,0.001429,-0.365184,0.360688,0.00792,0.114283,0.002287,0.009558,0.070766,-0.500443,0.026728,-0.072524,-0.007223,0.12533,-0.001779,0.000644,-0.383628,0.332709,0.001728,-0.925335,-0.356783,-0.921032,-0.302701,-0.199349,0.0,0.520828,-0.010129,-0.122358,-0.309618,-0.006406,-0.311524,-0.06718,0.0,-0.034216,0.0,0.0,0.0,0.0,0.0,0.0,-0.039517,0.0,0.0,0.0,-0.042754,-0.037818,-0.048796,-0.085504,-0.800238,0.420515,1.397261,1.200709,1.689858,1.360144,1.119432,1.122156,0.612352,-0.059395,0.295723,-1.055075,-0.406129,-1.604627,1.032883,0.54184,1.065781,1.011064,1.471453,1.967672,0.235097,0.494302,0.508395,0.483799,1.522941,1.747202,0.793369,0.277266,0.547213,0.748609,1.396555,1.603612,0.585409,1.022505,0.234726,0.487987,0.727235,1.920539,1.441652,1.042528,0.597205,0.72435,1.597054,1.429982,0.559131,1.481963,0.558654,1.820056,-0.163429,-0.137597,-0.2343,-0.188537,-0.325085,-0.760191,0.927099,-1.214271,-0.593903,-1.138649,-0.59826,0.76736,-1.348681,0.392825,-1.040815,-0.997394,-0.654563,-1.378948,0.000802,-2.858318,-0.424559,-0.294184,-0.288547,2.033302,2.077473,-0.060523,1.999949,-0.904821,4.354922,2.60625,2.678487,2.534792,2.185537,2.086475,2.373606,2.337024,1.650799,0.696896,1.749259,1.817188,0.877125,-0.849824,1.486617,-0.321964,-0.019892,-0.662203,-0.694003,-0.378465,-0.451509,0.190258,0.238679,0.173104,0.383997,0.363917,-0.006196,-0.08524,-0.042718,2e-06,-0.011034,-0.02153,-0.02153,-0.077069,-0.003435,0.743081,0.233439,-0.002992,-0.00434,0.064198,0.221032,0.006151,0.743081,-0.74308,-0.742482,-0.003017,-0.006224,-0.743055,-0.742791,0.009244,0.267613,-0.73278,-0.732775,-0.742521,-0.743034,-0.743044,0.31958,0.305495,0.011505,0.011505,-0.008504,-0.00035,-0.000992,7.1e-05,0.330904,0.23634,0.332062,-0.098297,-0.098297,-0.098262,-0.098288,-0.000623,0.000243,-0.502004,-0.502005,-0.502065,-0.502066,-0.077068,0.38512,0.385144,0.056355,0.559972,-0.083023,-0.216943,0.0031,0.217431,0.215976,0.008766,0.008816,0.447526,-0.265702,-0.234708,0.396698,0.000128,-0.000265,-1.2e-05,-5e-06,8.3e-05,4.5e-05,1.2e-05,-5e-06,-0.08941,-0.106755,-0.349622,-0.405391,-0.375876,-0.399792,-0.298528,-0.332987,-0.285307,-0.056997,-0.37552,-0.373743,-0.009096,0.230886,-0.015814,-0.101987,-0.401912,-0.071692,-0.033779,0.223972,-0.287777,0.230782,-0.005383,-0.015388,0.224705,-0.24549,-0.216477,0.231959,0.233886,0.240817,-0.015978,-0.015972,0.230762,0.181094,-0.080439,0.000205,-0.265116,-0.265118,-0.265124,-0.265127,-0.00086,-0.373755,-0.362356,0.012941,0.015751,0.541447,-8.7e-05,0.000203,0.004728,1.5e-05,3e-05,-0.013306,1.8e-05,-0.133375,-0.123619,0.000284,0.000286,0.122795,-0.602851,-0.831478,-0.300019,-0.302775,-0.752363,-0.670226,-0.27975,-1.151461,-1.069455,0.893396,1.029676,-0.910744,-0.775057,-1.042218,-0.796232,0.615415,-0.715832,-0.295543,-0.409893,-1.210143,0.202441,0.000239,0.000664,-1.343463,1.068776,0.449246,-1.206374,0.863995,0.476592,-0.584257,-0.152695,-0.107249,-0.059457,-0.451815,-0.375942,-1.520329,0.332483,0.120719,-0.171727,0.883239,-2.4e-05,0.026543,0.494037,0.422765,0.54721,-1.088324,1.032319,0.629492,0.442735,-0.475874,-0.161102,0.000267,0.490293,-0.152546,-0.485607,-0.723871,-0.572728,-0.150339,-0.756613,-6e-05,0.162492,-0.524546,-0.08434,0.17717,-0.811248,-0.111766,-0.110447,0.351672,-0.356713,-1.673473,0.132971,1.341326,-0.587389,-0.197298,-0.550937,-0.48047,0.327224,-0.580904,1.646922,-3.2e-05,-5.1e-05,-9e-05,0.124754,-1.474006,1.580343,-1.423074,-1.457688,-1.44858,1.738896,1.522447,1.51821,-1.20864,1.273296,1.747892,0.095331,-0.095331,0.0,-1.426178,1.426178,0.0,-0.091874,-0.370411,-0.031722,-0.047341,-0.065936,-0.174973,0.476418,-0.138005,-0.004529,-0.552576,-0.484698,-0.279501,-0.006406,-0.004529,0.993416,0.0,-0.029014,-0.587774,-0.191482,-0.0992,0.658903,0.0,-0.309499,0.714071,-0.254038,-0.410727,-0.217875,0.0,-0.050297,0.341803,-0.185234,-0.091761,-0.122271,-0.219164,0.0,-0.185884,-0.116798,-0.136687,-0.313462,-0.245603,-0.04624,-0.198845,-0.040798,-0.464645,-0.07491,-0.281289,-0.166575,-0.097069,-0.053284,-0.340791,-0.066249,-0.138314,-0.06054,1.457263,2.392344,-0.456497,-0.322923,-0.199124,-0.45689,-0.500071,-0.458169,0.0,-0.138159,-0.138698,-0.575392,-0.206309,0.697304,-1.011846,-0.073512,-0.064828,1.031388,-0.173724,-0.085409,-0.077229,-0.076554,-0.548368,-0.521878,-0.128681,1.019851,-1.077107,-0.085774,1.093063


time: 10.6 s


In [9]:
lda_score = pd.Series(clf.predict_proba(scaled_test)[:,1], 
                     index=scaled_test.index,
                     name="LDA_SCORE")

time: 31.5 ms


# Gaussian Random Projection

#### Train

In [60]:
df = pd.read_csv(path + "train.csv", usecols=lambda c: "RAND_PROJ" not in c)
df.head()

Unnamed: 0,SK_ID_CURR,TARGET,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,DAYS_REGISTRATION_DIFF_DAYS_LAST_PHONE_CHANGE,DAYS_BIRTH_DIFF_DAYS_EMPLOYED,EXT_SOURCE_1_DIFF_EXT_SOURCE_2,EXT_SOURCE_1_DIFF_EXT_SOURCE_3,EXT_SOURCE_2_DIFF_EXT_SOURCE_3,AVG_PAYMENT_SIZE_DIFF_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIFF_AMT_CREDIT,AVG_PAYMENT_SIZE_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_GOODS_PRICE,AMT_CREDIT_DIFF_SUM_PAYMENT,AMT_GOODS_PRICE_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIFF_MAX_PREV_REQ_AMOUNT,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,100002,1,0,1,0,202500.0,406597.5,24700.5,351000.0,0.018801,-9461,-637.0,-3648.0,-2120,,1,1,0,1,1,0,1.0,2,2,10,0,0,0,0,0,0,42,0.083037,0.262949,0.139376,0.0247,0.0369,0.9722,0.6192,0.0143,0.0,0.069,0.0833,0.125,0.0369,0.0202,0.019,0.0,0.0,0.0252,0.0383,0.9722,0.6341,0.0144,0.0,0.069,0.0833,0.125,0.0377,0.022,0.0198,0.0,0.0,0.025,0.0369,0.9722,0.6243,0.0144,0.0,0.069,0.0833,0.125,0.0375,0.0205,0.0193,0.0,0.0,0.0149,2.0,2.0,2.0,2.0,-1134.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,1.0,,9251.775,,,1.0,,1.0,1.0,-17.0,-17.0,-17.0,0.0,179055.0,179055.0,179055.0,295.470297,295.470297,295.470297,19.353584,19.353584,19.353584,0.031937,0.031937,0.031937,9251.775,9251.775,9251.775,15.266955,15.266955,15.266955,-606.0,-606.0,0.0,0.0,0.0,295.470297,295.470297,179055.0,179055.0,0.0,0.00165,0.00165,0.0,1.0,1.0,1.0,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.00165,0.00165,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.487067,-2.72488,1.59177,2.395666,0.118051,-0.42582,-0.376677,0.405732,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,,,0.0,,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0,0.526688,1.038894,7.601345,0.534316,-0.817806,-0.592501,-0.290651,0.111304,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0,0.514141,-0.752288,1.616157,0.754784,-0.702447,-0.535793,0.056893,0.006947,0.0,0.0,1.0,6.0,11.0,0.0,0.510127,-413.11154,688.495146,-0.059719,2.007889,609097.5,1.158397,1.85132,1.733333,16.461104,2.270797,2.270797,0.003043,0.067329,-5419.0,0.057083,0.028429,0.467976,-5768.0,0.0,,0.440374,-21.403657,-6902.0,1.0,0.0,0.0,,0.0,4.0,,2.530201,,-2.610771,-38.776295,-15734218.5,1.720755,3.216931,0.037602,0,2.0207,2.041,2.0274,1,-0.0,0.0,0.018801,53.18866,,-9e-06,-785.612748,0.509506,2.038022,0.526688,0.487067,-2514.0,-8824,-0.179912,-0.056339,0.123573,-190940.752895,-395038.3,-13141.252895,204097.5,55597.5,186971.805,148500.0,381897.0,227542.5,227542.5,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0
1,100003,0,0,0,0,270000.0,1293502.5,35698.5,1129500.0,0.003541,-16765,-1188.0,-1186.0,-291,,1,1,0,1,1,0,2.0,1,1,11,0,0,0,0,0,0,13,0.311267,0.622246,,0.0959,0.0529,0.9851,0.796,0.0605,0.08,0.0345,0.2917,0.3333,0.013,0.0773,0.0549,0.0039,0.0098,0.0924,0.0538,0.9851,0.804,0.0497,0.0806,0.0345,0.2917,0.3333,0.0128,0.079,0.0554,0.0,0.0,0.0968,0.0529,0.9851,0.7987,0.0608,0.08,0.0345,0.2917,0.3333,0.0132,0.0787,0.0558,0.0039,0.01,0.0714,1.0,0.0,1.0,0.0,-828.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,3.0,-1976.0,-527.0,-1047.333333,1449.0,68053.5,1035882.0,484191.0,29.070269,1388.581769,612.90394,5.399568,10.531859,8.677472,0.004315,0.014118,0.008318,6737.31,98356.995,56553.99,2.877962,131.845838,70.901357,-2341.0,-746.0,1595.0,0.0,0.0,547.812073,1206.434316,435436.5,900000.0,2.1e-05,0.001071,0.001543,0.05003,1.057664,1.15098,0.989013,,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,0.0,0.0,1.0,2.0,3.0,0.002975,0.00134,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.42019,0.428183,-0.535911,2.110056,-4.18119,1.337309,1.599647,0.545277,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0,0.459155,-1.386349,-0.52014,-0.831323,-0.242488,-0.712057,0.070022,0.154299,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0,0.47399,0.659627,-0.035899,-0.624043,1.42402,0.239304,-0.727819,1.224179,0.0,0.0,3.0,,,,0.495285,-467.126033,666.118421,-0.137787,4.79075,1563502.5,1.145199,0.799018,4.183333,36.234085,2.970588,1.437225,,0.070862,-3202.0,0.239832,0.050061,1.81393,-1477.0,0.0,,0.695785,-16.104981,-2305.0,0.0,0.0,0.0,,,0.0,,0.179272,,-2.129347,-30.049242,-42409818.0,4.075601,1.432367,0.003541,0,2.8888,2.8723,2.8954,1,-0.0,0.0,0.0,0.0,,-1.9e-05,-5218.396475,0.462155,1.848621,0.495285,0.42019,-358.0,-15577,-0.310978,,,-205245.414,-1228748.0,29056.086,1023502.5,164002.5,-325362.15,859500.0,1257804.0,858066.0,393502.5,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0
2,100004,0,1,1,0,67500.0,135000.0,6750.0,135000.0,0.010032,-19046,-225.0,-4260.0,-2531,26.0,1,1,1,1,1,0,1.0,2,2,9,0,0,0,0,0,0,22,,0.555912,0.729567,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-815.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,1.0,-714.0,-714.0,-714.0,0.0,20106.0,20106.0,20106.0,24.669939,24.669939,24.669939,3.753045,3.753045,3.753045,0.004605,0.004605,0.004605,5357.25,5357.25,5357.25,6.573313,6.573313,6.573313,-815.0,-815.0,0.0,0.0,0.0,29.793865,29.793865,24282.0,24282.0,0.00026,0.001016,0.001016,0.212008,0.828021,0.828021,0.828021,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.001227,0.001227,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506853,-4.125854,1.233849,-0.810943,0.819096,-1.583013,1.885414,1.163706,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0,0.484266,-3.20874,-0.155941,-0.524505,0.269582,0.094367,-0.046783,0.032632,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0,0.525224,-1.700891,1.634542,0.456757,-0.633019,-0.255442,-0.037613,0.026482,0.0,0.0,1.0,,,,0.509493,-193.488025,,-0.041163,2.0,202500.0,1.0,6.341462,2.0,20.0,5.559674,5.559674,,0.011814,-5300.0,0.105128,0.052564,1.051282,-6791.0,0.0,,0.179867,-3.544051,-7606.0,0.0,0.0,0.0,,,0.0,-0.001365,,-19020.0,-0.354405,-30.0,-1518750.0,1.683129,5.226994,0.020064,0,,,,0,-0.0,0.0,0.010032,99.681021,0.038462,,,0.506459,2.025836,0.525224,0.484266,-3445.0,-18821,,,-0.173655,-60403.845,-127903.8,346.155,67500.0,0.0,113711.535,67500.0,128250.0,110718.0,110718.0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
3,100006,0,0,1,0,135000.0,312682.5,29686.5,297000.0,0.008019,-19005,-3039.0,-9833.0,-2437,,1,1,0,1,0,0,2.0,2,2,17,0,0,0,0,0,0,42,,0.650442,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,0.0,2.0,0.0,-617.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,,,,,13500.0,2482.92,0.799989,1.029197,1.012684,1.316797,1.316797,9.0,-416.0,365243.0,182481.75,365659.0,0.0,906615.0,291695.5,0.0,5008.922652,1358.887335,9.230206,27.839644,17.767287,0.015809,0.15381,0.081751,2482.92,39954.51,23651.175,4.024182,180.641436,96.293912,-617.0,-181.0,436.0,5.0,0.555556,1242.561634,3803.867403,272203.26,688500.0,0.000439,0.004129,0.007275,0.163412,1.012684,1.316797,0.799989,,0.0,0.0,0.0,1.0,1.0,3.0,5.0,0.0,0.0,0.0,2.0,2.0,1.0,4.0,0.015886,0.005525,2.0,,,1.0,1.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,,,,,,,,0.505468,2.847059,-1.193277,-0.546901,-0.548065,0.197115,-2.467181,-0.502496,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.471819,-2.996367,0.956185,-1.143641,0.37796,0.322572,0.12285,-0.890276,0.0,0.0,691786.89,691786.89,29027.52,545.0,0.0,0.0,0.0,0.0,543.096731,62947.088438,3975.786724,691786.89,4.318122,2482.92,8689.547693,1007153.415,0.0,-12.0,-575.0,563.0,0.0,0.0,865952.01,749841.93,691786.89,29027.52,-1.0,-77.0,0.561795,7.1613,2.248679,2.477131,-3.866771,0.665976,-0.403882,2.419674,0.0,0.0,3.0,0.0,48.0,0.0,0.523314,,,-0.028677,2.316167,447682.5,1.052803,0.310462,2.2,10.532818,1.14871,0.45415,,0.159905,-13489.0,0.466275,0.201313,2.120394,-12270.0,0.2,,2.201914,-7.103394,-12887.0,,,,,,0.0,,,,-1.562036,-9.768509,-90217273.5,4.034879,15.936791,0.016038,0,,,,1,-0.0,0.0,0.008019,124.703828,,,,0.515599,2.062397,0.561795,0.471819,-9216.0,-15966,,,,-72052.911562,-249735.4,33260.588438,177682.5,15682.5,-694470.915,162000.0,282996.0,40479.24,-375817.5,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
4,100007,0,0,1,0,121500.0,513000.0,21865.5,513000.0,0.028663,-19932,-3038.0,-4311.0,-3458,,1,1,0,1,0,0,1.0,2,2,11,0,0,0,0,1,1,12,,0.322738,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-1106.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,16037.64,,,1.108236,,1.108236,6.0,-2041.0,365243.0,72143.8,367284.0,14616.0,284400.0,166638.75,6.201103,733.391711,248.03877,7.968206,21.858453,12.644075,0.003381,0.045729,0.016725,1834.29,22678.785,12278.805,0.778231,42.88139,16.715844,-2357.0,-374.0,1983.0,1.0,0.166667,222.881532,661.764706,150530.25,247500.0,7.5e-05,0.001244,0.002963,0.159516,1.046356,1.264,0.85093,,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,1.0,3.0,0.0,3.0,5.0,0.005724,0.002674,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.492233,0.206872,-1.706155,-1.707714,-0.435966,2.093007,1.031252,-1.305981,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-783.0,-783.0,-783.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1149.0,0.00087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-783.0,0.0,0.0,186.781609,146250.0,0.0,0.0,0.0,0.0,0.493031,-3.843688,0.002791,-0.603251,0.532176,0.838862,-0.111817,-0.095342,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,16037.64,16037.64,16037.64,2326.0,3.0,29857.365,25.402727,22655.655,49.833434,12214.060227,1145.545714,22678.785,0.000125,0.18,3289.00667,806127.975,16.0,-14.0,-2318.0,2304.0,0.0,0.0,96225.84,0.0,16037.64,16037.64,12.0,-31.0,0.501933,0.056196,-1.978048,-0.43754,0.186092,0.663907,0.565579,-0.741146,0.0,0.0,5.0,13.0,18.0,0.0,0.48669,-186.781609,,-0.116697,4.222222,634500.0,1.0,0.636375,4.222222,23.461618,3.407953,2.072727,,0.152418,-8455.0,0.100527,0.023809,0.5586,-7769.0,0.0,,0.482456,-6.095725,-8875.0,0.0,0.0,0.0,,,0.0,,,,-1.097005,-7.197334,-66427389.0,1.246674,3.89783,0.057326,2,,,,1,-0.0,0.0,0.028663,34.888183,,,,0.493472,1.973887,0.501933,0.48669,-3205.0,-16894,,,,-109285.939773,-500785.9,-9651.439773,391500.0,0.0,-293127.975,391500.0,491134.5,362469.75,265500.0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1


time: 1min 16s


In [61]:
sk_id_curr = df.pop("SK_ID_CURR")
y = df.pop("TARGET")
df.head()

Unnamed: 0,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,DAYS_REGISTRATION_DIFF_DAYS_LAST_PHONE_CHANGE,DAYS_BIRTH_DIFF_DAYS_EMPLOYED,EXT_SOURCE_1_DIFF_EXT_SOURCE_2,EXT_SOURCE_1_DIFF_EXT_SOURCE_3,EXT_SOURCE_2_DIFF_EXT_SOURCE_3,AVG_PAYMENT_SIZE_DIFF_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIFF_AMT_CREDIT,AVG_PAYMENT_SIZE_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_GOODS_PRICE,AMT_CREDIT_DIFF_SUM_PAYMENT,AMT_GOODS_PRICE_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIFF_MAX_PREV_REQ_AMOUNT,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,0,1,0,202500.0,406597.5,24700.5,351000.0,0.018801,-9461,-637.0,-3648.0,-2120,,1,1,0,1,1,0,1.0,2,2,10,0,0,0,0,0,0,42,0.083037,0.262949,0.139376,0.0247,0.0369,0.9722,0.6192,0.0143,0.0,0.069,0.0833,0.125,0.0369,0.0202,0.019,0.0,0.0,0.0252,0.0383,0.9722,0.6341,0.0144,0.0,0.069,0.0833,0.125,0.0377,0.022,0.0198,0.0,0.0,0.025,0.0369,0.9722,0.6243,0.0144,0.0,0.069,0.0833,0.125,0.0375,0.0205,0.0193,0.0,0.0,0.0149,2.0,2.0,2.0,2.0,-1134.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,1.0,,9251.775,,,1.0,,1.0,1.0,-17.0,-17.0,-17.0,0.0,179055.0,179055.0,179055.0,295.470297,295.470297,295.470297,19.353584,19.353584,19.353584,0.031937,0.031937,0.031937,9251.775,9251.775,9251.775,15.266955,15.266955,15.266955,-606.0,-606.0,0.0,0.0,0.0,295.470297,295.470297,179055.0,179055.0,0.0,0.00165,0.00165,0.0,1.0,1.0,1.0,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.00165,0.00165,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.487067,-2.72488,1.59177,2.395666,0.118051,-0.42582,-0.376677,0.405732,315.103846,0.0,0.0,0.0,0.0,0.54618,0.54618,2.0,2.0,2.0,780.0,0.0,,,,245781.0,245781.0,0.0,10.875,0.689655,0.264368,0.003698,40.5,1.5,39.0,60.0,0.716964,0.283036,0.5,0.109328,0.014109,0.010476,0.025641,4863.768166,0.0,1617.905476,7012.987013,0.75,0.051282,0.027542,638235.0,927.0,20.0,20.0,-47.0,-1072.0,780.0,-2094.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,103.0,0.017755,148.3425,153.695563,5043.645,8405.145,0.0,35111.571429,245781.0,,,0.0,,-7.0,1178.0,1334.0,69432.89321,865055.565,4.0,0.0,0.0,0.0,0.526688,1.038894,7.601345,0.534316,-0.817806,-0.592501,-0.290651,0.111304,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,53093.745,53093.745,9251.775,565.0,0.0,0.0,0.0,0.0,95.448632,11559.247105,1083.545816,53093.745,15.761116,9251.775,1813.524009,219625.695,0.0,-49.0,-587.0,538.0,0.0,0.0,90100.845,34590.195,53093.745,9251.775,-12.0,-31.0,0.514141,-0.752288,1.616157,0.754784,-0.702447,-0.535793,0.056893,0.006947,0.0,0.0,1.0,6.0,11.0,0.0,0.510127,-413.11154,688.495146,-0.059719,2.007889,609097.5,1.158397,1.85132,1.733333,16.461104,2.270797,2.270797,0.003043,0.067329,-5419.0,0.057083,0.028429,0.467976,-5768.0,0.0,,0.440374,-21.403657,-6902.0,1.0,0.0,0.0,,0.0,4.0,,2.530201,,-2.610771,-38.776295,-15734218.5,1.720755,3.216931,0.037602,0,2.0207,2.041,2.0274,1,-0.0,0.0,0.018801,53.18866,,-9e-06,-785.612748,0.509506,2.038022,0.526688,0.487067,-2514.0,-8824,-0.179912,-0.056339,0.123573,-190940.752895,-395038.3,-13141.252895,204097.5,55597.5,186971.805,148500.0,381897.0,227542.5,227542.5,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0
1,0,0,0,270000.0,1293502.5,35698.5,1129500.0,0.003541,-16765,-1188.0,-1186.0,-291,,1,1,0,1,1,0,2.0,1,1,11,0,0,0,0,0,0,13,0.311267,0.622246,,0.0959,0.0529,0.9851,0.796,0.0605,0.08,0.0345,0.2917,0.3333,0.013,0.0773,0.0549,0.0039,0.0098,0.0924,0.0538,0.9851,0.804,0.0497,0.0806,0.0345,0.2917,0.3333,0.0128,0.079,0.0554,0.0,0.0,0.0968,0.0529,0.9851,0.7987,0.0608,0.08,0.0345,0.2917,0.3333,0.0132,0.0787,0.0558,0.0039,0.01,0.0714,1.0,0.0,1.0,0.0,-828.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,3.0,-1976.0,-527.0,-1047.333333,1449.0,68053.5,1035882.0,484191.0,29.070269,1388.581769,612.90394,5.399568,10.531859,8.677472,0.004315,0.014118,0.008318,6737.31,98356.995,56553.99,2.877962,131.845838,70.901357,-2341.0,-746.0,1595.0,0.0,0.0,547.812073,1206.434316,435436.5,900000.0,2.1e-05,0.001071,0.001543,0.05003,1.057664,1.15098,0.989013,,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,0.0,0.0,1.0,2.0,3.0,0.002975,0.00134,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.42019,0.428183,-0.535911,2.110056,-4.18119,1.337309,1.599647,0.545277,0.0,0.0,0.0,,,0.0,0.0,1.0,1.0,1.0,1216.0,0.0,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,810000.0,1216.0,,,,-2434.0,1216.0,-2178.0,1.0,4.0,1.0,0.0,0.0,0.0,0.0,606.0,0.003938,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,-43.0,2088.0,1980.0,19188.078259,1017400.5,2.0,0.0,0.0,0.0,0.459155,-1.386349,-0.52014,-0.831323,-0.242488,-0.712057,0.070022,0.154299,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,2310.0,0.0,0.0,0.0,0.0,100.798053,64754.586,1030.947353,560835.36,2.899015,6662.97,2519.951327,1618864.65,0.0,-544.0,-2324.0,1780.0,,,0.0,0.0,,,-1.0,-14.0,0.47399,0.659627,-0.035899,-0.624043,1.42402,0.239304,-0.727819,1.224179,0.0,0.0,3.0,,,,0.495285,-467.126033,666.118421,-0.137787,4.79075,1563502.5,1.145199,0.799018,4.183333,36.234085,2.970588,1.437225,,0.070862,-3202.0,0.239832,0.050061,1.81393,-1477.0,0.0,,0.695785,-16.104981,-2305.0,0.0,0.0,0.0,,,0.0,,0.179272,,-2.129347,-30.049242,-42409818.0,4.075601,1.432367,0.003541,0,2.8888,2.8723,2.8954,1,-0.0,0.0,0.0,0.0,,-1.9e-05,-5218.396475,0.462155,1.848621,0.495285,0.42019,-358.0,-15577,-0.310978,,,-205245.414,-1228748.0,29056.086,1023502.5,164002.5,-325362.15,859500.0,1257804.0,858066.0,393502.5,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0
2,1,1,0,67500.0,135000.0,6750.0,135000.0,0.010032,-19046,-225.0,-4260.0,-2531,26.0,1,1,1,1,1,0,1.0,2,2,9,0,0,0,0,0,0,22,,0.555912,0.729567,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-815.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,1.0,-714.0,-714.0,-714.0,0.0,20106.0,20106.0,20106.0,24.669939,24.669939,24.669939,3.753045,3.753045,3.753045,0.004605,0.004605,0.004605,5357.25,5357.25,5357.25,6.573313,6.573313,6.573313,-815.0,-815.0,0.0,0.0,0.0,29.793865,29.793865,24282.0,24282.0,0.00026,0.001016,0.001016,0.212008,0.828021,0.828021,0.828021,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.001227,0.001227,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506853,-4.125854,1.233849,-0.810943,0.819096,-1.583013,1.885414,1.163706,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-595.0,-382.0,-977.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,408.0,0.003205,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-382.0,300.0,918.0,386.044202,189037.8,0.0,0.0,0.0,0.0,0.484266,-3.20874,-0.155941,-0.524505,0.269582,0.094367,-0.046783,0.032632,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,784.0,0.0,0.0,0.0,0.0,9.434878,7096.155,14.544656,10573.965,6.738679,5357.25,28.304633,21288.465,0.0,-727.0,-795.0,68.0,,,0.0,0.0,,,-3.0,-11.0,0.525224,-1.700891,1.634542,0.456757,-0.633019,-0.255442,-0.037613,0.026482,0.0,0.0,1.0,,,,0.509493,-193.488025,,-0.041163,2.0,202500.0,1.0,6.341462,2.0,20.0,5.559674,5.559674,,0.011814,-5300.0,0.105128,0.052564,1.051282,-6791.0,0.0,,0.179867,-3.544051,-7606.0,0.0,0.0,0.0,,,0.0,-0.001365,,-19020.0,-0.354405,-30.0,-1518750.0,1.683129,5.226994,0.020064,0,,,,0,-0.0,0.0,0.010032,99.681021,0.038462,,,0.506459,2.025836,0.525224,0.484266,-3445.0,-18821,,,-0.173655,-60403.845,-127903.8,346.155,67500.0,0.0,113711.535,67500.0,128250.0,110718.0,110718.0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
3,0,1,0,135000.0,312682.5,29686.5,297000.0,0.008019,-19005,-3039.0,-9833.0,-2437,,1,1,0,1,0,0,2.0,2,2,17,0,0,0,0,0,0,42,,0.650442,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,0.0,2.0,0.0,-617.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,,,,,13500.0,2482.92,0.799989,1.029197,1.012684,1.316797,1.316797,9.0,-416.0,365243.0,182481.75,365659.0,0.0,906615.0,291695.5,0.0,5008.922652,1358.887335,9.230206,27.839644,17.767287,0.015809,0.15381,0.081751,2482.92,39954.51,23651.175,4.024182,180.641436,96.293912,-617.0,-181.0,436.0,5.0,0.555556,1242.561634,3803.867403,272203.26,688500.0,0.000439,0.004129,0.007275,0.163412,1.012684,1.316797,0.799989,,0.0,0.0,0.0,1.0,1.0,3.0,5.0,0.0,0.0,0.0,2.0,2.0,1.0,4.0,0.015886,0.005525,2.0,,,1.0,1.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,,,,,,,,0.505468,2.847059,-1.193277,-0.546901,-0.548065,0.197115,-2.467181,-0.502496,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,0.0,0.0,0.0,0.0,0.0,6.0,1.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,,,,0.0,0.0,,,0.471819,-2.996367,0.956185,-1.143641,0.37796,0.322572,0.12285,-0.890276,0.0,0.0,691786.89,691786.89,29027.52,545.0,0.0,0.0,0.0,0.0,543.096731,62947.088438,3975.786724,691786.89,4.318122,2482.92,8689.547693,1007153.415,0.0,-12.0,-575.0,563.0,0.0,0.0,865952.01,749841.93,691786.89,29027.52,-1.0,-77.0,0.561795,7.1613,2.248679,2.477131,-3.866771,0.665976,-0.403882,2.419674,0.0,0.0,3.0,0.0,48.0,0.0,0.523314,,,-0.028677,2.316167,447682.5,1.052803,0.310462,2.2,10.532818,1.14871,0.45415,,0.159905,-13489.0,0.466275,0.201313,2.120394,-12270.0,0.2,,2.201914,-7.103394,-12887.0,,,,,,0.0,,,,-1.562036,-9.768509,-90217273.5,4.034879,15.936791,0.016038,0,,,,1,-0.0,0.0,0.008019,124.703828,,,,0.515599,2.062397,0.561795,0.471819,-9216.0,-15966,,,,-72052.911562,-249735.4,33260.588438,177682.5,15682.5,-694470.915,162000.0,282996.0,40479.24,-375817.5,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
4,0,1,0,121500.0,513000.0,21865.5,513000.0,0.028663,-19932,-3038.0,-4311.0,-3458,,1,1,0,1,0,0,1.0,2,2,11,0,0,0,0,1,1,12,,0.322738,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-1106.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,16037.64,,,1.108236,,1.108236,6.0,-2041.0,365243.0,72143.8,367284.0,14616.0,284400.0,166638.75,6.201103,733.391711,248.03877,7.968206,21.858453,12.644075,0.003381,0.045729,0.016725,1834.29,22678.785,12278.805,0.778231,42.88139,16.715844,-2357.0,-374.0,1983.0,1.0,0.166667,222.881532,661.764706,150530.25,247500.0,7.5e-05,0.001244,0.002963,0.159516,1.046356,1.264,0.85093,,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,1.0,3.0,0.0,3.0,5.0,0.005724,0.002674,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.492233,0.206872,-1.706155,-1.707714,-0.435966,2.093007,1.031252,-1.305981,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,,,,,,,,0.0,,,,,,,,,,,,,,,0.0,0.0,,,,-783.0,-783.0,-783.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1149.0,0.00087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,-783.0,0.0,0.0,186.781609,146250.0,0.0,0.0,0.0,0.0,0.493031,-3.843688,0.002791,-0.603251,0.532176,0.838862,-0.111817,-0.095342,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,16037.64,16037.64,16037.64,2326.0,3.0,29857.365,25.402727,22655.655,49.833434,12214.060227,1145.545714,22678.785,0.000125,0.18,3289.00667,806127.975,16.0,-14.0,-2318.0,2304.0,0.0,0.0,96225.84,0.0,16037.64,16037.64,12.0,-31.0,0.501933,0.056196,-1.978048,-0.43754,0.186092,0.663907,0.565579,-0.741146,0.0,0.0,5.0,13.0,18.0,0.0,0.48669,-186.781609,,-0.116697,4.222222,634500.0,1.0,0.636375,4.222222,23.461618,3.407953,2.072727,,0.152418,-8455.0,0.100527,0.023809,0.5586,-7769.0,0.0,,0.482456,-6.095725,-8875.0,0.0,0.0,0.0,,,0.0,,,,-1.097005,-7.197334,-66427389.0,1.246674,3.89783,0.057326,2,,,,1,-0.0,0.0,0.028663,34.888183,,,,0.493472,1.973887,0.501933,0.48669,-3205.0,-16894,,,,-109285.939773,-500785.9,-9651.439773,391500.0,0.0,-293127.975,391500.0,491134.5,362469.75,265500.0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1


time: 1.54 s


In [62]:
grp = GaussianRandomProjection(n_components=10, random_state=2357)

arr = grp.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan)))

time: 1min 27s


In [63]:
proj = pd.DataFrame(arr, 
                    columns=["RAND_PROJ" + str(i+1) for i in range(arr.shape[1])], 
                    index=df.index)

proj.head()

Unnamed: 0,RAND_PROJ1,RAND_PROJ2,RAND_PROJ3,RAND_PROJ4,RAND_PROJ5,RAND_PROJ6,RAND_PROJ7,RAND_PROJ8,RAND_PROJ9,RAND_PROJ10
0,1083332.0,-1600332.0,-3420386.0,5278310.0,-1979387.0,5074353.0,7653430.0,3876388.0,-802971.3,-7818119.0
1,3086248.0,-4502904.0,-8520878.0,12758010.0,-5461605.0,14512910.0,19431220.0,9584260.0,-2026135.0,-19266600.0
2,263462.1,-396058.5,-899339.8,1074632.0,-68391.39,359429.1,665779.4,166658.4,-63713.72,-981440.6
3,4925500.0,-8232414.0,-19077760.0,25511440.0,-11683860.0,28639330.0,44321980.0,22848640.0,-6715022.0,-42679100.0
4,4127197.0,-6389153.0,-15166070.0,19222410.0,-9400587.0,20909010.0,32365970.0,16272870.0,-4966610.0,-31314780.0


time: 52.7 ms


In [64]:
proj.join(sk_id_curr).to_csv(path + "train_proj.csv", index=False, header=True)
del proj
gc.collect()

186

time: 11.3 s


#### Test

In [65]:
df = pd.read_csv(path + "test.csv", usecols=lambda c: "RAND_PROJ" not in c)
df.head()

Unnamed: 0,SK_ID_CURR,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,DAYS_REGISTRATION_DIFF_DAYS_LAST_PHONE_CHANGE,DAYS_BIRTH_DIFF_DAYS_EMPLOYED,EXT_SOURCE_1_DIFF_EXT_SOURCE_2,EXT_SOURCE_1_DIFF_EXT_SOURCE_3,EXT_SOURCE_2_DIFF_EXT_SOURCE_3,AVG_PAYMENT_SIZE_DIFF_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIFF_AMT_CREDIT,AVG_PAYMENT_SIZE_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_GOODS_PRICE,AMT_CREDIT_DIFF_SUM_PAYMENT,AMT_GOODS_PRICE_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIFF_MAX_PREV_REQ_AMOUNT,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,100001,0,1,0,135000.0,568800.0,20560.5,450000.0,0.01885,-19241,-2329.0,-5170.0,-812,,1,1,0,1,0,1,2.0,2,2,18,0,0,0,0,0,0,24,0.752614,0.789654,0.15952,0.066,0.059,0.9732,,,,0.1379,0.125,,,,0.0505,,,0.0672,0.0612,0.9732,,,,0.1379,0.125,,,,0.0526,,,0.0666,0.059,0.9732,,,,0.1379,0.125,,,,0.0514,,,0.0392,0.0,0.0,0.0,0.0,-1740.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,1.0,-1612.0,-1612.0,-1612.0,0.0,23787.0,23787.0,23787.0,13.67069,13.67069,13.67069,6.020501,6.020501,6.020501,0.00346,0.00346,0.00346,3951.0,3951.0,3951.0,2.27069,2.27069,2.27069,-1740.0,-1740.0,0.0,0.0,0.0,14.273276,14.273276,24835.5,24835.5,6e-05,0.00055,0.00055,0.104326,0.957782,0.957782,0.957782,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.000575,0.000575,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.513661,-3.921423,0.977275,-0.190697,1.345474,-0.545294,1.929032,1.411176,603.706712,0.0,0.0,1.0,1.0,0.987405,0.987405,3.0,3.0,3.0,3091.0,0.0,,,,596686.5,596686.5,0.0,8.857143,0.983871,1.774194,0.007155,47.5,0.5,47.0,61.0,0.992481,0.007519,0.052632,0.349547,0.021053,0.000835,0.005848,120775.784672,1800.0,282.105263,1974.736842,0.142857,0.111111,0.015873,884025.0,3091.0,19.0,19.0,-51.0,-1329.0,1778.0,577.0,3.0,7.0,3.0,0.0,0.0,0.0,0.0,49.0,0.029363,,0.0,,0.0,0.0,53216.5875,596686.5,,,0.0,,-6.0,149.0,1523.0,100412.66129,1453365.0,0.0,0.0,0.0,24817.5,0.525046,1.10057,1.523734,1.496514,-0.660367,-1.992638,0.017996,0.257508,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,2916.0,0.0,0.0,0.0,0.0,3.116986,5885.132143,10.686671,17397.9,1.365586,3951.0,21.8189,41195.925,1.0,-1628.0,-2916.0,1288.0,,,0.0,0.0,,,11.0,-36.0,0.485121,-1.311336,-0.289649,-1.265137,0.259213,1.925718,0.03656,1.028292,7.0,7.0,2.0,,,,0.503134,2518.830156,285.999676,-0.151551,4.213333,703800.0,1.264,13.807191,3.333333,27.664697,22.9027,22.9027,0.094803,0.121044,-9239.0,0.043594,0.010347,0.286235,-5982.0,0.0,,0.043663,-7.016267,-7722.0,0.0,0.0,0.0,,,0.0,,,,-1.068578,-8.828038,-47885404.5,6.366995,2.971264,0.0377,0,,,,1,-0.0,0.0,0.01885,53.050398,,-3.9e-05,-14481.055414,0.50674,2.026962,0.525046,0.485121,-3430.0,-16912,-0.03704,0.593095,0.630135,-129114.867857,-562914.9,-14675.367857,433800.0,118800.0,527604.075,315000.0,548239.5,543964.5,543964.5,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0
1,100005,0,1,0,99000.0,222768.0,17370.0,180000.0,0.035792,-18064,-4469.0,-9118.0,-1623,,1,1,0,1,0,0,2.0,2,2,9,0,0,0,0,0,0,46,0.56499,0.291656,0.432962,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,3.0,,,,,,,,2.0,-460.0,-460.0,-460.0,0.0,0.0,40153.5,20076.75,0.0,53.042933,26.521466,8.342371,8.342371,8.342371,0.01102,0.01102,0.01102,4813.2,4813.2,4813.2,6.358256,6.358256,6.358256,-757.0,-315.0,442.0,1.0,0.5,29.469947,58.939894,22308.75,44617.5,0.000144,0.001189,0.001189,0.108964,0.89995,0.89995,0.89995,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.001321,0.001321,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,0.529786,-3.004413,0.852979,-0.301994,1.40546,-1.294547,0.780261,1.127595,617.739835,0.0,0.0,0.0,0.0,0.954794,0.954794,2.0,2.0,2.0,1446.0,0.0,,,,568408.5,568408.5,0.0,5.333333,1.0,0.3125,0.086957,8.5,1.0,7.5,16.0,1.0,0.0,0.0,0.539216,0.117647,0.0,0.0,107036.117647,6882.352941,0.0,0.0,0.0,0.0,0.0,598626.0,1446.0,8.0,8.0,-12.0,-128.0,1324.0,1318.0,2.0,3.0,2.0,0.0,0.0,0.0,0.0,62.0,0.026109,0.0,0.0,0.0,0.0,0.0,50188.368035,568408.5,,,0.0,0.0,-11.0,110.0,311.0,53154.691016,657126.0,1.0,0.0,0.0,4261.5,0.546448,-1.948244,-0.867605,4.826918,-0.613374,-1.4752,0.188919,0.200762,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,706.0,0.0,0.0,0.0,0.0,11.09417,6240.205,37.566479,17656.245,6.539674,4813.2,99.847528,56161.845,1.0,-470.0,-736.0,266.0,,,0.0,0.0,,,1.0,-37.0,0.525405,-1.571981,1.428804,0.404391,-0.61607,-0.355109,-0.043216,-0.162738,0.0,0.0,1.0,,,,0.508932,498.578149,413.987552,-0.039083,2.250182,321768.0,1.2376,3.966536,1.818182,12.82487,9.985678,4.992839,0.071345,0.247398,-13587.0,0.063032,0.028012,0.359252,-10741.0,0.0,,0.200287,-5.480514,-10741.0,3.0,0.0,0.0,,0.0,0.0,,,,-0.961581,-3.886776,-77626530.0,5.617991,,0.071584,0,,,,1,-0.0,0.0,0.035792,27.939204,,-3.1e-05,-10205.983005,0.527643,2.110571,0.546448,0.508932,-9118.0,-13595,0.273335,0.132029,-0.141306,-92759.795,-216527.8,-11129.795,123768.0,42768.0,166606.155,81000.0,205398.0,200459.25,178150.5,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
2,100013,1,1,0,202500.0,663264.0,69777.0,630000.0,0.019101,-20038,-4458.0,-2175.0,-3503,5.0,1,1,0,1,0,0,2.0,2,2,14,0,0,0,0,0,0,57,,0.699787,0.610991,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-856.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,1.0,4.0,4742.415,4742.415,1.079158,1.079158,1.079158,1.079158,1.079158,4.0,-1702.0,-85.0,-710.333333,1617.0,0.0,512370.0,146134.125,0.0,598.563084,177.826452,5.109738,22.128804,11.523312,0.003668,0.025851,0.016079,4742.415,23153.985,11478.195,3.270728,27.049048,15.897086,-1999.0,-222.0,1777.0,1.0,0.25,158.370361,525.700935,130871.25,450000.0,3.4e-05,0.001918,0.003953,0.067217,1.052363,1.1386,0.93933,,0.0,0.0,0.0,0.0,0.0,1.0,3.0,0.0,1.0,0.0,1.0,0.0,1.0,3.0,0.005331,0.003663,2.0,,,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,,,,,,,,0.499304,-0.690857,-0.565602,-0.438265,0.496767,0.94185,0.88094,0.138659,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,0.0,31.75,0.944882,0.811024,0.005744,54.5,19.5,35.0,120.0,0.934538,0.065462,0.136364,0.027611,0.015847,0.001329,0.002502,11763.832141,1358.464615,935.629196,1895.27027,0.75,0.027778,0.016119,0.0,0.0,40.0,40.0,-68.0,-1707.0,-567.0,-4272.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,1210.0,0.002409,14.471514,14.471514,19305.0,19305.0,0.0,0.0,0.0,,,,,-4.0,1330.0,860.0,9516.034492,2072280.06,0.0,2.0,0.0,0.0,0.450881,-1.855564,2.735181,-2.778506,1.382593,1.031266,-0.318153,-0.061797,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18159.919219,161420.22,1743352.245,96.0,1.0,95.0,0.115301,1.02489,230.066978,1944.407308,22086.429911,0.001461,0.012345,0.014493,0.014493,23.0,0.239583,7.0,571500.0,5953.125,157500.0,0.0,,,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.481502,-1.995274,-1.079984,1.425906,-0.458675,-1.500304,-0.189693,1.339213,9484.83,9484.83,4741.245,357347.745,23.58,2705.0,10.0,179437.725,381.708698,23147.82,14.445926,9740.235774,1029.820591,357347.745,0.01181,6.165,2239.118537,1509736.545,11.0,-14.0,-2705.0,2691.0,4718.835,4718.835,15871.995,-357348.915,4742.415,274.32,21.0,-38.0,0.500121,0.701369,-3.623967,-0.465886,1.219061,-0.284452,-0.394729,-0.151084,18.0,0.0,3.0,0.0,3.0,36.0,0.509721,-485.084284,,-0.134994,3.275378,865764.0,1.0528,0.439324,3.111111,9.505482,5.068065,1.47392,,0.222477,-7489.0,0.0481,0.014685,0.139591,-5678.0,0.0,8.888818,0.678463,-10.105799,-6534.0,5.0,1.0,0.0,0.0,0.2,0.0,-0.00025,,-20033.0,-3.482234,-15.652086,-311065866.0,0.620896,2.540888,0.038202,0,,,,1,-0.0,0.0,0.019101,52.35328,0.2,,,0.488306,2.441529,0.509721,0.450881,-1319.0,-15580,,,0.088796,-192759.764226,-653523.8,-60036.764226,460764.0,33264.0,-846472.545,427500.0,593487.0,532392.75,213264.0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
3,100028,0,1,2,315000.0,1575000.0,49018.5,1575000.0,0.026392,-13976,-1866.0,-2000.0,-4208,,1,1,0,1,1,0,4.0,2,2,11,0,0,0,0,0,0,42,0.525734,0.509677,0.612704,0.3052,0.1974,0.997,0.9592,0.1165,0.32,0.2759,0.375,0.0417,0.2042,0.2404,0.3673,0.0386,0.08,0.3109,0.2049,0.997,0.9608,0.1176,0.3222,0.2759,0.375,0.0417,0.2089,0.2626,0.3827,0.0389,0.0847,0.3081,0.1974,0.997,0.9597,0.1173,0.32,0.2759,0.375,0.0417,0.2078,0.2446,0.3739,0.0388,0.0817,0.37,0.0,0.0,0.0,0.0,-1805.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,3.0,,,,,,,,5.0,-1081.0,365243.0,121182.666667,366324.0,0.0,225000.0,92920.5,0.0,151.006711,69.509847,8.507039,21.692944,16.733328,0.010674,0.013423,0.012038,6028.02,11250.0,8091.585,3.339623,8.778839,6.556266,-1805.0,-531.0,1274.0,2.0,0.4,40.92331,82.75596,49207.5,130765.5,7.2e-05,,,0.057708,,,0.902436,,0.0,0.0,0.0,0.0,0.0,1.0,3.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,0.001809,0.001255,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506871,-1.06098,-0.298669,-0.388277,0.796905,0.387967,-0.199159,-1.206917,161.513904,178591.5,178591.5,0.0,0.0,0.838975,0.838975,4.0,4.0,4.0,31491.0,0.0,,,,178591.5,178591.5,0.0,24.75,1.0,0.885522,0.002466,65.5,4.0,61.5,297.0,1.0,0.0,0.0,0.064056,0.015267,0.0,0.0,9514.816939,0.0,0.0,0.0,0.0,0.0,0.0,735750.0,32596.0,60.0,60.0,-69.0,-1862.0,30885.0,23877.0,5.0,12.0,5.0,0.0,0.0,0.0,0.0,269.0,0.013641,0.0,0.0,0.0,0.0,0.0,2458.279889,186304.5,,,0.0,0.0,-20.0,1544.0,1836.0,14667.35831,1520875.08,5.0,0.0,0.0,21084.075,0.505209,5.622416,-1.250694,-1.959916,-3.17416,2.3044,-0.75604,-0.057765,0.0,0.0,22823.55,22823.55,11250.0,11250.0,9.0,12.0,9029.385,5495.775,13711.305,0.060939,8085.058163,37335.915,396167.85,49.0,1.0,48.0,0.035934,0.165937,1461.966014,37335.915,71636.334672,0.006498,0.165937,0.0,0.0,117.0,2.387755,12.0,301663.62,6156.400408,22823.55,0.565555,,,0.0,0.0,0.0,0.0,1.019568,0.165937,0.165937,,,0.474385,-0.824511,1.474199,0.817147,-1.033729,-0.138804,0.003143,-0.12993,16360.11,0.0,11250.0,11250.0,1.17,1773.0,10.0,70348.23,131.908966,8505.0,11.108996,4356.731549,387.931034,38988.54,0.001572,1.17,1255.316553,492310.665,12.0,-29.0,-1785.0,1756.0,0.0,8505.0,22503.51,-23583.33,11250.0,1.17,7.0,-19.0,0.518258,-0.789362,-1.863631,0.100024,-0.152822,-0.011525,0.885663,-1.055896,0.0,0.0,2.0,,,,0.50267,63.696238,22.571788,-0.12686,5.0,1890000.0,1.0,3.199199,5.0,32.130726,32.007316,12.044461,0.164177,0.133515,-5671.0,0.013831,0.002766,0.088879,-6208.0,0.0,4.617891,0.083026,-22.538638,-8013.0,3.0,0.0,0.0,,0.0,0.0,,0.564595,,-3.507334,-26.269293,-91468521.0,0.475285,1.108033,0.052784,0,4.5184,4.5838,4.5389,1,-0.000143,75.78054,0.026392,37.89027,,-3.8e-05,-7347.658072,0.501478,2.507392,0.518258,0.474385,-195.0,-12110,0.016057,-0.08697,-0.103027,-310643.268451,-1570643.0,-44661.768451,1260000.0,0.0,1082689.335,1260000.0,1525981.5,1525792.5,1444234.5,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0
4,100038,1,0,1,180000.0,625500.0,32067.0,625500.0,0.010032,-13040,-2191.0,-4000.0,-4262,16.0,1,1,1,1,0,0,3.0,2,2,5,0,0,0,0,1,1,42,0.202145,0.425687,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-821.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,,,,,24463.71,24463.71,1.118802,1.118802,1.118802,1.118802,1.118802,2.0,-449.0,-449.0,-449.0,0.0,92605.5,508495.5,300550.5,112.795981,4581.040541,2346.918261,8.342387,20.785707,14.564047,0.010161,0.187259,0.09871,11100.6,24463.71,17782.155,13.520828,220.393784,116.957306,-821.0,-111.0,710.0,1.0,0.5,2096.599977,4094.594595,267727.5,454500.0,0.000107,0.005736,0.010079,0.087554,1.131358,1.143913,1.118802,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,1.0,0.001218,0.001218,0.0,,,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,1.0,20.785707,20.785707,20.785707,1.118802,1.118802,532959.21,532959.21,0.568242,1.571133,2.179596,4.183057,1.353692,-0.953153,2.186798,-0.578805,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,787.0,0.0,0.0,0.0,0.0,18.007955,11100.3375,23.81427,11100.6,13.841147,11097.45,216.095461,133204.05,0.0,-466.0,-802.0,336.0,,,0.0,0.0,,,-9.0,-18.0,0.515418,-1.508894,1.59145,0.517567,-0.392059,-0.30697,-0.006584,-0.016673,0.0,0.0,1.0,,,,0.508932,,,-0.060353,3.475,805500.0,1.0,4.695803,3.475,19.506034,2.336331,1.376238,,0.168021,-7012.0,0.061669,0.017746,0.346161,-8262.0,0.0,,0.726619,-13.803681,-9083.0,,,,,,0.0,-0.001227,,-13024.0,-2.459126,-14.635783,-70258797.0,0.938527,4.872107,0.020064,2,,,,1,-7.7e-05,99.681021,0.0,0.0,0.0625,-1.6e-05,-2635.970697,0.530864,1.592592,0.568242,0.508932,-3179.0,-10849,-0.223542,,,-168899.6625,-614399.7,-20966.6625,445500.0,0.0,492295.95,445500.0,593433.0,357772.5,171000.0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1


time: 8.31 s


In [66]:
sk_id_curr = df.pop("SK_ID_CURR")
df.head()

Unnamed: 0,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,TOTALAREA_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR,MIN_PREV_AMT_ANNUITY_12M,MIN_PREV_AMT_ANNUITY_24M,MIN_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_12M,AVG_PREV_PROP_APPROVED_24M,MAX_PREV_PROP_APPROVED_12M,MAX_PREV_PROP_APPROVED_24M,COUNT_PREV_APP,MIN_PREV_DAYS_TERMINATION,MAX_PREV_DAYS_TERMINATION,AVG_PREV_DAYS_TERMINATION,RANGE_PREV_DAYS_TERMINATION,MIN_PREV_AMT_CREDIT,MAX_PREV_AMT_CREDIT,AVG_PREV_AMT_CREDIT,MIN_PREV_AMT_CREDIT_WEIGHTED,MAX_PREV_AMT_CREDIT_WEIGHTED,AVG_PREV_AMT_CREDIT_WEIGHTED,MIN_PREV_AMT_CREDIT_DIV_ANNUITY,MAX_PREV_AMT_CREDIT_DIV_ANNUITY,AVG_PREV_AMT_CREDIT_DIV_ANNUITY,MIN_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MAX_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,AVG_PREV_AMT_CREDIT_DIV_ANNUITY_WEIGHTED,MIN_PREV_AMT_ANNUITY,MAX_PREV_AMT_ANNUITY,AVG_PREV_AMT_ANNUITY,MIN_PREV_AMT_ANNUITY_WEIGHTED,MAX_PREV_AMT_ANNUITY_WEIGHTED,AVG_PREV_AMT_ANNUITY_WEIGHTED,MIN_DAYS_DECISION,MAX_DAYS_DECISION,RANGE_DAYS_DECISION,SUM_DAYS_LAST_DUE_NULL,AVG_DAYS_LAST_DUE_NULL,AVG_PREV_REQ_AMOUNT_WEIGHTED,MAX_PREV_REQ_AMOUNT_WEIGHTED,AVG_PREV_REQ_AMOUNT,MAX_PREV_REQ_AMOUNT,AVG_PREV_RATE_DOWNPAYMENT_WEIGHTED,AVG_PREV_PROP_APPROVED_WEIGHTED,MAX_PREV_PROP_APPROVED_WEIGHTED,AVG_PREV_RATE_DOWNPAYMENT,AVG_PREV_PROP_APPROVED,MAX_PREV_PROP_APPROVED,MIN_PREV_PROP_APPROVED,AVG_PREV_INT_RATE,SUM_PREV_URGENT_NEEDS,SUM_PREV_REPAIRS,SUM_PREV_OTHER,SUM_PREV_LIMIT_REJECT,SUM_REFUSED_CONTRACT,SUM_CANC_CONTRACT,SUM_APPR_CONTRACT,SUM_PREV_HC_REJECT,SUM_PREV_INSURE_REQ,COUNT_PREV_WALK_IN,COUNT_PREV_HIGH_YIELD,COUNT_PREV_LOW_YIELD,SUM_DAYS_LAST_DUE_1ST_VERSION_EQ_DAYS_LAST_DUE,SUM_DAYS_FIRST_DRAWING_SENTINEL,SUM_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,MAX_DAYS_FIRST_DRAWING_SENTINEL_WEIGHTED,SUM_DAYS_LAST_DUE_LT_FIRST_VERSION,MIN_RATE_INTEREST_PRIMARY_12M,AVG_RATE_INTEREST_PRIVILEGED_12M,SUM_REFUSED_CONTRACT_6M,SUM_PRODUCT_COMBINATION_POS_HOUSE_INTEREST_12M,SUM_PRODUCT_COMBINATION_POS_MOBILE_INTEREST_12M,SUM_NAME_GOODS_CATEGORY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_XNA_6M,SUM_NAME_SELLER_INDUSTRY_CSTR_6M,SUM_NAME_PAYMENT_TYPE_XNA_6M,COUNT_NAME_CLIENT_TYPE_REPEATER_12M,COUNT_NAME_CLIENT_TYPE_NEW_12M,AVG_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_ANNUITY_6M,AVG_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,MAX_PREV_AMT_CREDIT_DIV_AMT_GOODS_PRICE_6M,AVG_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,MIN_PREV_AMT_CREDIT_PLUS_AMT_ANNUITY_6M,PREVIOUS_AGG_SYNTHETIC_TARGET,PREVIOUS_AGG_COMP1,PREVIOUS_AGG_COMP2,PREVIOUS_AGG_COMP3,PREVIOUS_AGG_COMP4,PREVIOUS_AGG_COMP5,PREVIOUS_AGG_COMP6,PREVIOUS_AGG_COMP7,SUM_AMT_CREDIT_SUM_DEBT_DIV_DAYS_CREDIT_ENDDATE_ACTIVE_12M,SUM_CC_DEBT_6M,SUM_CC_DEBT_12M,MAX_WORST_DQ_BUREAU_BALANCE_6M,MAX_WORST_DQ_BUREAU_BALANCE_12M,MAX_BUREAU_UTILIZATION_6M,MAX_BUREAU_UTILIZATION_12M,COUNT_ACTIVE_6M,COUNT_ACTIVE_12M,COUNT_ACTIVE_24M,DAYS_REMAINING_ACTIVE,MAX_CREDIT_DAY_OVERDUE_6M,MAX_CREDIT_DAY_OVERDUE_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_6M_12M,BUREAU_UTILIZATION_DIFF_12M_24M,BUREAU_SUM_DEBT_DIFF_6M_12M,BUREAU_SUM_DEBT_DIFF_12M_24M,MAX_CNT_CREDIT_PROLONG,AVG_LEN_BUREAU_BALANCE,PROP_CURRENT,PROP_CLOSED,PROP_CURRENT_WEIGHTED,MAX_AVG_MONTHS_BALANCE_BUREAU_BALANCE,MIN_AVG_MONTHS_BALANCE_BUREAU_BALANCE,RANGE_AVG_MONTHS_BALANCE_BUREAU_BALANCE,SUM_SUM_CURRENT_BUREAU_BALANCE,AVG_PROP_CURRENT,AVG_PROP_DQ,MAX_PROP_DQ,AVG_PROP_CURRENT_WEIGHTED,MIN_PROP_CURRENT_WEIGHTED,AVG_PROP_DQ_WEIGHTED,MAX_PROP_DQ_WEIGHTED,AVG_PROP_CURRENT_WEIGHTED_AMT,MIN_PROP_CURRENT_WEIGHTED_AMT,AVG_PROP_DQ_WEIGHTED_AMT,MAX_PROP_DQ_WEIGHTED_AMT,AVG_WORST_DQ_BUREAU_BALANCE,MAX_WORST_DQ_BUREAU_BALANCE_WEIGHTED,AVG_WORST_DQ_BUREAU_BALANCE_WEIGHTED,TOTAL_AMT_CREDIT_SUM_POS_DAYS,SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_LEN_BUREAU_BALANCE,SUM_LEN_BUREAU_BALANCE,MIN_MIN_MONTHS_BALANCE_BUREAU_BALANCE,MIN_DAYS_CREDIT_ENDDATE,MAX_DAYS_CREDIT_ENDDATE,SUM_DAYS_CREDIT_ENDDATE,SUM_NULL_DAYS_ENDDATE_FACT,COUNT_BUREAU_RECORDS,COUNT_ACTIVE,MAX_CREDIT_DAY_OVERDUE_WEIGHTED,SUM_CREDIT_DAY_OVERDUE_WEIGHTED,MAX_CREDIT_DAY_OVERDUE,SUM_CREDIT_DAY_OVERDUE,DAYS_SINCE_APPLIED,SUM_INVERSE_DAYS_CREDIT,MAX_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,SUM_AMT_CREDIT_MAX_OVERDUE_WEIGHTED,MAX_AMT_CREDIT_MAX_OVERDUE,SUM_AMT_CREDIT_MAX_OVERDUE,SUM_CNT_CREDIT_PROLONG,SUM_AMT_CREDIT_SUM_DEBT_WEIGHTED,SUM_AMT_CREDIT_SUM_DEBT,BUREAU_UTILIZATION_AVG,BUREAU_UTILIZATION_MAX,BUREAU_PROP_SUM_OVERDUE_AVG,BUREAU_PROP_MAX_OVERDUE_AVG,MAX_DAYS_CREDIT_UPDATE,RANGE_DAYS_CREDIT_UPDATE,DAYS_CREDIT_RANGE,TOTAL_AMT_CREDIT_SUM_WEIGHTED,TOTAL_AMT_CREDIT_SUM,COUNT_CREDIT_CARD,COUNT_CAR_LOAN,COUNT_MORTGAGE,SUM_AMT_ANNUITY,BUREAU_AGG_SYNTHETIC_TARGET,BUREAU_AGG_COMP1,BUREAU_AGG_COMP2,BUREAU_AGG_COMP3,BUREAU_AGG_COMP4,BUREAU_AGG_COMP5,BUREAU_AGG_COMP6,BUREAU_AGG_COMP7,MAX_CREDIT_CARD_SK_DPD_6M,MAX_CREDIT_CARD_SK_DPD_12M,MAX_AMT_DRAWINGS_CURRENT_6M,MAX_AMT_DRAWINGS_CURRENT_12M,MAX_AMT_INST_MIN_REGULARITY_6M,MAX_AMT_INST_MIN_REGULARITY_12M,MAX_CNT_DRAWINGS_POS_CURRENT_6M,MAX_CNT_DRAWINGS_POS_CURRENT_12M,SUM_CC_PAYMENT_DIFF_12M,DIFF_AVG_BALANCE_6M_12M,AVG_BALANCE_6M,AVG_UTILIZATION_6M,AVG_BALANCE,MAX_BALANCE,SUM_BALANCE,MAX_MONTHS_BALANCE,MIN_MONTHS_BALANCE,RANGE_MONTHS_BALANCE,AVG_UTILIZATION,MAX_UTILIZATION,AVG_BALANCE_WEIGHTED,MAX_BALANCE_WEIGHTED,SUM_BALANCE_WEIGHTED,AVG_UTILIZATION_WEIGHTED,MAX_UTILIZATION_WEIGHTED,MAX_DPD_WEIGHTED,MAX_DPD_DEF_WEIGHTED,SUM_CNT_DRAWINGS_CURRENT,AVG_CNT_DRAWINGS_CURRENT,MAX_CNT_DRAWINGS_CURRENT,SUM_AMT_DRAWINGS_CURRENT,AVG_AMT_DRAWINGS_CURRENT,MAX_AMT_DRAWINGS_CURRENT,MIN_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,AVG_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,MAX_AMT_PAYMENT_CURRENT_DIV_AMT_INST_MIN_REGULARITY,SUM_CNT_DRAWINGS_ATM_CURRENT_6M,SUM_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_DRAWINGS_ATM_CURRENT_6M,MAX_CNT_DRAWINGS_ATM_CURRENT_6M,MAX_AMT_RECEIVABLE_DIV_AMT_RECEIVABLE_PRINCIPAL_6M,MAX_UTILIZATION_6M,MAX_UTILIZATION_3M,MAX_CREDIT_CARD_INST_AMT_PAST_DUE_6M,MIN_CREDIT_CARD_INST_AMT_PAST_DUE_12M,CREDIT_CARD_AGG_SYNTHETIC_TARGET,CREDIT_CARD_AGG_COMP1,CREDIT_CARD_AGG_COMP2,CREDIT_CARD_AGG_COMP3,CREDIT_CARD_AGG_COMP4,CREDIT_CARD_AGG_COMP5,CREDIT_CARD_AGG_COMP6,CREDIT_CARD_AGG_COMP7,SUM_UNDERPAYMENT_12M,SUM_UNDERPAYMENT_6M,MAX_PAYMENT_SIZE_6M,MAX_PAYMENT_SIZE_12M,MIN_PAYMENT_SIZE_6M,MAX_ABS_DAYS_INSTALMENT,COUNT_UNDERPAYMENT,SUM_UNDERPAYMENT,SUM_UNDERPAYMENT_WEIGHTED,MAX_UNDERPAYMENT,AVG_PAYMENT_SIZE_WEIGHTED,AVG_PAYMENT_SIZE,MAX_PAYMENT_SIZE_WEIGHTED,MAX_PAYMENT_SIZE,MIN_PAYMENT_SIZE_WEIGHTED,MIN_PAYMENT_SIZE,SUM_PAYMENT_WEIGHTED,SUM_PAYMENT,SUM_DAYS_ENTRY_PAYMENT_GT_DAYS_INSTALMENT,MAX_DAYS_ENTRY_PAYMENT,MIN_DAYS_ENTRY_PAYMENT,RANGE_DAYS_ENTRY_PAYMENT,MAX_UNDERPAYMENT_6M,MAX_UNDERPAYMENT_12M,SUM_PAYMENT_6M,SUM_PAYMENT_DIFF_6M_12M,MAX_AMT_INSTALMENT_6M,MIN_AMT_INSTALMENT_6M,MAX_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,MIN_DAYS_ENTRY_PAYMENT_DIFF_DAYS_INSTALMENT_12M,INSTALLMENT_AGG_SYNTHETIC_TARGET,INSTALLMENT_AGG_COMP1,INSTALLMENT_AGG_COMP2,INSTALLMENT_AGG_COMP3,INSTALLMENT_AGG_COMP4,INSTALLMENT_AGG_COMP5,INSTALLMENT_AGG_COMP6,INSTALLMENT_AGG_COMP7,MAX_POS_DPD,MAX_POS_DPD_DEF,NUM_POS_CASH,MIN_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_6M,MAX_CNT_INSTALMENT_FUTURE_PROD_SK_DPD_12M,POS_AGG_SYNTHETIC_TARGET,TOTAL_AMT_CREDIT_SUM_DIV_SUM_DAYS_CREDIT_ENDDATE,TOTAL_AMT_CREDIT_SUM_POS_DAYS_DIV_SUM_DAYS_CREDIT_ENDDATE_POS_DAYS,MAX_ABS_DAYS_INSTALMENT_DIV_DAYS_BIRTH,AMT_CREDIT_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_PLUS_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_GOODS_PRICE,AMT_CREDIT_DIV_SUM_PAYMENT,AMT_GOODS_PRICE_DIV_AMT_INCOME_TOTAL,AMT_CREDIT_DIV_AMT_ANNUITY,AMT_CREDIT_DIV_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIV_MAX_PREV_REQ_AMOUNT,EXT_SOURCE_PROD,DAYS_EMPLOYED_DIV_DAYS_BIRTH,DAYS_EMPLOYED_PLUS_DAYS_REGISTRATION_PLUS_DAYS_LAST_PHONE_CHANGE,AVG_PAYMENT_SIZE_DIV_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIV_AMT_CREDIT,AVG_PAYMENT_SIZE_DIV_AMT_ANNUITY,DAYS_REGISTRATION_PLUS_DAYS_ID_PUBLISH,SUM_REFUSED_CONTRACT_DIV_SUM_APPR_CONTRACT,MAX_UTILIZATION_DIV_AVG_UTILIZATION,MAX_PREV_REQ_AMOUNT_DIV_AMT_CREDIT,AMT_INCOME_TOTAL_DIV_DAYS_BIRTH,SUM_DAYS_ID_REG_PHONE,SUM_REQ_CREDIT_YEAR,SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_1M,SUM_REQ_CREDIT_1M_DIV_SUM_REQ_CREDIT_QRT,SUM_REQ_CREDIT_QRT_DIV_SUM_REQ_CREDIT_YEAR,DEF_30_PLUS_60_CNT_SOCIAL_CIRCLE,OWN_CAR_AGE_DIV_DAYS_BIRTH,LANDAREA_DIV_TOTALAREA_MODE,OWN_CAR_AGE_PLUS_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_BIRTH,AMT_ANNUITY_DIV_DAYS_EMPLOYED,AMT_ANNUITY_PROD_DAYS_EMPLOYED,DAYS_REGISTRATION_DIV_DAYS_ID_PUBLISH,DAYS_REGISTRATION_DIV_DAYS_LAST_PHONE_CHANGE,REGION_RATING_CLIENT_W_CITY_DIV_REGION_POPULATION_RELATIVE,SUM_REG_NOT_FLAG,SUM_AVG_BUILD,SUM_MODE_BUILD,SUM_MEDI_BUILD,SUM_DOC_FLAG,CNT_CHILDREN_DIV_DAYS_BIRTH,CNT_CHILDREN_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_PROD_REGION_POPULATION_RELATIVE,FLAG_OWN_REALTY_DIV_REGION_POPULATION_RELATIVE,FLAG_OWN_CAR_DIV_OWN_CAR_AGE,EXT_SOURCE_1_DIV_DAYS_BIRTH,EXT_SOURCE_1_PROD_DAYS_BIRTH,AVG_AGG_SYNTHETIC_TARGET,SUM_AGG_SYNTHETIC_TARGET,MAX_AGG_SYNTHETIC_TARGET,MIN_AGG_SYNTHETIC_TARGET,DAYS_REGISTRATION_DIFF_DAYS_LAST_PHONE_CHANGE,DAYS_BIRTH_DIFF_DAYS_EMPLOYED,EXT_SOURCE_1_DIFF_EXT_SOURCE_2,EXT_SOURCE_1_DIFF_EXT_SOURCE_3,EXT_SOURCE_2_DIFF_EXT_SOURCE_3,AVG_PAYMENT_SIZE_DIFF_AMT_INCOME_TOTAL,AVG_PAYMENT_SIZE_DIFF_AMT_CREDIT,AVG_PAYMENT_SIZE_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_GOODS_PRICE,AMT_CREDIT_DIFF_SUM_PAYMENT,AMT_GOODS_PRICE_DIFF_AMT_INCOME_TOTAL,AMT_CREDIT_DIFF_AMT_ANNUITY,AMT_CREDIT_DIFF_AVG_PREV_REQ_AMOUNT,AMT_CREDIT_DIFF_MAX_PREV_REQ_AMOUNT,NAME_CONTRACT_TYPE_Cash_loans,NAME_CONTRACT_TYPE_Revolving_loans,NAME_CONTRACT_TYPE_nan,CODE_GENDER_F,CODE_GENDER_M,CODE_GENDER_nan,NAME_TYPE_SUITE_Children,NAME_TYPE_SUITE_Family,NAME_TYPE_SUITE_Group_of_people,NAME_TYPE_SUITE_Other_A,NAME_TYPE_SUITE_Other_B,"NAME_TYPE_SUITE_Spouse,_partner",NAME_TYPE_SUITE_Unaccompanied,NAME_TYPE_SUITE_nan,NAME_INCOME_TYPE_Businessman,NAME_INCOME_TYPE_Commercial_associate,NAME_INCOME_TYPE_Pensioner,NAME_INCOME_TYPE_State_servant,NAME_INCOME_TYPE_Student,NAME_INCOME_TYPE_Unemployed,NAME_INCOME_TYPE_Working,NAME_INCOME_TYPE_nan,NAME_EDUCATION_TYPE_Academic_degree,NAME_EDUCATION_TYPE_Higher_education,NAME_EDUCATION_TYPE_Incomplete_higher,NAME_EDUCATION_TYPE_Lower_secondary,NAME_EDUCATION_TYPE_Secondary_/_secondary_special,NAME_EDUCATION_TYPE_nan,NAME_FAMILY_STATUS_Civil_marriage,NAME_FAMILY_STATUS_Married,NAME_FAMILY_STATUS_Separated,NAME_FAMILY_STATUS_Single_/_not_married,NAME_FAMILY_STATUS_Widow,NAME_FAMILY_STATUS_nan,NAME_HOUSING_TYPE_Co-op_apartment,NAME_HOUSING_TYPE_House_/_apartment,NAME_HOUSING_TYPE_Municipal_apartment,NAME_HOUSING_TYPE_Office_apartment,NAME_HOUSING_TYPE_Rented_apartment,NAME_HOUSING_TYPE_With_parents,NAME_HOUSING_TYPE_nan,OCCUPATION_TYPE_Accountants,OCCUPATION_TYPE_Cleaning_staff,OCCUPATION_TYPE_Cooking_staff,OCCUPATION_TYPE_Core_staff,OCCUPATION_TYPE_Drivers,OCCUPATION_TYPE_HR_staff,OCCUPATION_TYPE_High_skill_tech_staff,OCCUPATION_TYPE_IT_staff,OCCUPATION_TYPE_Laborers,OCCUPATION_TYPE_Low-skill_Laborers,OCCUPATION_TYPE_Managers,OCCUPATION_TYPE_Medicine_staff,OCCUPATION_TYPE_Private_service_staff,OCCUPATION_TYPE_Realty_agents,OCCUPATION_TYPE_Sales_staff,OCCUPATION_TYPE_Secretaries,OCCUPATION_TYPE_Security_staff,OCCUPATION_TYPE_Waiters/barmen_staff,OCCUPATION_TYPE_nan,WEEKDAY_APPR_PROCESS_START_FRIDAY,WEEKDAY_APPR_PROCESS_START_MONDAY,WEEKDAY_APPR_PROCESS_START_SATURDAY,WEEKDAY_APPR_PROCESS_START_SUNDAY,WEEKDAY_APPR_PROCESS_START_THURSDAY,WEEKDAY_APPR_PROCESS_START_TUESDAY,WEEKDAY_APPR_PROCESS_START_WEDNESDAY,WEEKDAY_APPR_PROCESS_START_nan,FONDKAPREMONT_MODE_not_specified,FONDKAPREMONT_MODE_org_spec_account,FONDKAPREMONT_MODE_reg_oper_account,FONDKAPREMONT_MODE_reg_oper_spec_account,FONDKAPREMONT_MODE_nan,HOUSETYPE_MODE_block_of_flats,HOUSETYPE_MODE_specific_housing,HOUSETYPE_MODE_terraced_house,HOUSETYPE_MODE_nan,WALLSMATERIAL_MODE_Block,WALLSMATERIAL_MODE_Mixed,WALLSMATERIAL_MODE_Monolithic,WALLSMATERIAL_MODE_Others,WALLSMATERIAL_MODE_Panel,"WALLSMATERIAL_MODE_Stone,_brick",WALLSMATERIAL_MODE_Wooden,WALLSMATERIAL_MODE_nan,EMERGENCYSTATE_MODE_No,EMERGENCYSTATE_MODE_Yes,EMERGENCYSTATE_MODE_nan
0,0,1,0,135000.0,568800.0,20560.5,450000.0,0.01885,-19241,-2329.0,-5170.0,-812,,1,1,0,1,0,1,2.0,2,2,18,0,0,0,0,0,0,24,0.752614,0.789654,0.15952,0.066,0.059,0.9732,,,,0.1379,0.125,,,,0.0505,,,0.0672,0.0612,0.9732,,,,0.1379,0.125,,,,0.0526,,,0.0666,0.059,0.9732,,,,0.1379,0.125,,,,0.0514,,,0.0392,0.0,0.0,0.0,0.0,-1740.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,1.0,-1612.0,-1612.0,-1612.0,0.0,23787.0,23787.0,23787.0,13.67069,13.67069,13.67069,6.020501,6.020501,6.020501,0.00346,0.00346,0.00346,3951.0,3951.0,3951.0,2.27069,2.27069,2.27069,-1740.0,-1740.0,0.0,0.0,0.0,14.273276,14.273276,24835.5,24835.5,6e-05,0.00055,0.00055,0.104326,0.957782,0.957782,0.957782,,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.000575,0.000575,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.513661,-3.921423,0.977275,-0.190697,1.345474,-0.545294,1.929032,1.411176,603.706712,0.0,0.0,1.0,1.0,0.987405,0.987405,3.0,3.0,3.0,3091.0,0.0,,,,596686.5,596686.5,0.0,8.857143,0.983871,1.774194,0.007155,47.5,0.5,47.0,61.0,0.992481,0.007519,0.052632,0.349547,0.021053,0.000835,0.005848,120775.784672,1800.0,282.105263,1974.736842,0.142857,0.111111,0.015873,884025.0,3091.0,19.0,19.0,-51.0,-1329.0,1778.0,577.0,3.0,7.0,3.0,0.0,0.0,0.0,0.0,49.0,0.029363,,0.0,,0.0,0.0,53216.5875,596686.5,,,0.0,,-6.0,149.0,1523.0,100412.66129,1453365.0,0.0,0.0,0.0,24817.5,0.525046,1.10057,1.523734,1.496514,-0.660367,-1.992638,0.017996,0.257508,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,2916.0,0.0,0.0,0.0,0.0,3.116986,5885.132143,10.686671,17397.9,1.365586,3951.0,21.8189,41195.925,1.0,-1628.0,-2916.0,1288.0,,,0.0,0.0,,,11.0,-36.0,0.485121,-1.311336,-0.289649,-1.265137,0.259213,1.925718,0.03656,1.028292,7.0,7.0,2.0,,,,0.503134,2518.830156,285.999676,-0.151551,4.213333,703800.0,1.264,13.807191,3.333333,27.664697,22.9027,22.9027,0.094803,0.121044,-9239.0,0.043594,0.010347,0.286235,-5982.0,0.0,,0.043663,-7.016267,-7722.0,0.0,0.0,0.0,,,0.0,,,,-1.068578,-8.828038,-47885404.5,6.366995,2.971264,0.0377,0,,,,1,-0.0,0.0,0.01885,53.050398,,-3.9e-05,-14481.055414,0.50674,2.026962,0.525046,0.485121,-3430.0,-16912,-0.03704,0.593095,0.630135,-129114.867857,-562914.9,-14675.367857,433800.0,118800.0,527604.075,315000.0,548239.5,543964.5,543964.5,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0
1,0,1,0,99000.0,222768.0,17370.0,180000.0,0.035792,-18064,-4469.0,-9118.0,-1623,,1,1,0,1,0,0,2.0,2,2,9,0,0,0,0,0,0,46,0.56499,0.291656,0.432962,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,3.0,,,,,,,,2.0,-460.0,-460.0,-460.0,0.0,0.0,40153.5,20076.75,0.0,53.042933,26.521466,8.342371,8.342371,8.342371,0.01102,0.01102,0.01102,4813.2,4813.2,4813.2,6.358256,6.358256,6.358256,-757.0,-315.0,442.0,1.0,0.5,29.469947,58.939894,22308.75,44617.5,0.000144,0.001189,0.001189,0.108964,0.89995,0.89995,0.89995,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.001321,0.001321,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,,,,,,,,0.529786,-3.004413,0.852979,-0.301994,1.40546,-1.294547,0.780261,1.127595,617.739835,0.0,0.0,0.0,0.0,0.954794,0.954794,2.0,2.0,2.0,1446.0,0.0,,,,568408.5,568408.5,0.0,5.333333,1.0,0.3125,0.086957,8.5,1.0,7.5,16.0,1.0,0.0,0.0,0.539216,0.117647,0.0,0.0,107036.117647,6882.352941,0.0,0.0,0.0,0.0,0.0,598626.0,1446.0,8.0,8.0,-12.0,-128.0,1324.0,1318.0,2.0,3.0,2.0,0.0,0.0,0.0,0.0,62.0,0.026109,0.0,0.0,0.0,0.0,0.0,50188.368035,568408.5,,,0.0,0.0,-11.0,110.0,311.0,53154.691016,657126.0,1.0,0.0,0.0,4261.5,0.546448,-1.948244,-0.867605,4.826918,-0.613374,-1.4752,0.188919,0.200762,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,706.0,0.0,0.0,0.0,0.0,11.09417,6240.205,37.566479,17656.245,6.539674,4813.2,99.847528,56161.845,1.0,-470.0,-736.0,266.0,,,0.0,0.0,,,1.0,-37.0,0.525405,-1.571981,1.428804,0.404391,-0.61607,-0.355109,-0.043216,-0.162738,0.0,0.0,1.0,,,,0.508932,498.578149,413.987552,-0.039083,2.250182,321768.0,1.2376,3.966536,1.818182,12.82487,9.985678,4.992839,0.071345,0.247398,-13587.0,0.063032,0.028012,0.359252,-10741.0,0.0,,0.200287,-5.480514,-10741.0,3.0,0.0,0.0,,0.0,0.0,,,,-0.961581,-3.886776,-77626530.0,5.617991,,0.071584,0,,,,1,-0.0,0.0,0.035792,27.939204,,-3.1e-05,-10205.983005,0.527643,2.110571,0.546448,0.508932,-9118.0,-13595,0.273335,0.132029,-0.141306,-92759.795,-216527.8,-11129.795,123768.0,42768.0,166606.155,81000.0,205398.0,200459.25,178150.5,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
2,1,1,0,202500.0,663264.0,69777.0,630000.0,0.019101,-20038,-4458.0,-2175.0,-3503,5.0,1,1,0,1,0,0,2.0,2,2,14,0,0,0,0,0,0,57,,0.699787,0.610991,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-856.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,1.0,4.0,4742.415,4742.415,1.079158,1.079158,1.079158,1.079158,1.079158,4.0,-1702.0,-85.0,-710.333333,1617.0,0.0,512370.0,146134.125,0.0,598.563084,177.826452,5.109738,22.128804,11.523312,0.003668,0.025851,0.016079,4742.415,23153.985,11478.195,3.270728,27.049048,15.897086,-1999.0,-222.0,1777.0,1.0,0.25,158.370361,525.700935,130871.25,450000.0,3.4e-05,0.001918,0.003953,0.067217,1.052363,1.1386,0.93933,,0.0,0.0,0.0,0.0,0.0,1.0,3.0,0.0,1.0,0.0,1.0,0.0,1.0,3.0,0.005331,0.003663,2.0,,,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,,,,,,,,0.499304,-0.690857,-0.565602,-0.438265,0.496767,0.94185,0.88094,0.138659,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,0.0,0.0,0.0,31.75,0.944882,0.811024,0.005744,54.5,19.5,35.0,120.0,0.934538,0.065462,0.136364,0.027611,0.015847,0.001329,0.002502,11763.832141,1358.464615,935.629196,1895.27027,0.75,0.027778,0.016119,0.0,0.0,40.0,40.0,-68.0,-1707.0,-567.0,-4272.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,1210.0,0.002409,14.471514,14.471514,19305.0,19305.0,0.0,0.0,0.0,,,,,-4.0,1330.0,860.0,9516.034492,2072280.06,0.0,2.0,0.0,0.0,0.450881,-1.855564,2.735181,-2.778506,1.382593,1.031266,-0.318153,-0.061797,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18159.919219,161420.22,1743352.245,96.0,1.0,95.0,0.115301,1.02489,230.066978,1944.407308,22086.429911,0.001461,0.012345,0.014493,0.014493,23.0,0.239583,7.0,571500.0,5953.125,157500.0,0.0,,,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.481502,-1.995274,-1.079984,1.425906,-0.458675,-1.500304,-0.189693,1.339213,9484.83,9484.83,4741.245,357347.745,23.58,2705.0,10.0,179437.725,381.708698,23147.82,14.445926,9740.235774,1029.820591,357347.745,0.01181,6.165,2239.118537,1509736.545,11.0,-14.0,-2705.0,2691.0,4718.835,4718.835,15871.995,-357348.915,4742.415,274.32,21.0,-38.0,0.500121,0.701369,-3.623967,-0.465886,1.219061,-0.284452,-0.394729,-0.151084,18.0,0.0,3.0,0.0,3.0,36.0,0.509721,-485.084284,,-0.134994,3.275378,865764.0,1.0528,0.439324,3.111111,9.505482,5.068065,1.47392,,0.222477,-7489.0,0.0481,0.014685,0.139591,-5678.0,0.0,8.888818,0.678463,-10.105799,-6534.0,5.0,1.0,0.0,0.0,0.2,0.0,-0.00025,,-20033.0,-3.482234,-15.652086,-311065866.0,0.620896,2.540888,0.038202,0,,,,1,-0.0,0.0,0.019101,52.35328,0.2,,,0.488306,2.441529,0.509721,0.450881,-1319.0,-15580,,,0.088796,-192759.764226,-653523.8,-60036.764226,460764.0,33264.0,-846472.545,427500.0,593487.0,532392.75,213264.0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1
3,0,1,2,315000.0,1575000.0,49018.5,1575000.0,0.026392,-13976,-1866.0,-2000.0,-4208,,1,1,0,1,1,0,4.0,2,2,11,0,0,0,0,0,0,42,0.525734,0.509677,0.612704,0.3052,0.1974,0.997,0.9592,0.1165,0.32,0.2759,0.375,0.0417,0.2042,0.2404,0.3673,0.0386,0.08,0.3109,0.2049,0.997,0.9608,0.1176,0.3222,0.2759,0.375,0.0417,0.2089,0.2626,0.3827,0.0389,0.0847,0.3081,0.1974,0.997,0.9597,0.1173,0.32,0.2759,0.375,0.0417,0.2078,0.2446,0.3739,0.0388,0.0817,0.37,0.0,0.0,0.0,0.0,-1805.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,3.0,,,,,,,,5.0,-1081.0,365243.0,121182.666667,366324.0,0.0,225000.0,92920.5,0.0,151.006711,69.509847,8.507039,21.692944,16.733328,0.010674,0.013423,0.012038,6028.02,11250.0,8091.585,3.339623,8.778839,6.556266,-1805.0,-531.0,1274.0,2.0,0.4,40.92331,82.75596,49207.5,130765.5,7.2e-05,,,0.057708,,,0.902436,,0.0,0.0,0.0,0.0,0.0,1.0,3.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,0.001809,0.001255,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,0.506871,-1.06098,-0.298669,-0.388277,0.796905,0.387967,-0.199159,-1.206917,161.513904,178591.5,178591.5,0.0,0.0,0.838975,0.838975,4.0,4.0,4.0,31491.0,0.0,,,,178591.5,178591.5,0.0,24.75,1.0,0.885522,0.002466,65.5,4.0,61.5,297.0,1.0,0.0,0.0,0.064056,0.015267,0.0,0.0,9514.816939,0.0,0.0,0.0,0.0,0.0,0.0,735750.0,32596.0,60.0,60.0,-69.0,-1862.0,30885.0,23877.0,5.0,12.0,5.0,0.0,0.0,0.0,0.0,269.0,0.013641,0.0,0.0,0.0,0.0,0.0,2458.279889,186304.5,,,0.0,0.0,-20.0,1544.0,1836.0,14667.35831,1520875.08,5.0,0.0,0.0,21084.075,0.505209,5.622416,-1.250694,-1.959916,-3.17416,2.3044,-0.75604,-0.057765,0.0,0.0,22823.55,22823.55,11250.0,11250.0,9.0,12.0,9029.385,5495.775,13711.305,0.060939,8085.058163,37335.915,396167.85,49.0,1.0,48.0,0.035934,0.165937,1461.966014,37335.915,71636.334672,0.006498,0.165937,0.0,0.0,117.0,2.387755,12.0,301663.62,6156.400408,22823.55,0.565555,,,0.0,0.0,0.0,0.0,1.019568,0.165937,0.165937,,,0.474385,-0.824511,1.474199,0.817147,-1.033729,-0.138804,0.003143,-0.12993,16360.11,0.0,11250.0,11250.0,1.17,1773.0,10.0,70348.23,131.908966,8505.0,11.108996,4356.731549,387.931034,38988.54,0.001572,1.17,1255.316553,492310.665,12.0,-29.0,-1785.0,1756.0,0.0,8505.0,22503.51,-23583.33,11250.0,1.17,7.0,-19.0,0.518258,-0.789362,-1.863631,0.100024,-0.152822,-0.011525,0.885663,-1.055896,0.0,0.0,2.0,,,,0.50267,63.696238,22.571788,-0.12686,5.0,1890000.0,1.0,3.199199,5.0,32.130726,32.007316,12.044461,0.164177,0.133515,-5671.0,0.013831,0.002766,0.088879,-6208.0,0.0,4.617891,0.083026,-22.538638,-8013.0,3.0,0.0,0.0,,0.0,0.0,,0.564595,,-3.507334,-26.269293,-91468521.0,0.475285,1.108033,0.052784,0,4.5184,4.5838,4.5389,1,-0.000143,75.78054,0.026392,37.89027,,-3.8e-05,-7347.658072,0.501478,2.507392,0.518258,0.474385,-195.0,-12110,0.016057,-0.08697,-0.103027,-310643.268451,-1570643.0,-44661.768451,1260000.0,0.0,1082689.335,1260000.0,1525981.5,1525792.5,1444234.5,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0
4,1,0,1,180000.0,625500.0,32067.0,625500.0,0.010032,-13040,-2191.0,-4000.0,-4262,16.0,1,1,1,1,0,0,3.0,2,2,5,0,0,0,0,1,1,42,0.202145,0.425687,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,-821.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,,,,,,,24463.71,24463.71,1.118802,1.118802,1.118802,1.118802,1.118802,2.0,-449.0,-449.0,-449.0,0.0,92605.5,508495.5,300550.5,112.795981,4581.040541,2346.918261,8.342387,20.785707,14.564047,0.010161,0.187259,0.09871,11100.6,24463.71,17782.155,13.520828,220.393784,116.957306,-821.0,-111.0,710.0,1.0,0.5,2096.599977,4094.594595,267727.5,454500.0,0.000107,0.005736,0.010079,0.087554,1.131358,1.143913,1.118802,,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,1.0,0.001218,0.001218,0.0,,,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,1.0,20.785707,20.785707,20.785707,1.118802,1.118802,532959.21,532959.21,0.568242,1.571133,2.179596,4.183057,1.353692,-0.953153,2.186798,-0.578805,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,,,,787.0,0.0,0.0,0.0,0.0,18.007955,11100.3375,23.81427,11100.6,13.841147,11097.45,216.095461,133204.05,0.0,-466.0,-802.0,336.0,,,0.0,0.0,,,-9.0,-18.0,0.515418,-1.508894,1.59145,0.517567,-0.392059,-0.30697,-0.006584,-0.016673,0.0,0.0,1.0,,,,0.508932,,,-0.060353,3.475,805500.0,1.0,4.695803,3.475,19.506034,2.336331,1.376238,,0.168021,-7012.0,0.061669,0.017746,0.346161,-8262.0,0.0,,0.726619,-13.803681,-9083.0,,,,,,0.0,-0.001227,,-13024.0,-2.459126,-14.635783,-70258797.0,0.938527,4.872107,0.020064,2,,,,1,-7.7e-05,99.681021,0.0,0.0,0.0625,-1.6e-05,-2635.970697,0.530864,1.592592,0.568242,0.508932,-3179.0,-10849,-0.223542,,,-168899.6625,-614399.7,-20966.6625,445500.0,0.0,492295.95,445500.0,593433.0,357772.5,171000.0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1


time: 527 ms


In [67]:
grp = GaussianRandomProjection(n_components=10, random_state=2357)

arr = grp.fit_transform(impute.fit_transform(df.replace([-np.inf, np.inf], np.nan)))

time: 12.8 s


In [68]:
proj = pd.DataFrame(arr, 
                    columns=["RAND_PROJ" + str(i+1) for i in range(arr.shape[1])], 
                    index=df.index)

proj.head()

Unnamed: 0,RAND_PROJ1,RAND_PROJ2,RAND_PROJ3,RAND_PROJ4,RAND_PROJ5,RAND_PROJ6,RAND_PROJ7,RAND_PROJ8,RAND_PROJ9,RAND_PROJ10
0,3228880.0,-4067673.0,-10569630.0,14295420.0,-6972493.0,15421230.0,23765890.0,12224200.0,-3052922.0,-23446160.0
1,4975321.0,-6790573.0,-17418510.0,22751370.0,-11099860.0,24230530.0,38806490.0,19753510.0,-5968268.0,-37348200.0
2,20596160.0,-28608350.0,-70609150.0,90753020.0,-43719080.0,96003030.0,153426200.0,77822680.0,-23277870.0,-146838100.0
3,6568142.0,-8709612.0,-20528190.0,27068070.0,-13478580.0,29516540.0,44938420.0,22107920.0,-5739098.0,-43104690.0
4,4898901.0,-6635660.0,-15397680.0,21018830.0,-9744195.0,22288860.0,35295040.0,17055670.0,-5109527.0,-33131860.0


time: 20.6 ms


In [69]:
proj.join(sk_id_curr).to_csv(path + "test_proj.csv", index=False, header=True)
del proj
gc.collect()

7

time: 1.5 s
