# Import Libraries

In [2]:
import gc
import warnings
warnings.filterwarnings('ignore')
import scipy as sp
import numpy as np
import pandas as pd
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.width', 1000)
from tqdm.auto import tqdm
import itertools
from dotenv import dotenv_values

In [3]:
config = dotenv_values('../.env')

In [9]:
def read_preprocess_data():
    train = pd.read_parquet(config["INT_TRAIN_PARQUET"])
    features = train.drop(['customer_ID', 'S_2'], axis = 1).columns.to_list()
    cat_features = [
        "B_30",
        "B_38",
        "D_114",
        "D_116",
        "D_117",
        "D_120",
        "D_126",
        "D_63",
        "D_64",
        "D_66",
        "D_68",
    ]
    num_features = [col for col in features if col not in cat_features]
    
    # Train FE
    print('Starting train feature extraction')
    train_num_agg = train.groupby("customer_ID")[num_features].agg(['first', 'mean', 'std', 'min', 'max', 'last'])
    train_num_agg.columns = ['_'.join(x) for x in train_num_agg.columns]
    train_num_agg.reset_index(inplace = True)
    
    # Lag Features
    for col in train_num_agg:
        if 'last' in col and col.replace('last', 'first') in train_num_agg:
            train_num_agg[col + '_lag_sub'] = train_num_agg[col] - train_num_agg[col.replace('last', 'first')]
            train_num_agg[col + '_lag_div'] = train_num_agg[col] / train_num_agg[col.replace('last', 'first')]

    train_cat_agg = train.groupby("customer_ID")[cat_features].agg(['count', 'first', 'last', 'nunique'])
    train_cat_agg.columns = ['_'.join(x) for x in train_cat_agg.columns]
    train_cat_agg.reset_index(inplace = True)
    
    train_labels = pd.read_csv(config["TRAIN_LABELS_PATH"])
    train = train_num_agg.merge(train_cat_agg, how = 'inner', on = 'customer_ID').merge(train_labels, how = 'inner', on = 'customer_ID')
    print('Train shape: ', train.shape)    
    del train_num_agg, train_cat_agg        
    gc.collect()
    
    # Test FE
    test = pd.read_parquet(config["INT_TEST_PARQUET"])
    print('Starting test feature extraction')
    test_num_agg = test.groupby("customer_ID")[num_features].agg(['first', 'mean', 'std', 'min', 'max', 'last'])
    test_num_agg.columns = ['_'.join(x) for x in test_num_agg.columns]
    test_num_agg.reset_index(inplace = True)
    
     # Lag Features
    for col in test_num_agg:
        if 'last' in col and col.replace('last', 'first') in test_num_agg:
            test_num_agg[col + '_lag_sub'] = test_num_agg[col] - test_num_agg[col.replace('last', 'first')]
            test_num_agg[col + '_lag_div'] = test_num_agg[col] / test_num_agg[col.replace('last', 'first')]

    test_cat_agg = test.groupby("customer_ID")[cat_features].agg(['count', 'first', 'last', 'nunique'])
    test_cat_agg.columns = ['_'.join(x) for x in test_cat_agg.columns]
    test_cat_agg.reset_index(inplace = True)
    
    test = test_num_agg.merge(test_cat_agg, how = 'inner', on = 'customer_ID')
    print('Test shape: ', test.shape)
    del test_num_agg, test_cat_agg
    gc.collect()
    
    
    # Save files to disk
    train.to_parquet(config["ENGINEERED_DATA"] + 'train_fe_plus_plus.parquet')
    test.to_parquet(config["ENGINEERED_DATA"] + 'test_fe_plus_plus.parquet')

In [10]:
read_preprocess_data()

Starting train feature extraction
Train shape:  (458913, 1462)
Starting test feature extraction
Test shape:  (924621, 1461)


In [12]:
train = pd.read_parquet(config["ENGINEERED_DATA"] + 'train_fe_plus_plus.parquet')

In [13]:
train.head()

Unnamed: 0,customer_ID,P_2_first,P_2_mean,P_2_std,P_2_min,P_2_max,P_2_last,D_39_first,D_39_mean,D_39_std,D_39_min,D_39_max,D_39_last,B_1_first,B_1_mean,B_1_std,B_1_min,B_1_max,B_1_last,B_2_first,B_2_mean,B_2_std,B_2_min,B_2_max,B_2_last,R_1_first,R_1_mean,R_1_std,R_1_min,R_1_max,R_1_last,S_3_first,S_3_mean,S_3_std,S_3_min,S_3_max,S_3_last,D_41_first,D_41_mean,D_41_std,D_41_min,D_41_max,D_41_last,B_3_first,B_3_mean,B_3_std,B_3_min,B_3_max,B_3_last,D_42_first,D_42_mean,D_42_std,D_42_min,D_42_max,D_42_last,D_43_first,D_43_mean,D_43_std,D_43_min,D_43_max,D_43_last,D_44_first,D_44_mean,D_44_std,D_44_min,D_44_max,D_44_last,B_4_first,B_4_mean,B_4_std,B_4_min,B_4_max,B_4_last,D_45_first,D_45_mean,D_45_std,D_45_min,D_45_max,D_45_last,B_5_first,B_5_mean,B_5_std,B_5_min,B_5_max,B_5_last,R_2_first,R_2_mean,R_2_std,R_2_min,R_2_max,R_2_last,D_46_first,D_46_mean,D_46_std,D_46_min,D_46_max,D_46_last,D_47_first,D_47_mean,D_47_std,D_47_min,D_47_max,D_47_last,D_48_first,D_48_mean,D_48_std,D_48_min,D_48_max,D_48_last,D_49_first,D_49_mean,D_49_std,D_49_min,D_49_max,D_49_last,B_6_first,B_6_mean,B_6_std,B_6_min,B_6_max,B_6_last,B_7_first,B_7_mean,B_7_std,B_7_min,B_7_max,B_7_last,B_8_first,B_8_mean,B_8_std,B_8_min,B_8_max,B_8_last,D_50_first,D_50_mean,D_50_std,D_50_min,D_50_max,D_50_last,D_51_first,D_51_mean,D_51_std,D_51_min,D_51_max,D_51_last,B_9_first,B_9_mean,B_9_std,B_9_min,B_9_max,B_9_last,R_3_first,R_3_mean,R_3_std,R_3_min,R_3_max,R_3_last,D_52_first,D_52_mean,D_52_std,D_52_min,D_52_max,D_52_last,P_3_first,P_3_mean,P_3_std,P_3_min,P_3_max,P_3_last,B_10_first,B_10_mean,B_10_std,B_10_min,B_10_max,B_10_last,D_53_first,D_53_mean,D_53_std,D_53_min,D_53_max,D_53_last,S_5_first,S_5_mean,S_5_std,S_5_min,S_5_max,S_5_last,B_11_first,B_11_mean,B_11_std,B_11_min,B_11_max,B_11_last,S_6_first,S_6_mean,S_6_std,S_6_min,S_6_max,S_6_last,D_54_first,D_54_mean,D_54_std,D_54_min,D_54_max,D_54_last,R_4_first,R_4_mean,R_4_std,R_4_min,R_4_max,R_4_last,S_7_first,S_7_mean,S_7_std,S_7_min,S_7_max,S_7_last,B_12_first,B_12_mean,B_12_std,B_12_min,B_12_max,B_12_last,S_8_first,S_8_mean,S_8_std,S_8_min,S_8_max,S_8_last,D_55_first,D_55_mean,D_55_std,D_55_min,D_55_max,D_55_last,D_56_first,D_56_mean,D_56_std,D_56_min,D_56_max,D_56_last,B_13_first,B_13_mean,B_13_std,B_13_min,B_13_max,B_13_last,R_5_first,R_5_mean,R_5_std,...,R_7_last_lag_div,D_77_last_lag_sub,D_77_last_lag_div,B_25_last_lag_sub,B_25_last_lag_div,B_26_last_lag_sub,B_26_last_lag_div,D_78_last_lag_sub,D_78_last_lag_div,D_79_last_lag_sub,D_79_last_lag_div,R_8_last_lag_sub,R_8_last_lag_div,R_9_last_lag_sub,R_9_last_lag_div,S_16_last_lag_sub,S_16_last_lag_div,D_80_last_lag_sub,D_80_last_lag_div,R_10_last_lag_sub,R_10_last_lag_div,R_11_last_lag_sub,R_11_last_lag_div,B_27_last_lag_sub,B_27_last_lag_div,D_81_last_lag_sub,D_81_last_lag_div,D_82_last_lag_sub,D_82_last_lag_div,S_17_last_lag_sub,S_17_last_lag_div,R_12_last_lag_sub,R_12_last_lag_div,B_28_last_lag_sub,B_28_last_lag_div,R_13_last_lag_sub,R_13_last_lag_div,D_83_last_lag_sub,D_83_last_lag_div,R_14_last_lag_sub,R_14_last_lag_div,R_15_last_lag_sub,R_15_last_lag_div,D_84_last_lag_sub,D_84_last_lag_div,R_16_last_lag_sub,R_16_last_lag_div,B_29_last_lag_sub,B_29_last_lag_div,S_18_last_lag_sub,S_18_last_lag_div,D_86_last_lag_sub,D_86_last_lag_div,D_87_last_lag_sub,D_87_last_lag_div,R_17_last_lag_sub,R_17_last_lag_div,R_18_last_lag_sub,R_18_last_lag_div,D_88_last_lag_sub,D_88_last_lag_div,B_31_last_lag_sub,B_31_last_lag_div,S_19_last_lag_sub,S_19_last_lag_div,R_19_last_lag_sub,R_19_last_lag_div,B_32_last_lag_sub,B_32_last_lag_div,S_20_last_lag_sub,S_20_last_lag_div,R_20_last_lag_sub,R_20_last_lag_div,R_21_last_lag_sub,R_21_last_lag_div,B_33_last_lag_sub,B_33_last_lag_div,D_89_last_lag_sub,D_89_last_lag_div,R_22_last_lag_sub,R_22_last_lag_div,R_23_last_lag_sub,R_23_last_lag_div,D_91_last_lag_sub,D_91_last_lag_div,D_92_last_lag_sub,D_92_last_lag_div,D_93_last_lag_sub,D_93_last_lag_div,D_94_last_lag_sub,D_94_last_lag_div,R_24_last_lag_sub,R_24_last_lag_div,R_25_last_lag_sub,R_25_last_lag_div,D_96_last_lag_sub,D_96_last_lag_div,S_22_last_lag_sub,S_22_last_lag_div,S_23_last_lag_sub,S_23_last_lag_div,S_24_last_lag_sub,S_24_last_lag_div,S_25_last_lag_sub,S_25_last_lag_div,S_26_last_lag_sub,S_26_last_lag_div,D_102_last_lag_sub,D_102_last_lag_div,D_103_last_lag_sub,D_103_last_lag_div,D_104_last_lag_sub,D_104_last_lag_div,D_105_last_lag_sub,D_105_last_lag_div,D_106_last_lag_sub,D_106_last_lag_div,D_107_last_lag_sub,D_107_last_lag_div,B_36_last_lag_sub,B_36_last_lag_div,B_37_last_lag_sub,B_37_last_lag_div,R_26_last_lag_sub,R_26_last_lag_div,R_27_last_lag_sub,R_27_last_lag_div,D_108_last_lag_sub,D_108_last_lag_div,D_109_last_lag_sub,D_109_last_lag_div,D_110_last_lag_sub,D_110_last_lag_div,D_111_last_lag_sub,D_111_last_lag_div,B_39_last_lag_sub,B_39_last_lag_div,D_112_last_lag_sub,D_112_last_lag_div,B_40_last_lag_sub,B_40_last_lag_div,S_27_last_lag_sub,S_27_last_lag_div,D_113_last_lag_sub,D_113_last_lag_div,D_115_last_lag_sub,D_115_last_lag_div,D_118_last_lag_sub,D_118_last_lag_div,D_119_last_lag_sub,D_119_last_lag_div,D_121_last_lag_sub,D_121_last_lag_div,D_122_last_lag_sub,D_122_last_lag_div,D_123_last_lag_sub,D_123_last_lag_div,D_124_last_lag_sub,D_124_last_lag_div,D_125_last_lag_sub,D_125_last_lag_div,D_127_last_lag_sub,D_127_last_lag_div,D_128_last_lag_sub,D_128_last_lag_div,D_129_last_lag_sub,D_129_last_lag_div,B_41_last_lag_sub,B_41_last_lag_div,B_42_last_lag_sub,B_42_last_lag_div,D_130_last_lag_sub,D_130_last_lag_div,D_131_last_lag_sub,D_131_last_lag_div,D_132_last_lag_sub,D_132_last_lag_div,D_133_last_lag_sub,D_133_last_lag_div,R_28_last_lag_sub,R_28_last_lag_div,D_134_last_lag_sub,D_134_last_lag_div,D_135_last_lag_sub,D_135_last_lag_div,D_136_last_lag_sub,D_136_last_lag_div,D_137_last_lag_sub,D_137_last_lag_div,D_138_last_lag_sub,D_138_last_lag_div,D_139_last_lag_sub,D_139_last_lag_div,D_140_last_lag_sub,D_140_last_lag_div,D_141_last_lag_sub,D_141_last_lag_div,D_142_last_lag_sub,D_142_last_lag_div,D_143_last_lag_sub,D_143_last_lag_div,D_144_last_lag_sub,D_144_last_lag_div,D_145_last_lag_sub,D_145_last_lag_div,B_30_count,B_30_first,B_30_last,B_30_nunique,B_38_count,B_38_first,B_38_last,B_38_nunique,D_114_count,D_114_first,D_114_last,D_114_nunique,D_116_count,D_116_first,D_116_last,D_116_nunique,D_117_count,D_117_first,D_117_last,D_117_nunique,D_120_count,D_120_first,D_120_last,D_120_nunique,D_126_count,D_126_first,D_126_last,D_126_nunique,D_63_count,D_63_first,D_63_last,D_63_nunique,D_64_count,D_64_first,D_64_last,D_64_nunique,D_66_count,D_66_first,D_66_last,D_66_nunique,D_68_count,D_68_first,D_68_last,D_68_nunique,target
0,0000099d6bd597052cdcda90ffabf56573fe9d7c79be5f...,0.938469,0.933824,0.024194,0.86858,0.960384,0.934745,0,0.230769,0.83205,0,3,0,0.008724,0.012007,0.006547,0.00193,0.021655,0.009382,1.006838,1.005086,0.003222,1.000242,1.009672,1.007647,0.009228,0.004509,0.003081,0.000263,0.009228,0.006104,0.124035,0.113215,0.01167,0.098882,0.135021,0.135021,0.0,0.0,0.0,0.0,0.0,0.0,0.004709,0.006456,0.002942,0.000783,0.009866,0.007174,,,,,,,,,,,,,0,0.0,0.0,0,0,0,6,2.846154,2.44425,0,6,5,0.708906,0.725369,0.009515,0.708906,0.740102,0.740102,0.1706,0.14665,0.047205,0.060492,0.231717,0.231717,0,0.0,0.0,0,0,0,0.358587,0.378074,0.085674,0.231009,0.519619,0.420521,0.525351,0.532874,0.006578,0.521311,0.542119,0.539715,0.255736,0.240978,0.076875,0.135586,0.403448,0.192376,-1,-1.0,0.0,-1,-1,-1,0.063902,0.11351,0.04736,0.063902,0.221899,0.149564,0.059416,0.036624,0.023195,0.001681,0.060502,0.058425,0.0,0.0,0.0,0.0,0.0,0.0,0.148698,0.150326,0.002922,0.145179,0.154326,0.153461,4,2.923077,0.954074,2,4,2,0.008207,0.00622,0.00318,0.000519,0.009535,0.009535,0,0.0,0.0,0,0,0,0.207334,0.204972,0.0024,0.200782,0.208214,0.203524,0.736463,0.680138,0.050671,0.581678,0.741813,0.629392,0.096219,0.27028,0.181875,0.096219,0.741934,0.326101,,,,,,,0.023381,0.029112,0.014758,0.007165,0.054221,0.034643,0.002768,0.00723,0.003031,0.002749,0.01026,0.01026,0,0.0,0.0,0,0,0,1.0,1.0,0.0,1.0,1.0,1.0,0,0.0,0.0,0,0,0,0.161345,0.098374,0.026775,0.074646,0.161345,0.105671,0.148266,0.125683,0.011772,0.11106,0.148266,0.112294,2896,2510.0,429.583519,1544,3166,1544,0.354596,0.224432,0.068116,0.148284,0.354596,0.187285,0.152025,0.158571,0.004747,0.152025,0.166636,0.166636,0.118075,0.100432,0.013723,0.074886,0.12074,0.100107,0,0.0,0.0,...,,0.004078,1.009774,-0.001254,0.837789,0.000796,3.927149,0,,0,,0,,0,1.0,-0.002245,0.011503,1,inf,0,,0,,0.004926,3.132041,0,,0,1.0,-0.001483,0.815333,0.0,1.0,6.2e-05,1.000737,0,,0,,0.0,,0,,0,,0,,,,0,,0,,0,1.0,0,,0,,,,0,1.0,0.000974,1.383913,0,,0,,0,,0,,0,,0,1.0,0,,0,,0,,-1,0.666667,-1,0.0,0,,0,,0,,0,,0,,0.023721,1.026531,-0.00376,0.972264,0.024875,1.0273,-0.002545,0.997389,3.8e-05,1.0304,0.176652,1.230409,0,1.0,0.009923,1.009877,0.180251,1.201683,0,1.0,0,1.0,-0.002527,0.746466,0.004105,1.897841,0,1.0,-0.002819,0.997206,0,1.0,0,,,,0,1.0,,,0.0,1.0,-0.109606,0.478215,0.252033,1.372322,0,,0.017536,1.073605,0.028135,1.12121,0.02039,1.086301,0.01751,1.024934,0,1.0,0,,0,1.0,0,,0,1.0,-0.008082,0.991981,0,1.0,0,,,,0.0,,0.0,,,,0.001865,1.429228,0,,,,0,1.0,0,1.0,0,1.0,0,1.0,0,,0,,0.0,,,,0,,0.00236,4.870063,0,,13,0,0,1,13,2,2,1,13,1,1,1,13,0,0,1,13,5,5,1,13,0,0,1,13,2,2,1,13,0,0,1,13,0,0,1,13,-1,-1,1,13,6,6,1,0
1,00000fd6641609c6ece5454664794f0340ad84dddce9a2...,0.929122,0.89982,0.022119,0.861109,0.929122,0.880519,13,7.153846,6.743468,0,19,6,0.025782,0.025654,0.027756,0.006711,0.109644,0.034684,1.002647,0.991083,0.051531,0.819772,1.008534,1.004028,0.005515,0.006246,0.002129,0.001023,0.008996,0.006911,0.089799,0.120578,0.023824,0.089799,0.165509,0.165509,0.0,0.0,0.0,0.0,0.0,0.0,0.00583,0.005663,0.003354,0.000861,0.012861,0.005068,,,,,,,0.5256,0.144571,0.169598,0.060646,0.5256,0.060646,0,0.0,0.0,0,0,0,1,0.846154,0.800641,0,3,1,0.239459,0.256461,0.009261,0.239459,0.267228,0.266275,0.070967,0.035462,0.043899,0.004075,0.165146,0.027,0,0.0,0.0,0,0,0,0.457826,0.452041,0.013177,0.432424,0.471737,0.438828,0.382562,0.392433,0.006671,0.382562,0.402878,0.402195,0.059342,0.048203,0.031312,0.010117,0.105999,0.014696,-1,-1.0,0.0,-1,-1,-1,0.201574,0.20227,0.015915,0.167634,0.226641,0.167634,0.03239,0.028049,0.013631,0.015836,0.068204,0.028411,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,1,1.153846,0.375534,1,2,1,0.007561,0.010298,0.011024,0.001722,0.045093,0.012926,0,0.538462,0.518875,0,1,1,0.110471,0.158313,0.06703,0.103495,0.242366,0.242366,0.619012,0.566665,0.03688,0.510142,0.619012,0.570898,0.302757,0.298815,0.003047,0.294,0.302757,0.29713,,,,,,,0.025802,0.016785,0.017104,0.002045,0.052949,0.043929,0.011677,0.013792,0.021041,0.000416,0.081246,0.01457,0,0.0,0.0,0,0,0,1.0,1.0,0.0,1.0,1.0,1.0,0,0.0,0.0,0,0,0,0.072583,0.103002,0.035143,0.072583,0.208516,0.208516,0.026337,0.025823,0.004665,0.01905,0.032917,0.01905,1880,1286.461538,772.374544,0,2402,1284,0.052813,0.048069,0.007596,0.036112,0.06077,0.036112,0.684371,0.705671,0.01854,0.684371,0.748383,0.748383,0.03649,0.046753,0.024456,0.008499,0.073904,0.017684,0,0.0,0.0,...,,0.005431,1.02443,-0.005868,0.782828,-0.005652,0.031125,0,,0,,0,,0,1.0,0.005703,5.643738,0,,0,,0,,0.002671,1.98757,0,,0,1.0,0.004617,6.794226,0.0,1.0,-0.00088,0.957201,0,,0,,0.0,,0,,0,,0,,,,0,,0,,0,1.0,0,,0,,,,0,1.0,0.002934,2.360076,0,,0,,0,,1,-0.0,0,,0,1.0,0,,0,,0,,0,,0,,0,,0,,0,,0,,0,,0.005968,1.006523,-0.002576,0.980982,0.004524,1.004885,0.001209,1.001238,-0.002829,0.531747,0.000582,1.559447,0,,0.0,,,,0,1.0,0,,0.002331,1.454646,0.008995,1.376319,0,1.0,0.003731,1.003716,0,1.0,0,,,,0,1.0,,,0.0,1.0,-0.010875,0.645599,-0.025032,0.921097,0,,0.024211,1.05629,0.027666,1.066128,0.020535,1.049321,0.024195,1.045898,0,1.0,0,,0,1.0,0,,0,,-0.00341,0.996599,0,,0,,,,0.0,,0.0,,,,0.001707,2.324799,0,,,,0,1.0,0,1.0,0,1.0,0,1.0,0,,0,,0.0,,,,0,,0.003142,117.991577,0,,13,0,0,1,13,2,2,1,13,1,1,1,13,0,0,1,13,0,0,1,13,0,0,2,13,2,2,1,13,3,3,1,13,0,0,1,13,-1,-1,1,13,6,6,1,0
2,00001b22f846c82c51f6e3958ccd81970162bae8b007e8...,0.876615,0.878454,0.028911,0.79767,0.904482,0.880875,0,0.0,0.0,0,0,0,0.001472,0.004386,0.002786,0.001472,0.009997,0.004284,0.810796,0.815677,0.003545,0.810796,0.819987,0.812649,0.005955,0.006621,0.001919,0.00354,0.009443,0.00645,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.004826,0.005493,0.002834,0.000626,0.009383,0.007196,,,,,,,,,,,,,0,0.076923,0.27735,0,1,0,1,2.230769,1.69085,1,7,2,0.222406,0.236871,0.008896,0.222406,0.251598,0.251598,0.005358,0.004618,0.003043,0.000215,0.008656,0.001557,0,0.0,0.0,0,0,0,0.438652,0.464475,0.060166,0.413028,0.647064,0.433713,0.31829,0.328617,0.007183,0.31829,0.339566,0.339125,0.081635,0.092284,0.060616,0.030227,0.255134,0.08037,-1,-1.0,0.0,-1,-1,-1,0.168822,0.176674,0.024615,0.129857,0.213943,0.183628,0.029138,0.034433,0.015459,0.021261,0.079764,0.026981,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,0,0.615385,0.50637,0,1,1,0.003663,0.00473,0.003302,0.000422,0.009521,0.009392,0,0.0,0.0,0,0,0,0.200082,0.199863,0.00299,0.195188,0.203649,0.202159,0.634722,0.618191,0.075604,0.381123,0.678706,0.628938,0.222126,0.273711,0.052875,0.162125,0.302619,0.296313,,,,,,,0.007875,0.005948,0.002943,0.001054,0.00873,0.001824,0.001677,0.004683,0.002312,0.000111,0.007619,0.005092,1,1.0,0.0,1,1,1,1.0,1.0,0.0,1.0,1.0,1.0,0,0.0,0.0,0,0,0,,,,,,,0.011923,0.011541,0.002969,0.0061,0.015486,0.007158,0,0.0,0.0,0,0,0,0.073229,0.077362,0.016318,0.057529,0.09923,0.098963,0.20153,0.208154,0.003188,0.20153,0.211538,0.209386,0.002824,0.003778,0.002688,0.000427,0.008332,0.001749,0,0.0,0.0,...,,5e-06,1.000012,0.000908,1.139309,0.004616,1.898658,0,,0,,0,,0,1.0,0.000904,1.107547,0,,0,,0,,0.003329,2.551273,0,,0,1.0,-0.004312,0.035563,0.0,1.0,0.011269,1.600885,0,,0,,0.0,,0,,0,,0,,,,0,,0,,0,1.0,0,,0,,,,0,1.0,0.002361,1.605759,0,,0,,0,,0,,0,,0,1.0,0,,0,,0,,0,,0,,0,,0,,0,,0,,0,,0.007301,1.024701,6.8e-05,1.000515,0.000476,1.005537,-0.003049,0.996874,-0.001651,0.740276,0.001335,1.15799,0,,0.0,,,,0,1.0,0,,-0.001389,0.789071,-0.001912,0.711859,0,1.0,-2.5e-05,0.999975,0,1.0,0,,,,0,1.0,,,0.0,1.0,0.007509,1.431727,,,0,,0.020057,1.054418,0.021439,1.061854,0.030788,1.091027,0.024646,1.058686,0,1.0,0,,0,1.0,0,,0,,0.0,,0,,0,,,,0.0,,0.0,,,,0.007577,4.287718,0,,,,0,1.0,0,1.0,0,1.0,0,1.0,0,,0,,0.0,,,,0,,-0.001904,0.304443,0,,13,0,0,1,13,1,1,1,13,0,1,2,13,0,0,1,13,0,0,1,13,0,0,1,13,2,2,1,13,3,3,1,13,2,2,1,13,-1,-1,1,13,6,6,1,0
3,000041bdba6ecadd89a52d11886e8eaaec9325906c9723...,0.567442,0.598969,0.020107,0.567442,0.623392,0.621776,9,1.538462,3.017046,0,9,0,0.070311,0.059876,0.080531,0.00591,0.279991,0.012564,0.812053,0.955264,0.080981,0.812053,1.009999,1.006183,0.004228,0.005665,0.003473,0.000199,0.009915,0.007829,0.40742,0.24775,0.095122,0.149216,0.40742,0.287766,0.0,0.0,0.0,0.0,0.0,0.0,0.010927,0.006423,0.00336,5.3e-05,0.010927,0.009937,,,,,,,0.006633,0.061026,0.041993,0.006633,0.149891,0.046104,0,0.0,0.0,0,0,0,8,2.230769,2.832956,0,8,0,0.056394,0.069334,0.008501,0.056394,0.085103,0.085103,0.000228,0.088374,0.074462,0.000228,0.283781,0.118818,0,0.0,0.0,0,0,0,0.471676,0.431905,0.030525,0.384254,0.471676,0.410723,0.39223,0.403269,0.006355,0.39223,0.414224,0.414224,0.176105,0.076686,0.063902,0.005276,0.177252,0.013057,-1,-1.0,0.0,-1,-1,-1,0.079987,0.160625,0.031266,0.079987,0.196887,0.174331,0.252338,0.06213,0.07359,0.004301,0.252338,0.011969,1.004358,1.004676,0.001928,1.002021,1.008767,1.005561,0.341256,0.439581,0.044539,0.341256,0.482535,0.430318,0,0.076923,0.27735,0,1,1,0.026897,0.052241,0.053342,0.001702,0.176352,0.020526,0,0.615385,0.650444,0,2,2,0.201745,0.199698,0.00213,0.1953,0.203203,0.198356,0.582652,0.610934,0.09009,0.3451,0.704214,0.67208,0.297839,0.306553,0.079528,0.192981,0.431901,0.411625,0.006409,0.004336,0.003589,0.000346,0.00999,0.001379,0.068346,0.056297,0.044583,0.002999,0.150845,0.02297,0.04314,0.044294,0.071076,0.000672,0.241378,0.005491,0,0.0,0.0,0,0,0,1.0,1.0,0.0,1.0,1.0,1.0,0,0.0,0.0,0,0,0,0.365518,0.261497,0.078128,0.152622,0.370595,0.279464,0.014082,0.048949,0.02528,0.009411,0.077831,0.074835,1454,961.307692,405.585048,528,1511,528,0.094076,0.061726,0.018374,0.0214,0.094076,0.0214,0.579588,0.564632,0.018147,0.533675,0.580167,0.554483,0.013755,0.081928,0.041875,0.013755,0.124311,0.055897,0,0.0,0.0,...,,-0.003368,0.991674,-0.019991,0.41644,0.000536,1.120597,0,,0,,0,,0,1.0,0.001893,1.392863,0,,0,,1,inf,0.005404,3.143917,0,,0,1.0,0.00265,1.529328,0.0,1.0,-0.081134,0.114552,0,,0,,0.0,,0,,0,,1,inf,,,0,,0,,0,1.0,0,,0,,,,0,1.0,-0.003136,0.625393,0,,0,,0,,0,,0,,0,1.0,0,,0,,0,,1,inf,0,,0,,0,,0,,0,,0,,-0.007693,0.991811,-0.006725,0.951811,0.007098,1.007471,-0.000634,0.99935,0.037624,7.181901,-0.006894,0.262062,0,,0.0,,,,0,1.0,0,,0.004397,13.622044,-0.06591,0.100635,0,1.0,0.000903,1.0009,0,1.0,0,,,,0,1.0,,,0.992765,138.22081,-0.285895,0.097893,0.671174,72.179962,0,1.0,-0.435693,0.119895,0.022085,1.601958,0.030592,1.951677,0.013861,1.022528,-1,0.666667,0,,-1,0.933333,0,,0,,0.001741,1.00174,0,1.0,0,,,,0.0,,0.0,,,,-0.00293,0.379152,0,,,,0,1.0,0,1.0,0,1.0,0,1.0,0,,0,,0.0,,,,0,,0.003687,2.968755,0,,13,0,0,1,13,2,2,1,13,1,1,1,13,0,0,1,13,0,7,2,13,0,0,1,13,2,2,1,13,3,3,1,13,0,0,1,13,-1,-1,1,13,2,3,3,0
4,00007889e4fcd2614b6cbe7f8f3d2e5c728eca32d9eb8a...,0.936842,0.891679,0.042325,0.805045,0.940382,0.8719,0,0.0,0.0,0,0,0,0.003433,0.005941,0.002475,0.000776,0.009806,0.007679,0.818691,0.814543,0.003143,0.81067,0.819947,0.815746,0.007243,0.00418,0.002581,0.000336,0.009076,0.001247,0.16619,0.173102,0.004669,0.16619,0.176403,0.176403,0.0,0.0,0.0,0.0,0.0,0.0,0.005927,0.005088,0.00291,4.9e-05,0.009686,0.005528,,,,,,,0.061963,0.048778,0.006847,0.037001,0.061963,0.044671,0,0.0,0.0,0,0,0,5,11.692308,9.384248,3,25,21,0.28864,0.20915,0.117203,0.06315,0.305305,0.069952,0.003367,0.004572,0.002297,0.001201,0.00783,0.004855,0,0.0,0.0,0,0,0,0.464017,0.474523,0.076167,0.366783,0.694332,0.465525,0.465739,0.471961,0.007588,0.461473,0.484715,0.480303,0.141613,0.253697,0.093176,0.13784,0.491528,0.325121,-1,-1.0,0.0,-1,-1,-1,0.044372,0.075672,0.046857,0.030852,0.195757,0.048857,0.035662,0.11529,0.070823,0.035662,0.216773,0.159818,0.0,0.386868,0.509339,0.0,1.008826,1.005185,0.136212,0.093218,0.020103,0.073834,0.136212,0.095238,1,0.153846,0.375534,0,1,0,0.005475,0.006685,0.002242,0.002925,0.009847,0.004027,1,0.153846,0.375534,0,1,0,0.193705,0.23347,0.028414,0.191802,0.25644,0.253811,0.559941,0.527254,0.088509,0.254276,0.584359,0.570419,0.058786,0.100315,0.074579,0.044728,0.260673,0.125195,,,,,,,0.008094,0.005051,0.002665,0.002389,0.00935,0.00935,0.009522,0.005017,0.003694,0.000714,0.009807,0.001001,0,0.846154,0.375534,0,1,1,1.0,1.0,0.0,1.0,1.0,1.0,0,0.0,0.0,0,0,0,0.121961,0.12029,0.008589,0.108082,0.128201,0.122915,0.151135,0.04964,0.060154,0.005756,0.151135,0.013041,0,157.076923,383.420018,0,1021,0,0.125503,0.203298,0.041725,0.125503,0.254067,0.254067,0.172873,0.178482,0.009615,0.163719,0.190924,0.183075,0.00198,0.004422,0.002974,0.000626,0.008859,0.006051,0,0.0,0.0,...,,0.329989,6.27331,0.005356,2.28369,0.000365,1.06714,0,,0,,0,,0,1.0,0.005559,3.764053,1,2.0,0,,0,,-0.003025,0.318541,0,,0,1.0,-0.001604,0.818751,0.0,1.0,0.187859,4.010813,0,,0,,0.0,,0,,0,,0,,,,0,,0,,0,1.0,0,,0,,,,0,1.0,-0.003683,0.619433,0,,0,,0,,0,,0,,0,1.0,0,,0,,0,,0,,0,,0,,0,,0,,0,,0,,-1.9e-05,0.999938,0.000427,1.003247,-0.001648,0.980259,0.002106,1.002172,0.001991,6.613118,0.220124,1.596344,0,1.0,0.00658,1.006876,0.176426,1.278698,0,1.0,0,1.0,0.00077,1.513138,0.002388,1.442392,0,1.0,0.002648,1.002637,0,1.0,0,,,,0,1.0,,,0.0,1.0,-0.073825,0.612755,,,0,,0.0227,1.053314,0.022851,1.054473,0.023399,1.056687,0.023476,1.043286,0,1.0,0,,0,1.0,0,,0,,0.004443,1.004436,0,1.0,0,,,,-0.002086,0.997931,0.0,,,,0.001658,1.489645,0,,,,0,1.0,0,1.0,0,1.0,0,1.0,0,,0,,0.0,,,,0,,0.003077,1.795758,0,,13,0,0,1,13,2,1,2,13,1,1,1,13,0,0,1,13,5,5,1,13,0,0,1,13,2,2,1,13,3,3,1,13,0,0,1,13,1,1,1,13,6,6,1,0


In [14]:
train.isnull().sum()

customer_ID        0
P_2_first       2434
P_2_mean        2434
P_2_std         7829
P_2_min         2434
                ... 
D_68_count         0
D_68_first         0
D_68_last          0
D_68_nunique       0
target             0
Length: 1462, dtype: int64