In [1]:
%%capture

## Import Libraries
import numpy as np # linear algebra
from numpy.random import seed 
import math 

import pandas as pd # data processing 
# Widen pandas' display limits so the very wide (300+ column) frames used in
# this notebook are rendered without truncation.
pd.options.display.max_rows = 1000
pd.options.display.max_seq_items = 2000
pd.set_option('display.max_columns', None)
pd.set_option('display.expand_frame_repr', False)
# None means "never truncate cell contents". The old -1 sentinel has been
# deprecated since pandas 1.0, so use None and the fully qualified option key.
pd.set_option('display.max_colwidth', None)

import datetime as dt
# NOTE(review): the import below rebinds the name `dt` to datatable's `dt`,
# so the `datetime` alias created on the previous line is shadowed from here on.
from datatable import dt, f

import matplotlib.pyplot as plt
import matplotlib.ticker as ticker
import matplotlib.dates as mpl_dates
plt.rcParams.update({'font.size': 14})
import seaborn as sns
# Matplotlib 3.6 renamed its bundled seaborn style sheets to 'seaborn-v0_8*'
# and later dropped the old aliases. Prefer the new name when this Matplotlib
# ships it and fall back to the historical name on older releases.
plt.style.use('seaborn-v0_8' if 'seaborn-v0_8' in plt.style.available else 'seaborn')
sns.set_style('whitegrid')


from sklearn.metrics import mean_squared_error
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.linear_model import LinearRegression

import warnings # Suppress warnings
# Installs a global 'ignore' filter: every warning category is silenced for
# the rest of the session.
warnings.filterwarnings('ignore')

import statsmodels as sm

import joblib

# Fix seed for reproducible results
# Only NumPy's legacy global random state is seeded here.
SEED = 42
np.random.seed(SEED)

## Import Data

In [2]:
### Used method from Kaggle to reduce memory usage. 
## Don't know original source
def reduce_mem_usage(df, use_float16=True):
    """Downcast the columns of ``df`` to the smallest dtype that holds their values.

    The frame is modified in place and also returned. Memory usage before and
    after, and the percentage saved, are printed.

    Column handling:
      * signed integers   -> smallest of int8/int16/int32/int64 that fits
      * unsigned integers -> smallest of uint8/uint16/uint32/uint64 that fits
        (they are never routed through a float type, which would corrupt
        large ids: float16 only represents integers exactly up to 2048)
      * floats            -> float16/float32 chosen by value *range* only
      * object / pandas string columns -> ``category``
      * everything else (bool, datetime, categorical, nullable extension
        dtypes, ...) is left untouched

    A column is only ever made narrower, never wider, and a column whose
    min/max cannot be compared (empty or all-NaN) keeps its dtype.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame to shrink; mutated in place.
    use_float16 : bool, default True
        When True (the historical behaviour) float columns whose range fits
        are stored as float16. This is lossy: float16 keeps roughly three
        significant decimal digits. Pass False to stop at float32.

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object, after downcasting.
    """
    start_mem = df.memory_usage().sum() / 1024**2
    print('Memory usage of dataframe is {:.2f} MB'.format(start_mem))

    signed_types = (np.int8, np.int16, np.int32, np.int64)
    unsigned_types = (np.uint8, np.uint16, np.uint32, np.uint64)
    float_types = (np.float16, np.float32) if use_float16 else (np.float32,)

    for col in df.columns:
        col_type = df[col].dtype

        # Text columns become categoricals, as before.
        if col_type == object or isinstance(col_type, pd.StringDtype):
            df[col] = df[col].astype('category')
            continue

        # Extension dtypes (categorical, nullable ints, ...) are not plain
        # NumPy numerics; min/max or astype could fail or lose NA, so skip.
        if not isinstance(col_type, np.dtype):
            continue

        if col_type.kind == 'i':
            candidates, limits_of = signed_types, np.iinfo
        elif col_type.kind == 'u':
            candidates, limits_of = unsigned_types, np.iinfo
        elif col_type.kind == 'f':
            candidates, limits_of = float_types, np.finfo
        else:
            # bool, datetime64, timedelta64, complex, ...: nothing to downcast.
            continue

        new_type = _smallest_fitting_dtype(df[col].min(), df[col].max(), candidates, limits_of)
        # Only ever shrink a column; never widen one that is already compact.
        if new_type is not None and np.dtype(new_type).itemsize < col_type.itemsize:
            df[col] = df[col].astype(new_type)

    end_mem = df.memory_usage().sum() / 1024**2
    print('Memory usage after optimization is: {:.2f} MB'.format(end_mem))
    # Guard the percentage against a zero-sized frame.
    saved_pct = 100 * (start_mem - end_mem) / start_mem if start_mem else 0.0
    print('Decreased by {:.1f}%'.format(saved_pct))

    return df


def _smallest_fitting_dtype(c_min, c_max, candidates, limits_of):
    """Return the first dtype in ``candidates`` whose range contains [c_min, c_max].

    Bounds are inclusive. Returns None when nothing fits, which also covers
    NaN bounds because every comparison with NaN is False.
    """
    for candidate in candidates:
        limits = limits_of(candidate)
        if limits.min <= c_min and c_max <= limits.max:
            return candidate
    return None

In [3]:
%%time

## Import data
# Location of the original competition files (not referenced by the loader call in this cell).
data_folder = "../input/ubiquant-market-prediction/"
# Location of the parquet copies; this is the path handed to read_datasets() in this cell.
data_folder_parquet = "../input/ubiquant-parquet/"

def read_datasets(path):
    """Read the example submission, example test and training parquet files.

    ``path`` is concatenated directly with each file name, so it must already
    end with a path separator. A progress message is printed before each read
    and the head of each frame is displayed afterwards. The training frame has
    its ``row_id`` column dropped and is passed through ``reduce_mem_usage``.

    Returns
    -------
    tuple
        ``(train, test, example_submission)``.
    """
    def _announce_and_read(message, filename):
        # Print the progress line, then read the parquet file at path + filename.
        print(message)
        return pd.read_parquet(path + filename)

    example_submission = _announce_and_read(
        'Loading Example Sample Submission file...',
        "example_sample_submission.parquet",
    )
    display(example_submission.head())

    test = _announce_and_read('Loading Example Test file...', "example_test.parquet")
    display(test.head())

    raw_train = _announce_and_read('Loading Train file...', "train_low_mem.parquet")
    train = reduce_mem_usage(raw_train.drop(columns=['row_id']))
    display(train.head())

    return train, test, example_submission

# Load all three frames from the parquet directory (data_folder_parquet).
train, test, example_submission = read_datasets(data_folder_parquet)

Loading Example Sample Submission file...


Unnamed: 0,row_id,time_id,target
0,1220_1,1220,0
1,1220_2,1220,0
2,1221_0,1221,0
3,1221_1,1221,0
4,1221_2,1221,0


Loading Example Test file...


Unnamed: 0,row_id,time_id,investment_id,f_0,f_1,f_2,f_3,f_4,f_5,f_6,f_7,f_8,f_9,f_10,f_11,f_12,f_13,f_14,f_15,f_16,f_17,f_18,f_19,f_20,f_21,f_22,f_23,f_24,f_25,f_26,f_27,f_28,f_29,f_30,f_31,f_32,f_33,f_34,f_35,f_36,f_37,f_38,f_39,f_40,f_41,f_42,f_43,f_44,f_45,f_46,f_47,f_48,f_49,f_50,f_51,f_52,f_53,f_54,f_55,f_56,f_57,f_58,f_59,f_60,f_61,f_62,f_63,f_64,f_65,f_66,f_67,f_68,f_69,f_70,f_71,f_72,f_73,f_74,f_75,f_76,f_77,f_78,f_79,f_80,f_81,f_82,f_83,f_84,f_85,f_86,f_87,f_88,f_89,f_90,f_91,f_92,f_93,f_94,f_95,f_96,f_97,f_98,f_99,f_100,f_101,f_102,f_103,f_104,f_105,f_106,f_107,f_108,f_109,f_110,f_111,f_112,f_113,f_114,f_115,f_116,f_117,f_118,f_119,f_120,f_121,f_122,f_123,f_124,f_125,f_126,f_127,f_128,f_129,f_130,f_131,f_132,f_133,f_134,f_135,f_136,f_137,f_138,f_139,f_140,f_141,f_142,f_143,f_144,f_145,f_146,f_147,f_148,f_149,f_150,f_151,f_152,f_153,f_154,f_155,f_156,f_157,f_158,f_159,f_160,f_161,f_162,f_163,f_164,f_165,f_166,f_167,f_168,f_169,f_170,f_171,f_172,f_173,f_174,f_175,f_176,f_177,f_178,f_179,f_180,f_181,f_182,f_183,f_184,f_185,f_186,f_187,f_188,f_189,f_190,f_191,f_192,f_193,f_194,f_195,f_196,f_197,f_198,f_199,f_200,f_201,f_202,f_203,f_204,f_205,f_206,f_207,f_208,f_209,f_210,f_211,f_212,f_213,f_214,f_215,f_216,f_217,f_218,f_219,f_220,f_221,f_222,f_223,f_224,f_225,f_226,f_227,f_228,f_229,f_230,f_231,f_232,f_233,f_234,f_235,f_236,f_237,f_238,f_239,f_240,f_241,f_242,f_243,f_244,f_245,f_246,f_247,f_248,f_249,f_250,f_251,f_252,f_253,f_254,f_255,f_256,f_257,f_258,f_259,f_260,f_261,f_262,f_263,f_264,f_265,f_266,f_267,f_268,f_269,f_270,f_271,f_272,f_273,f_274,f_275,f_276,f_277,f_278,f_279,f_280,f_281,f_282,f_283,f_284,f_285,f_286,f_287,f_288,f_289,f_290,f_291,f_292,f_293,f_294,f_295,f_296,f_297,f_298,f_299
0,1220_1,1220,1,0.874944,0.457875,0.962572,0.372061,0.004509,0.971304,0.097477,0.24608,0.481052,0.95113,0.968358,0.699345,0.739139,0.066587,0.808991,0.291094,0.410428,0.415464,0.475559,0.46303,0.162172,0.764135,0.988812,0.620314,0.915356,0.810174,0.79399,0.276981,0.77723,0.806242,0.094767,0.254653,0.065229,0.172443,0.42997,0.375311,0.235271,0.979103,0.739211,0.946839,0.328391,0.552147,0.291854,0.475741,0.786556,0.89868,0.115453,0.800245,0.804779,0.185797,0.230276,0.893254,0.318648,0.213987,0.186194,0.681819,0.393373,0.480479,0.473462,0.605556,0.723612,0.774659,0.326204,0.988071,0.69763,0.561397,0.748171,0.08727,0.317911,0.551137,0.733891,0.685182,0.721296,0.84073,0.990324,0.036338,0.453641,0.663457,0.109746,0.978097,0.785883,0.085453,0.101547,0.088554,0.773017,0.671386,0.260844,0.138067,0.209517,0.43256,0.543269,0.710578,0.513228,0.616471,0.400029,0.577039,0.800661,0.340733,0.522114,0.10964,0.915578,0.65428,0.103689,0.485371,0.531522,0.903273,0.265315,0.77729,0.299357,0.813668,0.616994,0.852711,0.652874,0.670269,0.599262,0.955137,0.576315,0.647672,0.96578,0.721828,0.643987,0.688608,0.148123,0.654623,0.400646,0.550776,0.927801,0.351822,0.550095,0.548258,0.565763,0.886405,0.445483,0.635064,0.228078,0.999351,0.132959,0.719205,0.079829,0.896854,0.170177,0.462065,0.06981,0.612618,0.501901,0.275765,0.452534,0.830298,0.097434,0.448382,0.138786,0.306385,0.176685,0.888951,0.296462,0.691869,0.123614,0.048984,0.965639,0.619477,0.144715,0.064928,0.641233,0.089973,0.385225,0.071957,0.437211,0.368989,0.688976,0.150254,0.993027,0.099046,0.892578,0.030713,0.241537,0.794321,0.587304,0.289077,0.154698,0.786947,0.821293,0.122905,0.163158,0.304153,0.246596,0.070908,0.095635,0.554278,0.319731,0.474685,0.850515,0.151222,0.841399,0.00989,0.074472,0.966512,0.273875,0.68707,0.035826,0.525475,0.321969,0.594598,0.079995,0.575756,0.20778,0.455963,0.933001,0.145935,0.660078,0.173596,0.654387,0.47007,0.744501,0.721583,0.336405,0.632004,0.901299,0.448609,0.686336,0.276582,0.495469,0.397506,0.6717
69,0.385539,0.453976,0.037179,0.758213,0.461456,0.774596,0.391214,0.80342,0.562853,0.162382,0.506769,0.79483,0.268479,0.748373,0.044955,0.867946,0.81345,0.816583,0.842692,0.204182,0.790365,0.051641,0.718111,0.299606,0.082191,0.851497,0.690467,0.77498,0.306792,0.317957,0.632447,0.01231,0.94579,0.773103,0.965834,0.390955,0.241573,0.12195,0.638299,0.553705,0.568194,0.843221,0.354727,0.942957,0.373346,0.470993,0.453147,0.185819,0.871748,0.759975,0.406774,0.909238,0.597601,0.442423,0.947923,0.657953,0.082665,0.392314,0.897332,0.961809,0.209763,0.79936,0.93861,0.407447,0.36531,0.190532,0.665701,0.514031,0.828523,0.437697,0.810764,0.693963,0.186403,0.569144,0.120386,0.419603,0.936966
1,1220_2,1220,2,0.554862,0.445478,0.714034,0.891988,0.703331,0.264478,0.600636,0.697096,0.480214,0.145306,0.069449,0.069196,0.601509,0.230276,0.24195,0.461615,0.359256,0.900353,0.638412,0.986265,0.059347,0.86269,0.223547,0.280564,0.418108,0.28895,0.194548,0.825022,0.591619,0.315725,0.747944,0.267245,0.292161,0.451214,0.354558,0.817763,0.773964,0.284626,0.032634,0.794667,0.654899,0.120214,0.919047,0.708701,0.400016,0.254817,0.408806,0.126487,0.001214,0.802471,0.739735,0.637727,0.578299,0.271214,0.38065,0.944815,0.468184,0.950008,0.317426,0.08429,0.716474,0.589799,0.16645,0.000898,0.509908,0.077301,0.429475,0.98244,0.799343,0.487084,0.757396,0.786959,0.537782,0.901183,0.608399,0.683978,0.971382,0.064081,0.548191,0.459819,0.048924,0.783429,0.20354,0.318151,0.25921,0.139392,0.330374,0.280464,0.344154,0.12046,0.832155,0.536912,0.89078,0.402692,0.698926,0.909678,0.74527,0.115225,0.252267,0.30849,0.836069,0.758805,0.959009,0.158451,0.665629,0.767955,0.14797,0.392212,0.016824,0.856039,0.31498,0.541908,0.825064,0.712387,0.68988,0.973258,0.311172,0.359401,0.425084,0.023933,0.890733,0.28989,0.30778,0.753953,0.678548,0.942726,0.682818,0.304026,0.252408,0.091805,0.131907,0.609871,0.640625,0.959626,0.613212,0.000702,0.914079,0.199958,0.234868,0.771187,0.243863,0.654885,0.846969,0.707642,0.518576,0.697802,0.614582,0.104121,0.416389,0.272118,0.542067,0.374173,0.338259,0.874038,0.781823,0.18622,0.919784,0.834826,0.158777,0.483349,0.050627,0.319686,0.986162,0.258741,0.601834,0.084021,0.97558,0.39594,0.941783,0.654708,0.242371,0.373359,0.473007,0.676264,0.140979,0.526257,0.826118,0.918556,0.836233,0.80546,0.40055,0.787823,0.803969,0.621247,0.047932,0.785387,0.780816,0.03926,0.411237,0.67541,0.830683,0.508553,0.714463,0.57085,0.239165,0.463224,0.96042,0.077512,0.516939,0.481268,0.272673,0.071394,0.408668,0.426684,0.512901,0.998265,0.728723,0.765284,0.2792,0.766072,0.479353,0.920972,0.520074,0.985969,0.082177,0.401379,0.391542,0.535378,0.393576,0.416405,0.422227,0.993134,0.609181,0.9823
62,0.940441,0.946577,0.112418,0.911672,0.603004,0.353734,0.415035,0.053207,0.430719,0.330779,0.215438,0.726234,0.002905,0.050879,0.215199,0.031962,0.372145,0.944105,0.279503,0.485574,0.747893,0.056336,0.320315,0.187302,0.342302,0.324092,0.868256,0.842479,0.39651,0.748494,0.73143,0.687466,0.583761,0.264759,0.975597,0.538309,0.170456,0.226513,0.441748,0.715351,0.253279,0.708022,0.596036,0.96322,0.545497,0.882219,0.495478,0.497642,0.397811,0.117196,0.302832,0.187152,0.249617,0.906675,0.404698,0.405573,0.18046,0.160347,0.923655,0.825506,0.577116,0.718669,0.313886,0.728209,0.396429,0.683919,0.620919,0.30154,0.687464,0.400168,0.908198,0.272901,0.22243,0.748324,0.858802,0.362829
2,1221_0,1221,0,0.17507,0.918464,0.044379,0.505868,0.03716,0.169001,0.211365,0.791252,0.73927,0.716251,0.3952,0.54103,0.933998,0.573351,0.849435,0.864232,0.713558,0.943668,0.271508,0.307234,0.331061,0.907405,0.173487,0.46812,0.371292,0.74216,0.367011,0.401412,0.093199,0.124326,0.258757,0.189615,0.296705,0.106573,0.527337,0.969791,0.688373,0.837134,0.726393,0.615015,0.646067,0.824383,0.713499,0.810384,0.247787,0.201922,0.651404,0.649859,0.974864,0.147858,0.673822,0.032087,0.913205,0.116901,0.95866,0.573235,0.907901,0.449704,0.838943,0.724182,0.642036,0.925969,0.561617,0.254233,0.053846,0.484396,0.371277,0.556199,0.699103,0.242123,0.563563,0.561031,0.375473,0.075126,0.680565,0.45025,0.25291,0.561373,0.357813,0.18163,0.570863,0.397596,0.810287,0.762601,0.42687,0.459234,0.804732,0.980578,0.602645,0.503345,0.900728,0.926586,0.137829,0.786825,0.624012,0.295226,0.098282,0.164054,0.330215,0.463152,0.651269,0.194205,0.101522,0.130218,0.738351,0.843158,0.470606,0.270672,0.453131,0.265281,0.827787,0.289531,0.995442,0.57251,0.797331,0.523912,0.525839,0.424539,0.663265,0.216903,0.675285,0.143207,0.419976,0.994607,0.094646,0.674384,0.251875,0.524599,0.998205,0.167782,0.691998,0.579204,0.681346,0.015986,0.228002,0.689566,0.633398,0.167923,0.407675,0.436881,0.227816,0.424478,0.384666,0.542953,0.681949,0.987851,0.898403,0.6662,0.715937,0.45946,0.752568,0.571354,0.149191,0.531775,0.67954,0.9397,0.917867,0.598337,0.297908,0.903345,0.622618,0.914378,0.610801,0.253423,0.798674,0.410668,0.095864,0.690391,0.357999,0.162343,0.017357,0.032159,0.310956,0.58249,0.930457,0.276244,0.03752,0.175832,0.016053,0.754072,0.472121,0.34537,0.380543,0.111594,0.142693,0.694863,0.642411,0.993022,0.858693,0.817972,0.402442,0.250017,0.336858,0.697542,0.229117,0.468357,0.612025,0.368334,0.557258,0.435097,0.639134,0.266842,0.932287,0.480522,0.794831,0.81418,0.3231,0.743717,0.602575,0.089587,0.46677,0.209266,0.198406,0.777109,0.401075,0.055186,0.614584,0.502547,0.856088,0.883401,0.960521,0.888387,0.206417,0.36
5655,0.875711,0.354252,0.377858,0.282718,0.674139,0.256629,0.797542,0.594621,0.734312,0.993158,0.271205,0.899058,0.628644,0.214884,0.867957,0.117706,0.356529,0.104547,0.13887,0.702098,0.632508,0.943359,0.94163,0.214162,0.875826,0.298466,0.314079,0.863828,0.288734,0.156625,0.133006,0.63739,0.714059,0.074468,0.82183,0.052827,0.920128,0.071622,0.62575,0.066291,0.497427,0.390427,0.478386,0.778427,0.688358,0.06032,0.74395,0.75143,0.713456,0.034523,0.677838,0.128523,0.743948,0.90541,0.160801,0.238013,0.463621,0.269969,0.668704,0.664153,0.147217,0.267242,0.590282,0.900359,0.582452,0.465953,0.39771,0.789382,0.238078,0.254068,0.795084,0.491928,0.376725,0.079489,0.995041,0.482283
3,1221_1,1221,1,0.355239,0.689773,0.452643,0.134863,0.794958,0.837197,0.036773,0.713466,0.737016,0.810984,0.002808,0.621522,0.545661,0.686604,0.477196,0.5821,0.391507,0.809941,0.861929,0.355748,0.091225,0.010061,0.102721,0.551932,0.376771,0.438377,0.781497,0.979366,0.845771,0.806906,0.922164,0.56699,0.043254,0.272494,0.075764,0.140332,0.849251,0.252356,0.572041,0.695377,0.536291,0.356062,0.584625,0.603106,0.189332,0.683456,0.484626,0.840583,0.673178,0.917813,0.666469,0.564179,0.196108,0.474049,0.872973,0.807203,0.910177,0.058867,0.305068,0.647225,0.200449,0.450214,0.11062,0.527603,0.604376,0.966088,0.634255,0.571053,0.043567,0.441599,0.176991,0.514841,0.564917,0.856312,0.173674,0.592491,0.399837,0.780205,0.348362,0.314196,0.233215,0.88785,0.480599,0.40638,0.226638,0.983861,0.207749,0.801853,0.609355,0.17383,0.598262,0.942024,0.266292,0.360514,0.75273,0.358106,0.794214,0.630142,0.106938,0.733607,0.830523,0.936358,0.063596,0.220954,0.579884,0.185934,0.738676,0.790451,0.897049,0.966433,0.509442,0.213075,0.676149,0.096877,0.240194,0.648218,0.227571,0.788699,0.040676,0.729396,0.197551,0.907724,0.55788,0.878389,0.504674,0.597467,0.766185,0.184896,0.412504,0.378112,0.827239,0.114647,0.468455,0.010597,0.299336,0.132091,0.089182,0.415325,0.165485,0.370542,0.860467,0.492369,0.753202,0.418627,0.895679,0.367738,0.711473,0.121786,0.585825,0.175189,0.21596,0.852016,0.716914,0.73483,0.760084,0.067234,0.602407,0.647395,0.419864,0.081507,0.703863,0.856977,0.104301,0.934119,0.178385,0.515179,0.396566,0.176804,0.882056,0.559357,0.400732,0.529157,0.725605,0.910405,0.482093,0.101779,0.721761,0.537093,0.648118,0.365187,0.296365,0.886688,0.894906,0.101014,0.978746,0.207387,0.699074,0.807639,0.400147,0.182086,0.03596,0.693126,0.29196,0.347788,0.673762,0.003574,0.977645,0.172107,0.226107,0.882832,0.69085,0.762693,0.854927,0.733893,0.105732,0.283915,0.454428,0.018677,0.563261,0.765661,0.910824,0.469896,0.679691,0.952398,0.819684,0.270514,0.318057,0.978455,0.566888,0.910223,0.499952,0.550827,
0.604932,0.712373,0.209251,0.2646,0.511991,0.277428,0.993648,0.131619,0.897688,0.267064,0.266514,0.349514,0.015048,0.335408,0.730178,0.902669,0.16755,0.026795,0.828605,0.552593,0.577941,0.565046,0.793668,0.70941,0.942733,0.878088,0.521234,0.826444,0.587539,0.136543,0.153734,0.083449,0.536978,0.471129,0.840016,0.099243,0.625962,0.974877,0.427573,0.468903,0.286575,0.321241,0.12763,0.856989,0.630823,0.567562,0.0607,0.641342,0.055998,0.533725,0.653402,0.424693,0.467539,0.166731,0.29838,0.314889,0.023404,0.220415,0.517586,0.515492,0.294602,0.994424,0.817242,0.597223,0.14181,0.31387,0.120187,0.201747,0.893571,0.322879,0.674692,0.11416,0.818483,0.287065,0.710537,0.550434,0.899869,0.928997
4,1221_2,1221,2,0.912778,0.462684,0.454067,0.491009,0.050547,0.250051,0.686295,0.666958,0.359397,0.457957,0.337905,0.164047,0.911366,0.48321,0.439823,0.073116,0.114691,0.279528,0.115223,0.786287,0.055086,0.20244,0.176511,0.181692,0.334614,0.466641,0.064421,0.462835,0.218059,0.716125,0.645232,0.534537,0.111932,0.71871,0.185045,0.327569,0.817488,0.576675,0.36171,0.36926,0.322386,0.584184,0.270985,0.178242,0.348978,0.835184,0.440341,0.208373,0.041951,0.0575,0.709208,0.924921,0.67604,0.857796,0.938463,0.69396,0.974945,0.739172,0.298508,0.504151,0.590602,0.755497,0.474339,0.302517,0.28451,0.237999,0.117581,0.116574,0.509296,0.680959,0.964025,0.248184,0.088566,0.624053,0.977284,0.389786,0.082667,0.103577,0.74883,0.713691,0.295629,0.459462,0.943111,0.494196,0.607418,0.975053,0.448705,0.502703,0.989182,0.947898,0.399888,0.718421,0.456387,0.712919,0.756262,0.719348,0.572912,0.776472,0.02252,0.779723,0.152053,0.268952,0.955641,0.32302,0.415556,0.709192,0.386821,0.794929,0.684921,0.606077,0.31022,0.510706,0.403618,0.293436,0.884362,0.457744,0.783475,0.728955,0.756238,0.300123,0.353831,0.259495,0.266359,0.57338,0.450371,0.903673,0.927309,0.969997,0.920113,0.064838,0.942148,0.402717,0.72241,0.923984,0.806558,0.933843,0.540915,0.761637,0.236847,0.779239,0.153938,0.409059,0.338316,0.01247,0.101099,0.580242,0.209169,0.268754,0.389245,0.931403,0.576958,0.876579,0.894056,0.671356,0.109653,0.026271,0.499621,0.294456,0.436434,0.753091,0.214646,0.036391,0.374914,0.363255,0.160509,0.821415,0.909193,0.658998,0.664143,0.404421,0.945754,0.207608,0.909567,0.930762,0.774099,0.170554,0.918523,0.834796,0.330158,0.820877,0.449642,0.998789,0.527614,0.160504,0.506877,0.381217,0.192588,0.185902,0.359687,0.722125,0.878649,0.712422,0.313058,0.240844,0.029811,0.551878,0.40767,0.583744,0.470947,0.543784,0.068275,0.019369,0.226629,0.11168,0.047379,0.163472,0.972865,0.445587,0.550758,0.501665,0.918697,0.76844,0.9323,0.426325,0.926276,0.215757,0.338656,0.723855,0.722195,0.119111,0.462102,0.549665,0.054828
,0.093251,0.746771,0.066501,0.376723,0.54894,0.715726,0.976165,0.771377,0.117163,0.764202,0.235999,0.574012,0.957145,0.575103,0.26642,0.219094,0.370304,0.191008,0.300847,0.804515,0.867272,0.037295,0.593709,0.576598,0.519398,0.717586,0.499761,0.936182,0.521796,0.366261,0.199075,0.150739,0.065007,0.072348,0.544865,0.115748,0.710037,0.235153,0.244598,0.532465,0.531587,0.817029,0.188395,0.559983,0.179908,0.381821,0.128143,0.392697,0.153277,0.507342,0.260192,0.648909,0.472551,0.647336,0.477583,0.017234,0.468246,0.434878,0.417025,0.916302,0.406285,0.452374,0.989654,0.294616,0.470001,0.652756,0.496342,0.031662,0.703427,0.861476,0.897927,0.659051,0.356148,0.37599,0.209798,0.175153,0.72716


Loading Train file...
Memory usage of dataframe is 3619.03 MB
Memory usage after optimization is: 1815.50 MB
Decreased by 49.8%


Unnamed: 0,time_id,investment_id,target,f_0,f_1,f_2,f_3,f_4,f_5,f_6,f_7,f_8,f_9,f_10,f_11,f_12,f_13,f_14,f_15,f_16,f_17,f_18,f_19,f_20,f_21,f_22,f_23,f_24,f_25,f_26,f_27,f_28,f_29,f_30,f_31,f_32,f_33,f_34,f_35,f_36,f_37,f_38,f_39,f_40,f_41,f_42,f_43,f_44,f_45,f_46,f_47,f_48,f_49,f_50,f_51,f_52,f_53,f_54,f_55,f_56,f_57,f_58,f_59,f_60,f_61,f_62,f_63,f_64,f_65,f_66,f_67,f_68,f_69,f_70,f_71,f_72,f_73,f_74,f_75,f_76,f_77,f_78,f_79,f_80,f_81,f_82,f_83,f_84,f_85,f_86,f_87,f_88,f_89,f_90,f_91,f_92,f_93,f_94,f_95,f_96,f_97,f_98,f_99,f_100,f_101,f_102,f_103,f_104,f_105,f_106,f_107,f_108,f_109,f_110,f_111,f_112,f_113,f_114,f_115,f_116,f_117,f_118,f_119,f_120,f_121,f_122,f_123,f_124,f_125,f_126,f_127,f_128,f_129,f_130,f_131,f_132,f_133,f_134,f_135,f_136,f_137,f_138,f_139,f_140,f_141,f_142,f_143,f_144,f_145,f_146,f_147,f_148,f_149,f_150,f_151,f_152,f_153,f_154,f_155,f_156,f_157,f_158,f_159,f_160,f_161,f_162,f_163,f_164,f_165,f_166,f_167,f_168,f_169,f_170,f_171,f_172,f_173,f_174,f_175,f_176,f_177,f_178,f_179,f_180,f_181,f_182,f_183,f_184,f_185,f_186,f_187,f_188,f_189,f_190,f_191,f_192,f_193,f_194,f_195,f_196,f_197,f_198,f_199,f_200,f_201,f_202,f_203,f_204,f_205,f_206,f_207,f_208,f_209,f_210,f_211,f_212,f_213,f_214,f_215,f_216,f_217,f_218,f_219,f_220,f_221,f_222,f_223,f_224,f_225,f_226,f_227,f_228,f_229,f_230,f_231,f_232,f_233,f_234,f_235,f_236,f_237,f_238,f_239,f_240,f_241,f_242,f_243,f_244,f_245,f_246,f_247,f_248,f_249,f_250,f_251,f_252,f_253,f_254,f_255,f_256,f_257,f_258,f_259,f_260,f_261,f_262,f_263,f_264,f_265,f_266,f_267,f_268,f_269,f_270,f_271,f_272,f_273,f_274,f_275,f_276,f_277,f_278,f_279,f_280,f_281,f_282,f_283,f_284,f_285,f_286,f_287,f_288,f_289,f_290,f_291,f_292,f_293,f_294,f_295,f_296,f_297,f_298,f_299
0,0.0,1.0,-0.300781,0.932617,0.113708,-0.4021,0.378418,-0.203979,-0.413574,0.96582,1.230469,0.114807,-2.013672,0.004936,0.28418,0.501953,-0.287842,-1.168945,-0.267334,-0.574219,-0.771973,1.012695,-1.230469,1.786133,-2.089844,0.325684,-0.87793,1.048828,0.131714,-0.349609,-1.813477,0.099243,-0.240967,1.604492,0.003637,-0.901855,0.221558,0.609863,-0.73877,2.097656,-0.914062,-0.293945,-0.037994,0.685547,0.0,0.414795,-0.469482,-1.085938,-0.106445,0.059448,0.483154,1.189453,0.506836,0.754395,0.317627,-0.183228,5.164062,0.677246,-0.440674,0.631348,-1.845703,0.227783,0.841309,0.66748,-0.854004,-0.17041,-0.11969,-0.504883,0.662598,1.933594,-0.8125,0.072815,-0.778809,-0.553711,-0.032776,-0.619141,-1.424805,0.148315,0.257812,0.735352,0.563965,-0.272217,1.19043,-0.101379,1.333984,0.191284,0.630859,1.010742,0.161865,0.609375,-0.219482,-0.013069,1.505859,-1.319336,0.448242,-0.635254,-0.075378,1.033203,-0.664062,0.139893,0.186279,0.593262,-0.301514,0.666504,0.713379,1.020508,0.879883,-1.09668,-0.21106,-0.117493,-0.778809,0.065979,0.229736,0.435303,1.233398,-0.865723,0.062347,0.382324,-1.31543,0.786621,0.770508,-0.871094,0.583496,0.115601,0.209595,0.325439,0.469238,0.0,-0.731445,-0.249512,-0.050568,-1.232422,-0.790527,0.493408,0.35791,-0.381592,0.176392,0.748047,-0.741699,0.089661,1.080078,1.137695,1.199219,0.030609,-0.356201,0.247803,1.395508,0.961914,0.078125,-1.163086,0.70752,0.256104,-0.026306,0.329102,0.196045,0.65332,0.069214,0.907715,-0.350586,-1.170898,0.65918,0.9375,0.48291,-0.09491,0.317383,0.126831,0.89209,-1.199219,-0.31543,0.704102,-0.0177,-0.513184,-0.362549,1.0,2.265625,0.360107,0.054474,1.639648,-1.0,0.876953,0.368164,0.991211,-1.224609,-1.208984,-0.879883,1.0,0.035156,0.693359,0.307129,0.143799,0.728027,1.220703,-0.939941,-0.106934,0.0,-0.569336,0.187866,-0.386475,-0.452393,0.269775,-0.56543,-0.262207,-1.473633,0.0,0.428223,1.740234,0.941406,-0.72998,-0.533203,-0.983398,-0.043152,-0.225952,-0.008301,-0.447998,0.55127,-0.153076,-2.292969,0.186646,-0.443115,0.121216,
0.787598,1.996094,-1.286133,-0.157227,1.019531,0.693359,0.797363,-0.192627,0.222778,0.921387,-0.171387,0.021652,1.15332,0.689941,3.251953,0.992188,-0.779785,-0.546387,-0.37915,1.896484,-0.732422,-0.11377,1.12793,-0.007927,0.122314,0.44458,0.48584,-2.302734,0.392822,0.0,-0.779297,-0.893555,0.055939,0.201416,-0.338135,1.27832,1.367188,0.525391,-0.055664,0.145264,0.346924,-0.824219,-1.306641,-1.158203,0.709473,-0.031891,-1.020508,-1.291016,0.038666,0.187134,-0.680176,0.900391,-0.924805,-1.057617,-0.167114,0.0,1.28125,0.258789,-0.237915,-0.742188,-0.324707,0.992676,0.961426,-0.025604,-0.00626,0.473633,0.040131,0.453613,-1.597656,0.301758,0.157471,0.416748,1.505859,0.365967,-1.095703,0.200073,0.819336,0.941406,-0.086792,-1.086914,-1.044922,-0.287598,0.321533
1,0.0,2.0,-0.231079,0.811035,-0.51416,0.742188,-0.616699,-0.194214,1.771484,1.427734,1.133789,0.114807,-0.219238,-0.351807,0.84668,0.440186,0.499756,0.893066,-0.010216,-0.681641,1.253906,-1.027344,-1.69043,0.011154,0.875488,0.325684,-0.458252,-1.797852,-0.300293,0.584961,0.55127,0.806641,1.235352,-0.984863,-1.084961,3.162109,0.21106,-2.65625,-0.177002,0.486572,1.237305,-0.44751,-0.403564,-0.769531,1.0,-0.516602,-1.307617,-0.092407,0.971191,-0.069336,-0.963379,-0.84082,0.438965,0.317139,0.13855,-1.167969,0.082336,1.05957,-0.440674,0.631348,0.495117,1.163086,0.453369,0.631836,-0.651855,-0.17041,-0.11969,0.186157,-0.29248,-0.549805,-1.629883,0.902832,0.509766,0.377441,0.052094,-0.763184,-1.307617,0.148315,0.777832,-0.383301,-0.099487,-0.119995,1.466797,-0.255371,0.136353,0.191284,-0.404541,-1.220703,-1.442383,1.088867,-0.479248,0.476318,-1.238281,0.13916,-1.238281,0.277344,0.925781,-0.666016,-0.496582,-1.344727,-0.51416,-0.081726,-0.301514,-0.918945,-0.051697,1.020508,0.746582,0.911621,-0.343994,-0.948242,-0.778809,0.065979,-0.22998,-0.153564,-0.722168,-0.947266,1.321289,-0.075256,0.99707,-0.137695,0.724121,-0.722168,0.541992,0.730469,0.478027,-0.662109,0.605957,0.0,0.280518,0.781738,-0.140503,0.324951,0.540527,-0.686523,0.388916,-1.551758,-0.662109,0.312256,-1.089844,0.530762,-0.730469,-0.878906,-1.139648,-1.336914,0.804688,0.247803,-1.292969,-0.892578,0.078125,0.023346,-0.957031,-0.042419,-0.195312,0.329102,-0.181152,0.65332,0.069214,-0.818848,0.308838,0.894531,0.01049,0.904297,1.197266,1.052734,0.915039,-1.083984,-0.541992,-0.898926,-0.043518,-0.375732,0.167969,0.552246,0.772949,1.0,-1.25,0.409912,-0.695312,1.639648,-1.0,0.876953,-1.523438,-0.526855,-0.071045,-0.404785,0.269531,1.0,0.035156,-0.309326,-1.067383,1.087891,-1.145508,-0.02533,-0.398438,-1.173828,0.427002,0.043945,0.510742,1.408203,-0.71875,2.076172,-0.507812,0.942383,1.02832,0.0,1.050781,-1.009766,0.480713,-1.363281,-0.358398,0.0849,-0.012634,-1.496094,-1.260742,-0.452148,-0.253418,-1.107422,0.492188,0.7
27051,0.400635,-2.302734,1.443359,-0.231445,0.777344,1.995117,-0.59375,0.737793,-0.841797,-0.191528,0.222778,0.872559,0.611328,-0.113159,1.15332,0.866211,-0.269775,-0.078003,-0.332764,-0.546387,-0.678711,-0.434082,-0.584473,0.332031,-0.646973,-0.176514,0.122314,-0.068176,-0.868164,0.844727,0.863281,1.179688,-0.049469,0.484863,-0.050537,-0.491943,-0.164429,0.133667,-0.952637,-0.387451,0.090637,-0.811035,-0.821289,-0.546875,-0.067871,-0.76709,-0.015457,-0.158325,0.980469,0.799316,0.79834,-0.633301,0.779785,0.171265,1.166016,0.59082,0.11853,0.0,-0.650879,0.852051,0.086182,1.135742,0.299072,-1.583008,-0.481934,0.532227,0.226685,-0.894531,-0.514648,-1.0,0.884277,-0.557617,-0.875488,-0.156128,0.537109,-0.154175,0.912598,-0.734375,0.819336,0.941406,-0.387695,-1.086914,-0.929688,-0.974121,-0.343506
2,0.0,6.0,0.568848,0.394043,0.615723,0.567871,-0.60791,0.068909,-1.083008,0.979492,-1.125977,0.114807,-1.035156,0.465088,0.150879,-0.044006,0.091248,-1.168945,-0.451904,-0.467285,0.095276,1.140625,-0.16687,-0.007294,-0.449463,0.325684,-0.682617,0.016266,0.026123,-0.547363,0.55127,-0.261475,-0.169678,0.857422,-0.09845,-0.860352,0.180176,0.609863,0.524902,-0.400391,0.751465,-0.287598,0.568359,0.829102,0.0,-0.253174,-0.235474,0.500977,-0.655762,-0.750977,0.664062,1.189453,1.087891,0.859375,-0.133545,-0.183228,0.082336,-0.060181,-0.440674,0.631348,-0.026169,0.015625,-0.855957,1.052734,-0.526855,-0.17041,-0.11969,0.038177,0.309814,-0.549805,1.638672,-0.476562,-0.90918,-0.544922,-0.546387,0.163452,1.748047,0.148315,0.365234,0.342773,-0.813965,-0.046417,-0.484863,-0.270264,0.136353,-1.441406,-0.079163,-0.530762,0.130981,0.221558,-0.228882,0.700195,0.023468,0.269287,0.039825,-0.963867,-0.790039,0.693359,-0.59375,0.295166,-0.096008,0.447754,-0.301514,1.039062,-0.291748,1.020508,0.529297,-1.09668,0.150757,-0.074646,1.254883,0.065979,0.869141,0.518066,0.494385,-0.02858,-0.478271,-0.733887,0.200806,-0.174561,-0.255127,0.558594,0.586426,-2.177734,-0.765137,0.200317,0.346436,0.0,-0.065796,-0.29834,-0.040955,-0.875977,-0.625,1.005859,-0.471924,0.788574,-0.547363,-0.039612,-0.885254,-0.161743,0.186157,1.137695,0.052643,0.323242,1.15625,0.247803,0.859375,0.873047,0.078125,-0.250977,-0.418213,0.927246,0.648438,0.329102,0.015572,0.65332,0.069214,0.907715,-0.642578,-1.170898,-0.100586,0.122498,-0.247559,0.694336,-0.167358,1.0625,0.718262,-0.844238,-0.105347,0.166626,-0.375732,-0.513184,-0.393555,1.0,0.596191,-0.446289,-0.115051,-0.709961,-1.0,-1.431641,-0.577637,-0.418457,-0.515137,-0.307617,-0.283691,1.0,0.035156,-0.393799,0.288086,0.366455,0.103333,-0.098328,0.133911,0.21228,0.384521,0.501465,-0.339355,0.010094,-0.007168,-1.117188,-0.564941,0.672852,-0.775879,0.0,-0.070007,0.883301,0.579102,0.942871,-0.793457,-0.955078,0.131836,-0.546875,0.905273,-0.452148,0.675293,-0.036041,-1.16992
2,-0.167603,-0.274414,0.114014,0.10321,0.071045,-1.286133,-0.407959,0.137207,-0.399414,0.335693,-0.149292,0.222778,0.156128,-0.171387,0.258301,1.15332,-0.964355,-0.269775,-0.654297,0.180542,-1.220703,0.45752,-0.461182,-0.976562,0.147339,0.060364,-0.271729,0.122314,1.450195,1.163086,0.402588,-0.101135,0.0,0.019119,0.523438,-0.005413,-0.092407,-0.001884,0.259277,0.507324,0.202515,-0.37085,0.828125,0.25708,0.027908,-0.662598,1.066406,-0.52832,0.189453,-1.020508,0.169678,-0.911133,-0.222046,0.536621,-0.161743,-0.114319,0.43335,-0.207153,0.0,0.098938,-0.725098,-0.388184,0.062622,0.260254,0.980957,0.899414,-0.31543,0.150146,0.245605,-1.429688,-1.0,-0.033508,-0.147095,-0.087524,0.09845,-0.528809,-0.138062,0.912598,-0.551758,-1.220703,-1.060547,-0.219116,-1.086914,-0.612305,-0.113953,0.243652
3,0.0,7.0,-1.064453,-2.34375,-0.011871,1.875,-0.606445,-0.586914,-0.815918,0.77832,0.299072,0.114807,-1.176758,0.30127,-0.015671,-0.65625,-0.150879,-1.168945,-1.12207,-0.681641,2.921875,1.179688,0.364014,0.365723,-1.478516,0.325684,0.955566,-0.105042,-0.588867,0.649902,-1.813477,-1.421875,1.526367,-0.054657,-0.345459,0.259277,0.124939,-0.47876,-0.457764,-0.072266,0.577637,-0.266113,-0.699707,-0.306152,0.0,-0.680664,-1.658203,1.000977,-0.361084,-1.085938,-1.008789,1.189453,-1.285156,-1.00293,-0.512695,-0.248047,0.082336,-0.523926,-0.440674,-1.583984,-1.106445,-1.330078,-0.834961,0.544434,0.098022,-0.17041,-0.11969,-0.786133,0.464844,-0.549805,-0.831055,-0.653809,-0.940918,-0.424805,-0.41333,1.552734,-0.490479,0.148315,0.973145,1.689453,-0.339355,-0.110779,-0.607422,-0.52832,1.333984,-0.625,0.363037,0.70459,-1.298828,-0.821289,-0.659668,1.354492,-0.819824,-1.084961,0.057983,-0.514648,0.664551,0.183716,1.689453,-2.169922,-0.973633,-0.181396,-0.301514,-0.918945,-1.126953,-0.980469,1.055664,-1.09668,-1.319336,-1.138672,-0.778809,0.065979,0.476807,-0.751465,-1.316406,-0.743652,-0.62793,0.326416,0.838379,-1.037109,-0.126465,-0.462402,0.656738,-0.275879,-0.213379,-4.339844,-1.129883,0.0,0.814941,1.477539,-0.321289,-0.170044,0.584473,0.937012,-0.263428,-1.551758,-1.373047,-1.479492,-1.654297,-0.632812,-0.716309,-0.878906,-0.921875,-0.945801,1.65625,0.247803,-1.026367,-0.593262,0.078125,-0.492188,-1.001953,-1.634766,-0.667969,0.329102,-0.092896,-1.530273,0.069214,-0.818848,-0.638672,-1.170898,-1.87207,-0.772949,-0.450928,-0.500977,-0.847168,-0.526855,-1.0625,0.87793,-0.075806,-0.375732,0.736328,-0.513184,1.615234,1.0,-2.492188,-0.615234,-1.108398,0.117249,-1.0,0.876953,-0.577637,-0.743652,-0.147461,1.013672,-1.297852,1.0,0.035187,-0.4021,-0.655762,-0.615234,-1.145508,-0.62793,-0.152344,-1.62793,0.0,0.092651,-0.732422,-0.189575,-2.15625,-1.526367,-0.564941,0.869141,-1.160156,0.0,-0.195068,-0.347168,-1.09668,-0.388672,1.426758,0.249634,-1.492188,0.243286,0.652344,-0.45166,0.545
41,-1.585938,-1.117188,-0.63623,0.738281,-0.87793,-1.006836,-0.470947,-1.286133,0.137573,0.0401,1.080078,-0.867188,-0.168701,0.222778,-1.354492,0.219971,-0.830566,-0.897949,-0.226685,-0.261719,0.137817,-1.24707,-0.209229,-0.476807,1.494141,0.187256,-0.150513,-0.377686,-0.250244,0.122314,1.075195,-0.868164,-1.424805,-0.616211,0.0,-1.522461,0.403076,-0.014435,0.020172,-0.431396,-1.279297,0.835938,-1.455078,-0.438477,-0.561523,-1.1875,1.179688,-1.575195,-1.43457,0.084229,-0.836426,-1.020508,1.272461,-0.667969,-1.452148,1.168945,-1.025391,-0.924805,1.013672,-0.324463,0.0,-0.817871,-0.624023,0.012917,0.599121,-1.795898,-1.84375,2.927734,-0.640625,2.324219,-0.666504,-0.049957,-1.0,-0.172485,-0.557617,-0.986816,-0.744629,0.237793,0.38208,0.912598,-0.266357,-1.220703,0.941406,-0.608887,0.104919,-0.783203,1.151367,-0.773438
4,0.0,8.0,-0.531738,0.842285,-0.262939,2.330078,-0.583496,-0.618164,-0.742676,-0.946777,1.230469,0.114807,-0.005859,0.498779,-0.235474,-0.17334,0.106506,-0.138062,-0.829102,-0.826172,4.070312,0.148315,0.269531,-0.046692,0.194336,0.325684,1.933594,-1.120117,-0.585449,0.535645,0.55127,-0.770996,0.216187,0.022415,-0.924316,0.19812,0.232422,-1.567383,-0.317383,-1.020508,0.079224,-0.355225,-0.709961,-0.278076,-2.0,-0.327881,0.957031,-0.331787,-0.538086,-0.212158,-0.999512,-0.84082,-1.991211,-1.635742,-1.121094,-0.183228,0.082336,-0.94043,-0.440674,-1.583984,0.059174,-1.172852,-0.605469,-0.138306,0.668945,-0.17041,-0.11969,-0.90625,-1.241211,-0.549805,-0.8125,-0.696289,-0.410889,-0.783203,-0.695801,1.394531,-1.424805,0.148315,0.677246,1.110352,-0.384277,-0.089661,-0.80127,-0.934082,0.136353,-1.712891,0.758301,0.370605,-1.555664,-1.160156,-0.699219,0.644043,-0.774902,-1.143555,-0.107422,0.00943,0.768555,-0.835938,1.977539,0.378418,-1.108398,-0.651367,-0.301514,-0.918945,-0.960449,-0.980469,-0.484131,-1.09668,0.914551,-1.578125,1.254883,0.065979,0.779785,-0.684082,-1.149414,-0.381104,-1.0,-0.27124,1.0,-1.216797,-0.800781,-0.421631,0.497803,-1.394531,-0.467041,-0.208984,-1.168945,0.0,0.73291,2.537109,-0.015411,0.255859,1.038086,0.279053,-1.011719,0.788574,-0.682617,-1.686523,-0.496826,-0.74707,-0.498779,-0.878906,-0.773438,-1.15625,-0.006191,0.247803,-0.749512,-0.875,0.078125,-1.523438,-0.912109,-1.753906,0.334961,0.329102,0.801758,-1.530273,0.069214,-0.490723,-0.573242,-0.137939,-1.772461,-1.542969,-1.138672,-0.739746,-1.0,0.8125,-0.588867,1.361328,-0.043549,0.166626,-1.019531,-2.628906,5.019531,1.0,-0.414551,-0.568848,-1.254883,-0.709961,-1.0,0.876953,-0.577637,1.533203,0.0,1.209961,0.549805,1.0,0.035187,-0.658203,-1.384766,-0.275146,-0.833496,-0.733398,-1.458984,-2.023438,-1.419922,0.400391,-0.786133,0.344482,0.666016,0.11908,-0.558105,0.88916,0.612793,0.0,-0.114563,-0.347168,-1.22168,-0.553711,1.799805,0.91748,-1.271484,0.802246,-0.346924,-0.452148,-1.831055,-1.664062,-0
.095825,-0.895508,0.231812,-1.511719,-1.117188,-0.81543,-1.286133,-0.921387,-0.638184,0.615234,0.34668,-0.211792,0.222778,-1.454102,-0.171387,-0.874023,-0.897949,0.192017,-0.269775,-0.185913,-0.077209,-1.204102,0.365234,-0.468018,0.760254,-2.261719,-1.264648,-0.629883,0.122314,1.214844,-0.868164,1.074219,-0.88623,0.0,-1.506836,1.635742,-0.050537,-0.775391,-0.499512,-1.524414,-0.461426,-1.363281,-0.683594,-0.660645,-0.821289,0.109375,0.275146,0.792969,-1.657227,-0.875,0.980469,0.778809,-0.916504,-0.556152,0.925781,-1.507812,1.166016,0.941406,-0.501465,0.0,-1.333008,-0.767578,-0.237915,0.330811,-1.464844,-0.585449,-1.314453,-0.78125,-1.918945,-0.438721,-1.576172,-1.226562,1.067383,-0.519043,-1.22168,-0.768555,-0.724121,-0.17041,0.912598,-0.741211,-1.220703,0.941406,-0.588379,0.104919,0.753418,1.345703,-0.737793


CPU times: user 1min 28s, sys: 2min 1s, total: 3min 29s
Wall time: 3min 50s


## Dealing with Multicollinearity
### Remove highly correlated features using VIF

In [4]:
### Important! ###
## Running the VIF calculation on the full training set failed with an 'Out of memory' error in the Kaggle kernel.
## I calculated the VIF separately in a Google Colab notebook, where the run did finish.
## The calculate_vif() method identified 44 columns to be dropped:
## ['f_148', 'f_95', 'f_277', 'f_61', 'f_173', 'f_72', 'f_206', 'f_254', 'f_97', 'f_273', 'f_262', 'f_180', 'f_51', 'f_54', 'f_214', 'f_203', 'f_106', 'f_134', 'f_228', 'f_28', 'f_255', 'f_247', 'f_280', 'f_136', 'f_164', 'f_4', 'f_205', 'f_186', 'f_193', 'f_15', 'f_212', 'f_161', 'f_157', 'f_146', 'f_274', 'f_240', 'f_211', 'f_3', 'f_158', 'f_41', 'f_288', 'f_207', 'f_245', 'f_226']

# Get a list of all the features first and the target
# Feature columns are named f_0 ... f_299 (300 names in total).
features = [f"f_{i}" for i in range(300)]
target = 'target'

# Generate a df with only features
# Selects just the feature columns of `train`; the displayed shape is (rows, 300).
df_features = train.loc[:, features]
display(df_features.shape)

### Important! ###
## The earlier per-feature LinearRegression version copied the whole
## (rows x other-features) matrix once per feature and ran out of memory.
## This version only ever materialises one chunk of rows at a time.
# Calculate VIF
def calculate_vif(df, features, chunk_size=100_000):
    """Compute the variance inflation factor (VIF) and tolerance of each feature.

    For feature j, R2_j is the coefficient of determination of an ordinary
    least-squares regression (with intercept) of feature j on all the other
    features; ``Tolerance = 1 - R2_j`` and ``VIF = 1 / Tolerance``.

    Instead of fitting one regression per feature on the raw data, the
    feature correlation matrix is accumulated over row chunks (in float64,
    two passes: means, then centred cross-products). Each R2_j is then
    obtained by solving the small least-squares problem on that matrix,
    which yields the same R2 as the regression on the raw rows.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame containing the feature columns. Missing values are not handled.
    features : sequence of str
        Column names to analyse.
    chunk_size : int, default 100_000
        Number of rows converted to float64 at a time; bounds peak memory.

    Returns
    -------
    pandas.DataFrame
        Indexed by feature name with columns ``'VIF'`` and ``'Tolerance'``.
        A perfectly collinear feature gets tolerance 0 and VIF ``inf``;
        a zero-variance feature (or an empty frame) gets NaN for both.

    Raises
    ------
    ValueError
        If ``chunk_size`` is smaller than 1.
    """
    if chunk_size < 1:
        raise ValueError('chunk_size must be a positive integer')

    features = list(features)
    n_features = len(features)
    n_rows = len(df)

    def _row_chunks():
        # Slice rows first, then select columns, so only one chunk is copied
        # and upcast to float64 at any time.
        for start in range(0, n_rows, chunk_size):
            yield df.iloc[start:start + chunk_size][features].to_numpy(dtype=np.float64)

    # Pass 1: column means.
    col_sum = np.zeros(n_features)
    for block in _row_chunks():
        col_sum += block.sum(axis=0)
    means = col_sum / n_rows if n_rows else col_sum

    # Pass 2: centred cross-product (scatter) matrix; centring first keeps
    # the accumulation numerically stable.
    scatter = np.zeros((n_features, n_features))
    for block in _row_chunks():
        centred = block - means
        scatter += centred.T @ centred

    std = np.sqrt(np.diag(scatter))
    # Zero-variance columns are scaled by 1 so they become all-zero rows/cols
    # rather than NaN; they contribute nothing as predictors.
    scale = np.where(std > 0, std, 1.0)
    corr = scatter / np.outer(scale, scale)

    tolerance = np.full(n_features, np.nan)
    positions = np.arange(n_features)
    for j in positions:
        if not std[j] > 0:
            continue  # R2 is undefined for a constant target
        others = positions[positions != j]
        if others.size:
            cross = corr[others, j]
            # lstsq (minimum-norm) stays well defined even when the other
            # features are collinear among themselves.
            coef = np.linalg.lstsq(corr[np.ix_(others, others)], cross, rcond=None)[0]
            r2 = float(cross @ coef)
        else:
            r2 = 0.0
        # Clamp tiny negative values caused by rounding when R2 is ~1.
        tolerance[j] = max(1.0 - r2, 0.0)

    vif = np.full(n_features, np.nan)
    positive = tolerance > 0
    vif[positive] = 1.0 / tolerance[positive]
    vif[tolerance == 0] = np.inf

    return pd.DataFrame({'VIF': vif, 'Tolerance': tolerance}, index=features)

# Kept for reference: how the list below was derived from the VIF table
# (features whose VIF exceeds the multicollinearity threshold of 5).
#
# dfx = calculate_vif(df_features, features)
# mc_threshold = 5
# drop_columns = {feature for feature in features if dfx.loc[feature].VIF > mc_threshold}

# Hard-coded result of the derivation above
drop_columns = [
    'f_148', 'f_95', 'f_277', 'f_61', 'f_173', 'f_72', 'f_206', 'f_254',
    'f_97', 'f_273', 'f_262', 'f_180', 'f_51', 'f_54', 'f_214', 'f_203',
    'f_106', 'f_134', 'f_228', 'f_28', 'f_255', 'f_247', 'f_280', 'f_136',
    'f_164', 'f_4', 'f_205', 'f_186', 'f_193', 'f_15', 'f_212', 'f_161',
    'f_157', 'f_146', 'f_274', 'f_240', 'f_211', 'f_3', 'f_158', 'f_41',
    'f_288', 'f_207', 'f_245', 'f_226',
]
df_features = df_features.drop(drop_columns, axis=1)
print(f'Columns drop size : {len(drop_columns)}')
display(df_features.head())

(3141410, 300)

Columns drop size : 44


Unnamed: 0,f_0,f_1,f_2,f_5,f_6,f_7,f_8,f_9,f_10,f_11,f_12,f_13,f_14,f_16,f_17,f_18,f_19,f_20,f_21,f_22,f_23,f_24,f_25,f_26,f_27,f_29,f_30,f_31,f_32,f_33,f_34,f_35,f_36,f_37,f_38,f_39,f_40,f_42,f_43,f_44,f_45,f_46,f_47,f_48,f_49,f_50,f_52,f_53,f_55,f_56,f_57,f_58,f_59,f_60,f_62,f_63,f_64,f_65,f_66,f_67,f_68,f_69,f_70,f_71,f_73,f_74,f_75,f_76,f_77,f_78,f_79,f_80,f_81,f_82,f_83,f_84,f_85,f_86,f_87,f_88,f_89,f_90,f_91,f_92,f_93,f_94,f_96,f_98,f_99,f_100,f_101,f_102,f_103,f_104,f_105,f_107,f_108,f_109,f_110,f_111,f_112,f_113,f_114,f_115,f_116,f_117,f_118,f_119,f_120,f_121,f_122,f_123,f_124,f_125,f_126,f_127,f_128,f_129,f_130,f_131,f_132,f_133,f_135,f_137,f_138,f_139,f_140,f_141,f_142,f_143,f_144,f_145,f_147,f_149,f_150,f_151,f_152,f_153,f_154,f_155,f_156,f_159,f_160,f_162,f_163,f_165,f_166,f_167,f_168,f_169,f_170,f_171,f_172,f_174,f_175,f_176,f_177,f_178,f_179,f_181,f_182,f_183,f_184,f_185,f_187,f_188,f_189,f_190,f_191,f_192,f_194,f_195,f_196,f_197,f_198,f_199,f_200,f_201,f_202,f_204,f_208,f_209,f_210,f_213,f_215,f_216,f_217,f_218,f_219,f_220,f_221,f_222,f_223,f_224,f_225,f_227,f_229,f_230,f_231,f_232,f_233,f_234,f_235,f_236,f_237,f_238,f_239,f_241,f_242,f_243,f_244,f_246,f_248,f_249,f_250,f_251,f_252,f_253,f_256,f_257,f_258,f_259,f_260,f_261,f_263,f_264,f_265,f_266,f_267,f_268,f_269,f_270,f_271,f_272,f_275,f_276,f_278,f_279,f_281,f_282,f_283,f_284,f_285,f_286,f_287,f_289,f_290,f_291,f_292,f_293,f_294,f_295,f_296,f_297,f_298,f_299
0,0.932617,0.113708,-0.4021,-0.413574,0.96582,1.230469,0.114807,-2.013672,0.004936,0.28418,0.501953,-0.287842,-1.168945,-0.574219,-0.771973,1.012695,-1.230469,1.786133,-2.089844,0.325684,-0.87793,1.048828,0.131714,-0.349609,-1.813477,-0.240967,1.604492,0.003637,-0.901855,0.221558,0.609863,-0.73877,2.097656,-0.914062,-0.293945,-0.037994,0.685547,0.414795,-0.469482,-1.085938,-0.106445,0.059448,0.483154,1.189453,0.506836,0.754395,-0.183228,5.164062,-0.440674,0.631348,-1.845703,0.227783,0.841309,0.66748,-0.17041,-0.11969,-0.504883,0.662598,1.933594,-0.8125,0.072815,-0.778809,-0.553711,-0.032776,-1.424805,0.148315,0.257812,0.735352,0.563965,-0.272217,1.19043,-0.101379,1.333984,0.191284,0.630859,1.010742,0.161865,0.609375,-0.219482,-0.013069,1.505859,-1.319336,0.448242,-0.635254,-0.075378,1.033203,0.139893,0.593262,-0.301514,0.666504,0.713379,1.020508,0.879883,-1.09668,-0.21106,-0.778809,0.065979,0.229736,0.435303,1.233398,-0.865723,0.062347,0.382324,-1.31543,0.786621,0.770508,-0.871094,0.583496,0.115601,0.209595,0.325439,0.469238,0.0,-0.731445,-0.249512,-0.050568,-1.232422,-0.790527,0.493408,0.35791,-0.381592,0.176392,-0.741699,1.080078,1.137695,1.199219,0.030609,-0.356201,0.247803,1.395508,0.961914,0.078125,0.70752,-0.026306,0.329102,0.196045,0.65332,0.069214,0.907715,-0.350586,-1.170898,0.48291,-0.09491,0.126831,0.89209,-0.31543,0.704102,-0.0177,-0.513184,-0.362549,1.0,2.265625,0.360107,1.639648,-1.0,0.876953,0.368164,0.991211,-1.224609,-0.879883,1.0,0.035156,0.693359,0.307129,0.728027,1.220703,-0.939941,-0.106934,0.0,-0.569336,-0.386475,-0.452393,0.269775,-0.56543,-0.262207,-1.473633,0.0,0.428223,1.740234,-0.72998,-0.225952,-0.008301,-0.447998,-2.292969,-0.443115,0.121216,0.787598,1.996094,-1.286133,-0.157227,1.019531,0.693359,0.797363,-0.192627,0.222778,-0.171387,1.15332,0.689941,3.251953,0.992188,-0.779785,-0.546387,-0.37915,1.896484,-0.732422,-0.11377,1.12793,0.122314,0.44458,0.48584,-2.302734,0.0,-0.893555,0.055939,0.201416,-0.338135,1.27832,1.367188,0.145264,0.34
6924,-0.824219,-1.306641,-1.158203,0.709473,-1.020508,-1.291016,0.038666,0.187134,-0.680176,0.900391,-0.924805,-1.057617,-0.167114,0.0,-0.237915,-0.742188,0.992676,0.961426,-0.00626,0.473633,0.040131,0.453613,-1.597656,0.301758,0.157471,1.505859,0.365967,-1.095703,0.200073,0.819336,0.941406,-0.086792,-1.086914,-1.044922,-0.287598,0.321533
1,0.811035,-0.51416,0.742188,1.771484,1.427734,1.133789,0.114807,-0.219238,-0.351807,0.84668,0.440186,0.499756,0.893066,-0.681641,1.253906,-1.027344,-1.69043,0.011154,0.875488,0.325684,-0.458252,-1.797852,-0.300293,0.584961,0.55127,1.235352,-0.984863,-1.084961,3.162109,0.21106,-2.65625,-0.177002,0.486572,1.237305,-0.44751,-0.403564,-0.769531,-0.516602,-1.307617,-0.092407,0.971191,-0.069336,-0.963379,-0.84082,0.438965,0.317139,-1.167969,0.082336,-0.440674,0.631348,0.495117,1.163086,0.453369,0.631836,-0.17041,-0.11969,0.186157,-0.29248,-0.549805,-1.629883,0.902832,0.509766,0.377441,0.052094,-1.307617,0.148315,0.777832,-0.383301,-0.099487,-0.119995,1.466797,-0.255371,0.136353,0.191284,-0.404541,-1.220703,-1.442383,1.088867,-0.479248,0.476318,-1.238281,0.13916,-1.238281,0.277344,0.925781,-0.666016,-1.344727,-0.081726,-0.301514,-0.918945,-0.051697,1.020508,0.746582,0.911621,-0.343994,-0.778809,0.065979,-0.22998,-0.153564,-0.722168,-0.947266,1.321289,-0.075256,0.99707,-0.137695,0.724121,-0.722168,0.541992,0.730469,0.478027,-0.662109,0.605957,0.0,0.280518,0.781738,-0.140503,0.324951,0.540527,-0.686523,0.388916,-1.551758,-0.662109,-1.089844,-0.730469,-0.878906,-1.139648,-1.336914,0.804688,0.247803,-1.292969,-0.892578,0.078125,-0.957031,-0.195312,0.329102,-0.181152,0.65332,0.069214,-0.818848,0.308838,0.894531,1.197266,1.052734,-1.083984,-0.541992,-0.043518,-0.375732,0.167969,0.552246,0.772949,1.0,-1.25,0.409912,1.639648,-1.0,0.876953,-1.523438,-0.526855,-0.071045,0.269531,1.0,0.035156,-0.309326,-1.067383,-1.145508,-0.02533,-0.398438,-1.173828,0.427002,0.043945,1.408203,-0.71875,2.076172,-0.507812,0.942383,1.02832,0.0,1.050781,-1.009766,-1.363281,-1.496094,-1.260742,-0.452148,0.492188,0.400635,-2.302734,1.443359,-0.231445,0.777344,1.995117,-0.59375,0.737793,-0.841797,-0.191528,0.222778,0.611328,1.15332,0.866211,-0.269775,-0.078003,-0.332764,-0.546387,-0.678711,-0.434082,-0.584473,0.332031,-0.646973,0.122314,-0.068176,-0.868164,0.844727,1.179688,0.484863,-0.050537,-0.491943,-0
.164429,0.133667,-0.952637,-0.811035,-0.821289,-0.546875,-0.067871,-0.76709,-0.015457,0.980469,0.799316,0.79834,-0.633301,0.779785,0.171265,1.166016,0.59082,0.11853,0.0,0.086182,1.135742,-1.583008,-0.481934,0.226685,-0.894531,-0.514648,-1.0,0.884277,-0.557617,-0.875488,0.537109,-0.154175,0.912598,-0.734375,0.819336,0.941406,-0.387695,-1.086914,-0.929688,-0.974121,-0.343506
2,0.394043,0.615723,0.567871,-1.083008,0.979492,-1.125977,0.114807,-1.035156,0.465088,0.150879,-0.044006,0.091248,-1.168945,-0.467285,0.095276,1.140625,-0.16687,-0.007294,-0.449463,0.325684,-0.682617,0.016266,0.026123,-0.547363,0.55127,-0.169678,0.857422,-0.09845,-0.860352,0.180176,0.609863,0.524902,-0.400391,0.751465,-0.287598,0.568359,0.829102,-0.253174,-0.235474,0.500977,-0.655762,-0.750977,0.664062,1.189453,1.087891,0.859375,-0.183228,0.082336,-0.440674,0.631348,-0.026169,0.015625,-0.855957,1.052734,-0.17041,-0.11969,0.038177,0.309814,-0.549805,1.638672,-0.476562,-0.90918,-0.544922,-0.546387,1.748047,0.148315,0.365234,0.342773,-0.813965,-0.046417,-0.484863,-0.270264,0.136353,-1.441406,-0.079163,-0.530762,0.130981,0.221558,-0.228882,0.700195,0.023468,0.269287,0.039825,-0.963867,-0.790039,0.693359,0.295166,0.447754,-0.301514,1.039062,-0.291748,1.020508,0.529297,-1.09668,0.150757,1.254883,0.065979,0.869141,0.518066,0.494385,-0.02858,-0.478271,-0.733887,0.200806,-0.174561,-0.255127,0.558594,0.586426,-2.177734,-0.765137,0.200317,0.346436,0.0,-0.065796,-0.29834,-0.040955,-0.875977,-0.625,1.005859,-0.471924,0.788574,-0.547363,-0.885254,0.186157,1.137695,0.052643,0.323242,1.15625,0.247803,0.859375,0.873047,0.078125,-0.418213,0.648438,0.329102,0.015572,0.65332,0.069214,0.907715,-0.642578,-1.170898,-0.247559,0.694336,1.0625,0.718262,-0.105347,0.166626,-0.375732,-0.513184,-0.393555,1.0,0.596191,-0.446289,-0.709961,-1.0,-1.431641,-0.577637,-0.418457,-0.515137,-0.283691,1.0,0.035156,-0.393799,0.288086,0.103333,-0.098328,0.133911,0.21228,0.384521,0.501465,0.010094,-0.007168,-1.117188,-0.564941,0.672852,-0.775879,0.0,-0.070007,0.883301,0.942871,-0.546875,0.905273,-0.452148,-1.169922,-0.274414,0.114014,0.10321,0.071045,-1.286133,-0.407959,0.137207,-0.399414,0.335693,-0.149292,0.222778,-0.171387,1.15332,-0.964355,-0.269775,-0.654297,0.180542,-1.220703,0.45752,-0.461182,-0.976562,0.147339,0.060364,0.122314,1.450195,1.163086,0.402588,0.0,0.523438,-0.005413,-0.092407,-0.001884,0.25
9277,0.507324,0.828125,0.25708,0.027908,-0.662598,1.066406,-0.52832,-1.020508,0.169678,-0.911133,-0.222046,0.536621,-0.161743,-0.114319,0.43335,-0.207153,0.0,-0.388184,0.062622,0.980957,0.899414,0.150146,0.245605,-1.429688,-1.0,-0.033508,-0.147095,-0.087524,-0.528809,-0.138062,0.912598,-0.551758,-1.220703,-1.060547,-0.219116,-1.086914,-0.612305,-0.113953,0.243652
3,-2.34375,-0.011871,1.875,-0.815918,0.77832,0.299072,0.114807,-1.176758,0.30127,-0.015671,-0.65625,-0.150879,-1.168945,-0.681641,2.921875,1.179688,0.364014,0.365723,-1.478516,0.325684,0.955566,-0.105042,-0.588867,0.649902,-1.813477,1.526367,-0.054657,-0.345459,0.259277,0.124939,-0.47876,-0.457764,-0.072266,0.577637,-0.266113,-0.699707,-0.306152,-0.680664,-1.658203,1.000977,-0.361084,-1.085938,-1.008789,1.189453,-1.285156,-1.00293,-0.248047,0.082336,-0.440674,-1.583984,-1.106445,-1.330078,-0.834961,0.544434,-0.17041,-0.11969,-0.786133,0.464844,-0.549805,-0.831055,-0.653809,-0.940918,-0.424805,-0.41333,-0.490479,0.148315,0.973145,1.689453,-0.339355,-0.110779,-0.607422,-0.52832,1.333984,-0.625,0.363037,0.70459,-1.298828,-0.821289,-0.659668,1.354492,-0.819824,-1.084961,0.057983,-0.514648,0.664551,0.183716,-2.169922,-0.181396,-0.301514,-0.918945,-1.126953,-0.980469,1.055664,-1.09668,-1.319336,-0.778809,0.065979,0.476807,-0.751465,-1.316406,-0.743652,-0.62793,0.326416,0.838379,-1.037109,-0.126465,-0.462402,0.656738,-0.275879,-0.213379,-4.339844,-1.129883,0.0,0.814941,1.477539,-0.321289,-0.170044,0.584473,0.937012,-0.263428,-1.551758,-1.373047,-1.654297,-0.716309,-0.878906,-0.921875,-0.945801,1.65625,0.247803,-1.026367,-0.593262,0.078125,-1.001953,-0.667969,0.329102,-0.092896,-1.530273,0.069214,-0.818848,-0.638672,-1.170898,-0.450928,-0.500977,-0.526855,-1.0625,-0.075806,-0.375732,0.736328,-0.513184,1.615234,1.0,-2.492188,-0.615234,0.117249,-1.0,0.876953,-0.577637,-0.743652,-0.147461,-1.297852,1.0,0.035187,-0.4021,-0.655762,-1.145508,-0.62793,-0.152344,-1.62793,0.0,0.092651,-0.189575,-2.15625,-1.526367,-0.564941,0.869141,-1.160156,0.0,-0.195068,-0.347168,-0.388672,0.243286,0.652344,-0.45166,-1.117188,0.738281,-0.87793,-1.006836,-0.470947,-1.286133,0.137573,0.0401,1.080078,-0.867188,-0.168701,0.222778,0.219971,-0.897949,-0.226685,-0.261719,0.137817,-1.24707,-0.209229,-0.476807,1.494141,0.187256,-0.150513,-0.377686,0.122314,1.075195,-0.868164,-1.424805,0.0,0.403076,-0.01443
5,0.020172,-0.431396,-1.279297,0.835938,-0.561523,-1.1875,1.179688,-1.575195,-1.43457,0.084229,-1.020508,1.272461,-0.667969,-1.452148,1.168945,-1.025391,-0.924805,1.013672,-0.324463,0.0,0.012917,0.599121,-1.84375,2.927734,2.324219,-0.666504,-0.049957,-1.0,-0.172485,-0.557617,-0.986816,0.237793,0.38208,0.912598,-0.266357,-1.220703,0.941406,-0.608887,0.104919,-0.783203,1.151367,-0.773438
4,0.842285,-0.262939,2.330078,-0.742676,-0.946777,1.230469,0.114807,-0.005859,0.498779,-0.235474,-0.17334,0.106506,-0.138062,-0.826172,4.070312,0.148315,0.269531,-0.046692,0.194336,0.325684,1.933594,-1.120117,-0.585449,0.535645,0.55127,0.216187,0.022415,-0.924316,0.19812,0.232422,-1.567383,-0.317383,-1.020508,0.079224,-0.355225,-0.709961,-0.278076,-0.327881,0.957031,-0.331787,-0.538086,-0.212158,-0.999512,-0.84082,-1.991211,-1.635742,-0.183228,0.082336,-0.440674,-1.583984,0.059174,-1.172852,-0.605469,-0.138306,-0.17041,-0.11969,-0.90625,-1.241211,-0.549805,-0.8125,-0.696289,-0.410889,-0.783203,-0.695801,-1.424805,0.148315,0.677246,1.110352,-0.384277,-0.089661,-0.80127,-0.934082,0.136353,-1.712891,0.758301,0.370605,-1.555664,-1.160156,-0.699219,0.644043,-0.774902,-1.143555,-0.107422,0.00943,0.768555,-0.835938,0.378418,-0.651367,-0.301514,-0.918945,-0.960449,-0.980469,-0.484131,-1.09668,0.914551,1.254883,0.065979,0.779785,-0.684082,-1.149414,-0.381104,-1.0,-0.27124,1.0,-1.216797,-0.800781,-0.421631,0.497803,-1.394531,-0.467041,-0.208984,-1.168945,0.0,0.73291,2.537109,-0.015411,0.255859,1.038086,0.279053,-1.011719,0.788574,-0.682617,-0.496826,-0.498779,-0.878906,-0.773438,-1.15625,-0.006191,0.247803,-0.749512,-0.875,0.078125,-0.912109,0.334961,0.329102,0.801758,-1.530273,0.069214,-0.490723,-0.573242,-0.137939,-1.138672,-0.739746,0.8125,-0.588867,-0.043549,0.166626,-1.019531,-2.628906,5.019531,1.0,-0.414551,-0.568848,-0.709961,-1.0,0.876953,-0.577637,1.533203,0.0,0.549805,1.0,0.035187,-0.658203,-1.384766,-0.833496,-0.733398,-1.458984,-2.023438,-1.419922,0.400391,0.344482,0.666016,0.11908,-0.558105,0.88916,0.612793,0.0,-0.114563,-0.347168,-0.553711,0.802246,-0.346924,-0.452148,-0.095825,0.231812,-1.511719,-1.117188,-0.81543,-1.286133,-0.921387,-0.638184,0.615234,0.34668,-0.211792,0.222778,-0.171387,-0.897949,0.192017,-0.269775,-0.185913,-0.077209,-1.204102,0.365234,-0.468018,0.760254,-2.261719,-1.264648,0.122314,1.214844,-0.868164,1.074219,0.0,1.635742,-0.050537,-0.77539
1,-0.499512,-1.524414,-0.461426,-0.660645,-0.821289,0.109375,0.275146,0.792969,-1.657227,0.980469,0.778809,-0.916504,-0.556152,0.925781,-1.507812,1.166016,0.941406,-0.501465,0.0,-0.237915,0.330811,-0.585449,-1.314453,-1.918945,-0.438721,-1.576172,-1.226562,1.067383,-0.519043,-1.22168,-0.724121,-0.17041,0.912598,-0.741211,-1.220703,0.941406,-0.588379,0.104919,0.753418,1.345703,-0.737793


In [5]:
## Put the target back in front of the retained features so a single frame
## holds everything needed for modeling
columns = [target, *df_features.columns]
df_features_target = train[columns]
display(df_features_target.head())

Unnamed: 0,target,f_0,f_1,f_2,f_5,f_6,f_7,f_8,f_9,f_10,f_11,f_12,f_13,f_14,f_16,f_17,f_18,f_19,f_20,f_21,f_22,f_23,f_24,f_25,f_26,f_27,f_29,f_30,f_31,f_32,f_33,f_34,f_35,f_36,f_37,f_38,f_39,f_40,f_42,f_43,f_44,f_45,f_46,f_47,f_48,f_49,f_50,f_52,f_53,f_55,f_56,f_57,f_58,f_59,f_60,f_62,f_63,f_64,f_65,f_66,f_67,f_68,f_69,f_70,f_71,f_73,f_74,f_75,f_76,f_77,f_78,f_79,f_80,f_81,f_82,f_83,f_84,f_85,f_86,f_87,f_88,f_89,f_90,f_91,f_92,f_93,f_94,f_96,f_98,f_99,f_100,f_101,f_102,f_103,f_104,f_105,f_107,f_108,f_109,f_110,f_111,f_112,f_113,f_114,f_115,f_116,f_117,f_118,f_119,f_120,f_121,f_122,f_123,f_124,f_125,f_126,f_127,f_128,f_129,f_130,f_131,f_132,f_133,f_135,f_137,f_138,f_139,f_140,f_141,f_142,f_143,f_144,f_145,f_147,f_149,f_150,f_151,f_152,f_153,f_154,f_155,f_156,f_159,f_160,f_162,f_163,f_165,f_166,f_167,f_168,f_169,f_170,f_171,f_172,f_174,f_175,f_176,f_177,f_178,f_179,f_181,f_182,f_183,f_184,f_185,f_187,f_188,f_189,f_190,f_191,f_192,f_194,f_195,f_196,f_197,f_198,f_199,f_200,f_201,f_202,f_204,f_208,f_209,f_210,f_213,f_215,f_216,f_217,f_218,f_219,f_220,f_221,f_222,f_223,f_224,f_225,f_227,f_229,f_230,f_231,f_232,f_233,f_234,f_235,f_236,f_237,f_238,f_239,f_241,f_242,f_243,f_244,f_246,f_248,f_249,f_250,f_251,f_252,f_253,f_256,f_257,f_258,f_259,f_260,f_261,f_263,f_264,f_265,f_266,f_267,f_268,f_269,f_270,f_271,f_272,f_275,f_276,f_278,f_279,f_281,f_282,f_283,f_284,f_285,f_286,f_287,f_289,f_290,f_291,f_292,f_293,f_294,f_295,f_296,f_297,f_298,f_299
0,-0.300781,0.932617,0.113708,-0.4021,-0.413574,0.96582,1.230469,0.114807,-2.013672,0.004936,0.28418,0.501953,-0.287842,-1.168945,-0.574219,-0.771973,1.012695,-1.230469,1.786133,-2.089844,0.325684,-0.87793,1.048828,0.131714,-0.349609,-1.813477,-0.240967,1.604492,0.003637,-0.901855,0.221558,0.609863,-0.73877,2.097656,-0.914062,-0.293945,-0.037994,0.685547,0.414795,-0.469482,-1.085938,-0.106445,0.059448,0.483154,1.189453,0.506836,0.754395,-0.183228,5.164062,-0.440674,0.631348,-1.845703,0.227783,0.841309,0.66748,-0.17041,-0.11969,-0.504883,0.662598,1.933594,-0.8125,0.072815,-0.778809,-0.553711,-0.032776,-1.424805,0.148315,0.257812,0.735352,0.563965,-0.272217,1.19043,-0.101379,1.333984,0.191284,0.630859,1.010742,0.161865,0.609375,-0.219482,-0.013069,1.505859,-1.319336,0.448242,-0.635254,-0.075378,1.033203,0.139893,0.593262,-0.301514,0.666504,0.713379,1.020508,0.879883,-1.09668,-0.21106,-0.778809,0.065979,0.229736,0.435303,1.233398,-0.865723,0.062347,0.382324,-1.31543,0.786621,0.770508,-0.871094,0.583496,0.115601,0.209595,0.325439,0.469238,0.0,-0.731445,-0.249512,-0.050568,-1.232422,-0.790527,0.493408,0.35791,-0.381592,0.176392,-0.741699,1.080078,1.137695,1.199219,0.030609,-0.356201,0.247803,1.395508,0.961914,0.078125,0.70752,-0.026306,0.329102,0.196045,0.65332,0.069214,0.907715,-0.350586,-1.170898,0.48291,-0.09491,0.126831,0.89209,-0.31543,0.704102,-0.0177,-0.513184,-0.362549,1.0,2.265625,0.360107,1.639648,-1.0,0.876953,0.368164,0.991211,-1.224609,-0.879883,1.0,0.035156,0.693359,0.307129,0.728027,1.220703,-0.939941,-0.106934,0.0,-0.569336,-0.386475,-0.452393,0.269775,-0.56543,-0.262207,-1.473633,0.0,0.428223,1.740234,-0.72998,-0.225952,-0.008301,-0.447998,-2.292969,-0.443115,0.121216,0.787598,1.996094,-1.286133,-0.157227,1.019531,0.693359,0.797363,-0.192627,0.222778,-0.171387,1.15332,0.689941,3.251953,0.992188,-0.779785,-0.546387,-0.37915,1.896484,-0.732422,-0.11377,1.12793,0.122314,0.44458,0.48584,-2.302734,0.0,-0.893555,0.055939,0.201416,-0.338135,1.27832,1.367188,0.1
45264,0.346924,-0.824219,-1.306641,-1.158203,0.709473,-1.020508,-1.291016,0.038666,0.187134,-0.680176,0.900391,-0.924805,-1.057617,-0.167114,0.0,-0.237915,-0.742188,0.992676,0.961426,-0.00626,0.473633,0.040131,0.453613,-1.597656,0.301758,0.157471,1.505859,0.365967,-1.095703,0.200073,0.819336,0.941406,-0.086792,-1.086914,-1.044922,-0.287598,0.321533
1,-0.231079,0.811035,-0.51416,0.742188,1.771484,1.427734,1.133789,0.114807,-0.219238,-0.351807,0.84668,0.440186,0.499756,0.893066,-0.681641,1.253906,-1.027344,-1.69043,0.011154,0.875488,0.325684,-0.458252,-1.797852,-0.300293,0.584961,0.55127,1.235352,-0.984863,-1.084961,3.162109,0.21106,-2.65625,-0.177002,0.486572,1.237305,-0.44751,-0.403564,-0.769531,-0.516602,-1.307617,-0.092407,0.971191,-0.069336,-0.963379,-0.84082,0.438965,0.317139,-1.167969,0.082336,-0.440674,0.631348,0.495117,1.163086,0.453369,0.631836,-0.17041,-0.11969,0.186157,-0.29248,-0.549805,-1.629883,0.902832,0.509766,0.377441,0.052094,-1.307617,0.148315,0.777832,-0.383301,-0.099487,-0.119995,1.466797,-0.255371,0.136353,0.191284,-0.404541,-1.220703,-1.442383,1.088867,-0.479248,0.476318,-1.238281,0.13916,-1.238281,0.277344,0.925781,-0.666016,-1.344727,-0.081726,-0.301514,-0.918945,-0.051697,1.020508,0.746582,0.911621,-0.343994,-0.778809,0.065979,-0.22998,-0.153564,-0.722168,-0.947266,1.321289,-0.075256,0.99707,-0.137695,0.724121,-0.722168,0.541992,0.730469,0.478027,-0.662109,0.605957,0.0,0.280518,0.781738,-0.140503,0.324951,0.540527,-0.686523,0.388916,-1.551758,-0.662109,-1.089844,-0.730469,-0.878906,-1.139648,-1.336914,0.804688,0.247803,-1.292969,-0.892578,0.078125,-0.957031,-0.195312,0.329102,-0.181152,0.65332,0.069214,-0.818848,0.308838,0.894531,1.197266,1.052734,-1.083984,-0.541992,-0.043518,-0.375732,0.167969,0.552246,0.772949,1.0,-1.25,0.409912,1.639648,-1.0,0.876953,-1.523438,-0.526855,-0.071045,0.269531,1.0,0.035156,-0.309326,-1.067383,-1.145508,-0.02533,-0.398438,-1.173828,0.427002,0.043945,1.408203,-0.71875,2.076172,-0.507812,0.942383,1.02832,0.0,1.050781,-1.009766,-1.363281,-1.496094,-1.260742,-0.452148,0.492188,0.400635,-2.302734,1.443359,-0.231445,0.777344,1.995117,-0.59375,0.737793,-0.841797,-0.191528,0.222778,0.611328,1.15332,0.866211,-0.269775,-0.078003,-0.332764,-0.546387,-0.678711,-0.434082,-0.584473,0.332031,-0.646973,0.122314,-0.068176,-0.868164,0.844727,1.179688,0.484863,-0.050537,-0
.491943,-0.164429,0.133667,-0.952637,-0.811035,-0.821289,-0.546875,-0.067871,-0.76709,-0.015457,0.980469,0.799316,0.79834,-0.633301,0.779785,0.171265,1.166016,0.59082,0.11853,0.0,0.086182,1.135742,-1.583008,-0.481934,0.226685,-0.894531,-0.514648,-1.0,0.884277,-0.557617,-0.875488,0.537109,-0.154175,0.912598,-0.734375,0.819336,0.941406,-0.387695,-1.086914,-0.929688,-0.974121,-0.343506
2,0.568848,0.394043,0.615723,0.567871,-1.083008,0.979492,-1.125977,0.114807,-1.035156,0.465088,0.150879,-0.044006,0.091248,-1.168945,-0.467285,0.095276,1.140625,-0.16687,-0.007294,-0.449463,0.325684,-0.682617,0.016266,0.026123,-0.547363,0.55127,-0.169678,0.857422,-0.09845,-0.860352,0.180176,0.609863,0.524902,-0.400391,0.751465,-0.287598,0.568359,0.829102,-0.253174,-0.235474,0.500977,-0.655762,-0.750977,0.664062,1.189453,1.087891,0.859375,-0.183228,0.082336,-0.440674,0.631348,-0.026169,0.015625,-0.855957,1.052734,-0.17041,-0.11969,0.038177,0.309814,-0.549805,1.638672,-0.476562,-0.90918,-0.544922,-0.546387,1.748047,0.148315,0.365234,0.342773,-0.813965,-0.046417,-0.484863,-0.270264,0.136353,-1.441406,-0.079163,-0.530762,0.130981,0.221558,-0.228882,0.700195,0.023468,0.269287,0.039825,-0.963867,-0.790039,0.693359,0.295166,0.447754,-0.301514,1.039062,-0.291748,1.020508,0.529297,-1.09668,0.150757,1.254883,0.065979,0.869141,0.518066,0.494385,-0.02858,-0.478271,-0.733887,0.200806,-0.174561,-0.255127,0.558594,0.586426,-2.177734,-0.765137,0.200317,0.346436,0.0,-0.065796,-0.29834,-0.040955,-0.875977,-0.625,1.005859,-0.471924,0.788574,-0.547363,-0.885254,0.186157,1.137695,0.052643,0.323242,1.15625,0.247803,0.859375,0.873047,0.078125,-0.418213,0.648438,0.329102,0.015572,0.65332,0.069214,0.907715,-0.642578,-1.170898,-0.247559,0.694336,1.0625,0.718262,-0.105347,0.166626,-0.375732,-0.513184,-0.393555,1.0,0.596191,-0.446289,-0.709961,-1.0,-1.431641,-0.577637,-0.418457,-0.515137,-0.283691,1.0,0.035156,-0.393799,0.288086,0.103333,-0.098328,0.133911,0.21228,0.384521,0.501465,0.010094,-0.007168,-1.117188,-0.564941,0.672852,-0.775879,0.0,-0.070007,0.883301,0.942871,-0.546875,0.905273,-0.452148,-1.169922,-0.274414,0.114014,0.10321,0.071045,-1.286133,-0.407959,0.137207,-0.399414,0.335693,-0.149292,0.222778,-0.171387,1.15332,-0.964355,-0.269775,-0.654297,0.180542,-1.220703,0.45752,-0.461182,-0.976562,0.147339,0.060364,0.122314,1.450195,1.163086,0.402588,0.0,0.523438,-0.005413,-0.092407,-0.00
1884,0.259277,0.507324,0.828125,0.25708,0.027908,-0.662598,1.066406,-0.52832,-1.020508,0.169678,-0.911133,-0.222046,0.536621,-0.161743,-0.114319,0.43335,-0.207153,0.0,-0.388184,0.062622,0.980957,0.899414,0.150146,0.245605,-1.429688,-1.0,-0.033508,-0.147095,-0.087524,-0.528809,-0.138062,0.912598,-0.551758,-1.220703,-1.060547,-0.219116,-1.086914,-0.612305,-0.113953,0.243652
3,-1.064453,-2.34375,-0.011871,1.875,-0.815918,0.77832,0.299072,0.114807,-1.176758,0.30127,-0.015671,-0.65625,-0.150879,-1.168945,-0.681641,2.921875,1.179688,0.364014,0.365723,-1.478516,0.325684,0.955566,-0.105042,-0.588867,0.649902,-1.813477,1.526367,-0.054657,-0.345459,0.259277,0.124939,-0.47876,-0.457764,-0.072266,0.577637,-0.266113,-0.699707,-0.306152,-0.680664,-1.658203,1.000977,-0.361084,-1.085938,-1.008789,1.189453,-1.285156,-1.00293,-0.248047,0.082336,-0.440674,-1.583984,-1.106445,-1.330078,-0.834961,0.544434,-0.17041,-0.11969,-0.786133,0.464844,-0.549805,-0.831055,-0.653809,-0.940918,-0.424805,-0.41333,-0.490479,0.148315,0.973145,1.689453,-0.339355,-0.110779,-0.607422,-0.52832,1.333984,-0.625,0.363037,0.70459,-1.298828,-0.821289,-0.659668,1.354492,-0.819824,-1.084961,0.057983,-0.514648,0.664551,0.183716,-2.169922,-0.181396,-0.301514,-0.918945,-1.126953,-0.980469,1.055664,-1.09668,-1.319336,-0.778809,0.065979,0.476807,-0.751465,-1.316406,-0.743652,-0.62793,0.326416,0.838379,-1.037109,-0.126465,-0.462402,0.656738,-0.275879,-0.213379,-4.339844,-1.129883,0.0,0.814941,1.477539,-0.321289,-0.170044,0.584473,0.937012,-0.263428,-1.551758,-1.373047,-1.654297,-0.716309,-0.878906,-0.921875,-0.945801,1.65625,0.247803,-1.026367,-0.593262,0.078125,-1.001953,-0.667969,0.329102,-0.092896,-1.530273,0.069214,-0.818848,-0.638672,-1.170898,-0.450928,-0.500977,-0.526855,-1.0625,-0.075806,-0.375732,0.736328,-0.513184,1.615234,1.0,-2.492188,-0.615234,0.117249,-1.0,0.876953,-0.577637,-0.743652,-0.147461,-1.297852,1.0,0.035187,-0.4021,-0.655762,-1.145508,-0.62793,-0.152344,-1.62793,0.0,0.092651,-0.189575,-2.15625,-1.526367,-0.564941,0.869141,-1.160156,0.0,-0.195068,-0.347168,-0.388672,0.243286,0.652344,-0.45166,-1.117188,0.738281,-0.87793,-1.006836,-0.470947,-1.286133,0.137573,0.0401,1.080078,-0.867188,-0.168701,0.222778,0.219971,-0.897949,-0.226685,-0.261719,0.137817,-1.24707,-0.209229,-0.476807,1.494141,0.187256,-0.150513,-0.377686,0.122314,1.075195,-0.868164,-1.424805,0.0,0.40307
6,-0.014435,0.020172,-0.431396,-1.279297,0.835938,-0.561523,-1.1875,1.179688,-1.575195,-1.43457,0.084229,-1.020508,1.272461,-0.667969,-1.452148,1.168945,-1.025391,-0.924805,1.013672,-0.324463,0.0,0.012917,0.599121,-1.84375,2.927734,2.324219,-0.666504,-0.049957,-1.0,-0.172485,-0.557617,-0.986816,0.237793,0.38208,0.912598,-0.266357,-1.220703,0.941406,-0.608887,0.104919,-0.783203,1.151367,-0.773438
4,-0.531738,0.842285,-0.262939,2.330078,-0.742676,-0.946777,1.230469,0.114807,-0.005859,0.498779,-0.235474,-0.17334,0.106506,-0.138062,-0.826172,4.070312,0.148315,0.269531,-0.046692,0.194336,0.325684,1.933594,-1.120117,-0.585449,0.535645,0.55127,0.216187,0.022415,-0.924316,0.19812,0.232422,-1.567383,-0.317383,-1.020508,0.079224,-0.355225,-0.709961,-0.278076,-0.327881,0.957031,-0.331787,-0.538086,-0.212158,-0.999512,-0.84082,-1.991211,-1.635742,-0.183228,0.082336,-0.440674,-1.583984,0.059174,-1.172852,-0.605469,-0.138306,-0.17041,-0.11969,-0.90625,-1.241211,-0.549805,-0.8125,-0.696289,-0.410889,-0.783203,-0.695801,-1.424805,0.148315,0.677246,1.110352,-0.384277,-0.089661,-0.80127,-0.934082,0.136353,-1.712891,0.758301,0.370605,-1.555664,-1.160156,-0.699219,0.644043,-0.774902,-1.143555,-0.107422,0.00943,0.768555,-0.835938,0.378418,-0.651367,-0.301514,-0.918945,-0.960449,-0.980469,-0.484131,-1.09668,0.914551,1.254883,0.065979,0.779785,-0.684082,-1.149414,-0.381104,-1.0,-0.27124,1.0,-1.216797,-0.800781,-0.421631,0.497803,-1.394531,-0.467041,-0.208984,-1.168945,0.0,0.73291,2.537109,-0.015411,0.255859,1.038086,0.279053,-1.011719,0.788574,-0.682617,-0.496826,-0.498779,-0.878906,-0.773438,-1.15625,-0.006191,0.247803,-0.749512,-0.875,0.078125,-0.912109,0.334961,0.329102,0.801758,-1.530273,0.069214,-0.490723,-0.573242,-0.137939,-1.138672,-0.739746,0.8125,-0.588867,-0.043549,0.166626,-1.019531,-2.628906,5.019531,1.0,-0.414551,-0.568848,-0.709961,-1.0,0.876953,-0.577637,1.533203,0.0,0.549805,1.0,0.035187,-0.658203,-1.384766,-0.833496,-0.733398,-1.458984,-2.023438,-1.419922,0.400391,0.344482,0.666016,0.11908,-0.558105,0.88916,0.612793,0.0,-0.114563,-0.347168,-0.553711,0.802246,-0.346924,-0.452148,-0.095825,0.231812,-1.511719,-1.117188,-0.81543,-1.286133,-0.921387,-0.638184,0.615234,0.34668,-0.211792,0.222778,-0.171387,-0.897949,0.192017,-0.269775,-0.185913,-0.077209,-1.204102,0.365234,-0.468018,0.760254,-2.261719,-1.264648,0.122314,1.214844,-0.868164,1.074219,0.0,1.635742,-0.05053
7,-0.775391,-0.499512,-1.524414,-0.461426,-0.660645,-0.821289,0.109375,0.275146,0.792969,-1.657227,0.980469,0.778809,-0.916504,-0.556152,0.925781,-1.507812,1.166016,0.941406,-0.501465,0.0,-0.237915,0.330811,-0.585449,-1.314453,-1.918945,-0.438721,-1.576172,-1.226562,1.067383,-0.519043,-1.22168,-0.724121,-0.17041,0.912598,-0.741211,-1.220703,0.941406,-0.588379,0.104919,0.753418,1.345703,-0.737793


## Modeling

In [6]:
%%time 
from sklearn.model_selection import train_test_split

def prep_data_for_modeling(df, target='target', test_size=0.3, random_state=1111):
    """Split a feature/target frame into train and test sets and print their shapes.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame containing the feature columns and the ``target`` column.
    target : str, default 'target'
        Name of the label column; every other column is treated as a feature.
    test_size : float, default 0.3
        Passed to ``train_test_split`` as ``test_size``.
    random_state : int, default 1111
        Passed to ``train_test_split`` as ``random_state``.

    Returns
    -------
    tuple
        ``(x_train, y_train, x_test, y_test)`` -- note the order differs from
        the ``train_test_split`` return order.
    """
    X = df.drop(columns=target)
    y = df[target]
    print(f"X shape: {X.shape}")
    print(f"y shape: {y.shape}")
    print('\n')

    x_train, x_test, y_train, y_test = train_test_split(
        X, y, test_size=test_size, random_state=random_state
    )
    print(f"X_train shape: {x_train.shape}")
    print(f"y_train shape: {y_train.shape}")
    print(f"X_test shape: {x_test.shape}")
    print(f"y_test shape: {y_test.shape}")

    return x_train, y_train, x_test, y_test

# Split the reduced feature/target frame into train and hold-out sets (30% held out)
x_train, y_train, x_test, y_test = prep_data_for_modeling(df_features_target)

X shape: (3141410, 256)
y shape: (3141410,)


X_train shape: (2198987, 256)
y_train shape: (2198987,)
X_test shape: (942423, 256)
y_test shape: (942423,)
CPU times: user 13.8 s, sys: 3.7 s, total: 17.5 s
Wall time: 17.5 s


### Use Hyperopt for hyperparameter tuning

In [7]:
## Hyperparameter tuning for LightGBM with Hyperopt
from hyperopt import hp, tpe, Trials, STATUS_OK
from hyperopt.fmin import fmin
from hyperopt.pyll.stochastic import sample
import lightgbm as lgb
import gc

# Global Hyperopt settings:
#   NUM_EVALS - number of Hyperopt evaluation rounds
#   N_FOLDS   - number of cross-validation folds on data in each evaluation round
NUM_EVALS, N_FOLDS = 1000, 5

# LightGBM settings:
#   LGBM_MAX_LEAVES      - maximum number of leaves per tree
#   LGBM_MAX_DEPTH       - maximum tree depth
#   EVAL_METRIC_LGBM_REG - regression metric ('rmse'; was previously 'mae')
LGBM_MAX_LEAVES = 1 << 11
LGBM_MAX_DEPTH = 25
EVAL_METRIC_LGBM_REG = 'rmse'

def hyperopt_lgbm(data_train, labels_train, data_eval, labels_eval, num_evals=NUM_EVALS, diagnostic=False):
    """Search LightGBM regression hyperparameters with Hyperopt's TPE algorithm.

    Each trial trains a model on ``(data_train, labels_train)`` with early
    stopping on ``(data_eval, labels_eval)`` and is scored by the RMSE of its
    predictions on ``data_eval`` against ``labels_eval``.

    Parameters
    ----------
    data_train, labels_train
        Training features and labels, wrapped in an ``lgb.Dataset``.
    data_eval, labels_eval
        Evaluation features and labels; used both as the early-stopping
        validation set and for the RMSE that Hyperopt minimises.
    num_evals : int, default NUM_EVALS
        Number of Hyperopt trials (``max_evals``).
    diagnostic : bool, default False
        If True, also return the ``Trials`` object.

    Returns
    -------
    dict or (dict, Trials)
        The best sampled values as returned by ``fmin`` (only the parameters
        drawn from ``hp`` distributions), with the integer parameters cast to
        ``int``; plus the trials when ``diagnostic`` is True.
    """
    print(f"'Running {num_evals} round(s) of LightGBM hyperparameter optimisation:")

    # Sampled with hp.quniform, which yields floats; LightGBM needs ints.
    integer_params = ['max_depth', 'num_leaves', 'min_data_in_leaf', 'n_estimators']

    dtrain = lgb.Dataset(data_train, label=labels_train)
    dvalid = lgb.Dataset(data_eval, label=labels_eval)

    def objective(params):
        """Train one model with ``params`` and return its evaluation RMSE as the loss."""
        print(params)

        # cast integer params from float to int
        for param in integer_params:
            params[param] = int(params[param])

        num_round = int(params['n_estimators'])

        # NOTE(review): `early_stopping_rounds` / `verbose_eval` are keyword
        # arguments of older lgb.train versions; newer releases expect
        # callbacks instead -- confirm against the installed LightGBM.
        model = lgb.train(params, dtrain, num_round, valid_sets=dvalid, early_stopping_rounds=100, verbose_eval=False)
        y_pred = model.predict(data_eval)

        # Score against the labels passed to this function, not the notebook's
        # global y_test, so the result is correct for any evaluation set.
        rmse = np.sqrt(mean_squared_error(labels_eval, y_pred))
        print(f"RMSE: {rmse}")

        return {'loss': rmse, 'status': STATUS_OK}

    # Search space: hp.* entries are sampled per trial, plain values are fixed.
    # NOTE(review): no 'bagging_freq' is set; LightGBM documents that bagging is
    # only enabled when bagging_freq is non-zero, so 'bagging_fraction' may have
    # no effect here -- confirm.
    space = {'n_estimators': hp.quniform('n_estimators', 100, 250, 1),
             'boosting' : 'gbdt',
             'num_leaves' : hp.quniform('num_leaves', 2, LGBM_MAX_LEAVES, 1),
             'max_depth': hp.quniform('max_depth', 2, LGBM_MAX_DEPTH, 1),
             'min_data_in_leaf': hp.quniform('min_data_in_leaf', 1, 256, 1),
             'min_gain_to_split' : hp.quniform('min_gain_to_split', 0.1, 5, 0.01),
             'lambda_l1' : hp.uniform('lambda_l1', 0, 5),
             'lambda_l2' : hp.uniform('lambda_l2', 0, 5),
             'learning_rate' : hp.loguniform('learning_rate', np.log(0.005), np.log(0.2)),
             'metric' : 'RMSE',
             'objective' : 'regression',
             'feature_fraction' : hp.quniform('feature_fraction', 0.5, 1, 0.01),
             'bagging_fraction' : hp.quniform('bagging_fraction', 0.5, 1, 0.01),
             'verbose': -1,  # shut down logger output
             'feature_pre_filter' : False}

    # Trials records every evaluation so it can be inspected afterwards.
    trials = Trials()
    best = fmin(fn=objective,
                space=space,
                algo=tpe.suggest,
                max_evals=num_evals,
                trials=trials)

    # cast floats of integer params to int
    for param in integer_params:
        best[param] = int(best[param])

    print('{' + '\n'.join(f"{k}: {v}" for k, v in best.items()) + '}')

    if diagnostic:
        return (best, trials)
    else:
        return (best)

In [8]:
%%time
# lgbm_params, trials = hyperopt_lgbm(x_train, y_train, x_test, y_test, 1, diagnostic=True)

CPU times: user 2 µs, sys: 2 µs, total: 4 µs
Wall time: 9.06 µs


In [9]:
## IMPORTANT ##
## Running Hyperopt on Kaggle either takes too long or fails with an
## 'Out of Memory' error, so the Hyperopt search was moved to a Google Colab
## notebook and run there with 300 evals. For the same reason, the Hyperopt
## call in the cell above uses only 1 eval, purely for demonstration purposes.
## The best LGBM hyperparameters found by the Colab run are listed below.

best_lgbm_params = dict(
    bagging_fraction=0.99,
    boosting='gbdt',
    feature_fraction=0.81,
    feature_pre_filter=False,
    lambda_l1=4.293930802891639,
    lambda_l2=1.1593070193619666,
    learning_rate=0.06464035186294781,
    max_depth=21,
    metric='RMSE',
    min_data_in_leaf=151,
    min_gain_to_split=0.58,
    n_estimators=250,
    num_leaves=1183,
    objective='regression',
    verbose=1,
)

In [10]:
%%time
## Model with LGBM
import lightgbm as lgb

# Wrap the train / hold-out splits in LightGBM Datasets.
# NOTE(review): x_test / y_test drive early stopping here AND are the data the
# RMSE is reported on in the next cell, so that score is likely optimistic --
# confirm this is intended or carve out a separate validation split.
lgb_train = lgb.Dataset(x_train, y_train)
lgb_eval = lgb.Dataset(x_test, y_test)

# The `early_stopping_rounds=` keyword of `lgb.train` was deprecated in
# LightGBM 3.3 and removed in 4.0 (it raises TypeError there). The callback
# form below keeps the same patience of 100 rounds; `log_evaluation(period=1)`
# keeps the per-iteration validation log that the old call printed by default.
model = lgb.train(
    best_lgbm_params,
    lgb_train,
    valid_sets=[lgb_eval],
    callbacks=[
        lgb.log_evaluation(period=1),
        lgb.early_stopping(stopping_rounds=100),
    ],
)

# Keep the ground truth and the predictions for the RMSE cell below.
y_expect = y_test
y_pred = model.predict(x_test)

You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 65280
[LightGBM] [Info] Number of data points in the train set: 2198987, number of used features: 256
[LightGBM] [Info] Start training from score -0.021636
[1]	valid_0's rmse: 0.920059
Training until validation scores don't improve for 100 rounds
[2]	valid_0's rmse: 0.919207
[3]	valid_0's rmse: 0.918451
[4]	valid_0's rmse: 0.917672
[5]	valid_0's rmse: 0.916922
[6]	valid_0's rmse: 0.916303
[7]	valid_0's rmse: 0.915752
[8]	valid_0's rmse: 0.915211
[9]	valid_0's rmse: 0.914714
[10]	valid_0's rmse: 0.914305
[11]	valid_0's rmse: 0.913847
[12]	valid_0's rmse: 0.913453
[13]	valid_0's rmse: 0.913078
[14]	valid_0's rmse: 0.912687
[15]	valid_0's rmse: 0.912338
[16]	valid_0's rmse: 0.911995
[17]	valid_0's rmse: 0.91167
[18]	valid_0's rmse: 0.911392
[19]	valid_0's rmse: 0.911105
[20]	valid_0's rmse: 0.910825
[21]	valid_0's rmse: 0.910549
[22]	valid_0's rmse: 0.910292
[23]	valid_0's rmse: 0.910085
[24]	valid_0's 

In [11]:
# RMSE of the LGBM predictions against the expected targets.
# `mean_squared_error` is already imported in the first cell of the notebook.
squared_error_mean = mean_squared_error(y_expect, y_pred)
rmse = np.sqrt(squared_error_mean)
print(f"RMSE: {rmse}")

RMSE: 0.8903406784306958


## Submit

In [12]:
import ubiquant

# Create the competition environment and the iterator that yields
# (test_df, sample_prediction_df) pairs, one per batch.
env = ubiquant.make_env()
iter_test = env.iter_test()

# Columns the model was trained on; the same for every batch, so build once.
feature_columns = list(x_train.columns)

for test_df, sample_prediction_df in iter_test:
    # Restrict the batch to the training feature columns, in training order.
    batch_features = test_df[feature_columns]
    batch_pred = model.predict(batch_features)

    # Fill in the prediction frame, echo it as text, submit it, then show it
    # again with the notebook's rich display.
    sample_prediction_df['target'] = batch_pred
    print(sample_prediction_df)
    env.predict(sample_prediction_df)
    display(sample_prediction_df)

This version of the API is not optimized and should not be used to estimate the runtime of your code on the hidden test set.
   row_id    target
0  1220_1 -0.157919
1  1220_2 -0.129462


Unnamed: 0,row_id,target
0,1220_1,-0.157919
1,1220_2,-0.129462


   row_id    target
0  1221_0 -0.129720
1  1221_1 -0.035262
2  1221_2 -0.246631


Unnamed: 0,row_id,target
0,1221_0,-0.12972
1,1221_1,-0.035262
2,1221_2,-0.246631


   row_id    target
0  1222_0 -0.053578
1  1222_1 -0.134988
2  1222_2 -0.071404


Unnamed: 0,row_id,target
0,1222_0,-0.053578
1,1222_1,-0.134988
2,1222_2,-0.071404


   row_id    target
0  1223_0 -0.231389


Unnamed: 0,row_id,target
0,1223_0,-0.231389
