# Importing Libraries

In [1]:
import os
import cv2
import glob
import time
import random
import warnings

import numpy as np
import pandas as pd


from sklearn import svm
from sklearn import tree
from sklearn import impute
from sklearn import metrics
from sklearn import ensemble
from sklearn import linear_model
from sklearn import decomposition
from sklearn import preprocessing
from sklearn import model_selection
from sklearn.impute import SimpleImputer
from sklearn.model_selection import StratifiedKFold
from sklearn.metrics import roc_auc_score

from xgboost import XGBClassifier
from lightgbm import LGBMClassifier
from catboost import CatBoostClassifier


# Silence every warning category for the whole session so library chatter does
# not flood cell output.
# NOTE(review): this also hides warnings that may point at real problems.
warnings.filterwarnings('ignore')

# One seed for the notebook. Both the built-in `random` module and NumPy's
# legacy global RNG are seeded, since both modules are imported by this file.
SEED = 42
random.seed(SEED)
np.random.seed(SEED)

# Display settings: never truncate rows or columns, and print floats in
# fixed-point notation. The fully qualified option key is used instead of
# relying on pandas' partial-key matching.
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)
pd.set_option('display.float_format', '{:f}'.format)



# Loading Data 

In [2]:
# Read the sample submission CSV into a DataFrame.
submission = pd.read_csv("sample_solution.csv")

In [3]:
# N_FOLDS is presumably the cross-validation fold count (not used in this
# cell); `target` is the name of the label column.
N_FOLDS = 5
target = 'claim'

# Read both splits; the `id` column is dropped right after reading.
train_data = pd.read_csv("train.csv").drop(columns=["id"])
test_data = pd.read_csv("test.csv").drop(columns=["id"])

# Handle on the label Series. It is looked up through `target` so the column
# name is spelled out in exactly one place.
TARGET = train_data[target]

train_data.head()

Unnamed: 0,f1,f2,f3,f4,f5,f6,f7,f8,f9,f10,f11,f12,f13,f14,f15,f16,f17,f18,f19,f20,f21,f22,f23,f24,f25,f26,f27,f28,f29,f30,f31,f32,f33,f34,f35,f36,f37,f38,f39,f40,f41,f42,f43,f44,f45,f46,f47,f48,f49,f50,f51,f52,f53,f54,f55,f56,f57,f58,f59,f60,f61,f62,f63,f64,f65,f66,f67,f68,f69,f70,f71,f72,f73,f74,f75,f76,f77,f78,f79,f80,f81,f82,f83,f84,f85,f86,f87,f88,f89,f90,f91,f92,f93,f94,f95,f96,f97,f98,f99,f100,f101,f102,f103,f104,f105,f106,f107,f108,f109,f110,f111,f112,f113,f114,f115,f116,f117,f118,claim
0,0.10859,0.004314,-37.566,0.017364,0.28915,-10.251,135.12,168900.0,399240000000000.0,86.489,0.59881,1423200000.0,0.2724,9.4556,-0.050305,1938.3,8.6331,4.0607,26.867,-1.18,10961.0,1.5397,135.32,-1.4965,440.08,2590100000000.0,2194200000.0,2968800.0,0.001431,13.327,0.7505,18509.0,146820.0,-0.000276,1.0906e+16,1705.4,414.29,3.5392,1888.0,0.96893,18.388,-0.001583,7.7059,5.9325,0.025693,4.5604,0.61122,10.795,0.34193,0.23501,,5237.7,1.2961,163.66,0.40378,0.1886,-0.001446,-0.35416,6.6432,0.30534,0.51402,1907300000.0,29.861,0.96501,1797.2,72.178,108.62,1.9799,1.2907,0.99519,1.3228,827.34,777990000000000.0,41299000000.0,0.006994,6.9835,43956.0,1978.2,5.5084,-0.001081,6.1244,123180000000.0,275.92,5308500.0,1704.0,50224000000.0,53.398,-2.2012,6871.0,3.8862,-0.00558,5252.1,166.69,1.6074,0.66534,7768.9,0.99662,112570000000.0,2.2432,0.93416,0.65056,94569.0,21.471,8214.1,0.28801,0.097826,0.001071,1412400000.0,0.11093,-12.228,1.7482,1.9096,-7.1157,4378.8,1.2096,861340000000000.0,140.1,1.0177,1
1,0.1009,0.29961,11822.0,0.2765,0.4597,-0.83733,1721.9,119810.0,3874100000000000.0,9953.6,1.2093,3334100000.0,0.28631,-0.012858,-0.019912,10.284,6.1872,1.0419,4.6404,31.877,123620.0,1.3951,125.81,1.1989,136.45,9098100000.0,40041000000.0,1564000.0,0.000204,3.1074,1.5033,238000.0,21440.0,-0.001344,3.0794e+16,229.1,844.82,1.468,4726.5,0.91538,-1.5321,0.9826,7.1112,2.0797,0.042321,4.2523,0.41871,5.4499,0.012737,0.38647,7.3082,283.21,-0.92552,140.8,0.24739,-0.001656,-0.000975,-0.22629,2.4246,0.77147,0.011613,1803700000.0,64.604,0.26265,4455.0,78.339,745.51,2.9069,1.4826,1.0051,1.4974,84.446,3505600000000000.0,2242300000.0,0.8963,4.6749,17713.0,9003.1,-4.3546,0.2541,6.9191,183240000000.0,9.651,32800.0,1480.6,23006000000.0,44.051,205.69,4295.3,13.388,0.46843,754.61,83.233,1.189,29.55,7343.7,0.99815,48777000000000.0,1.2708,-0.000969,5.2952,6779.0,227.72,34.342,0.3403,0.14337,0.049276,1903200000.0,0.97673,-56.758,4.1684,0.34808,4.142,913.23,1.2464,7575100000000000.0,1861.0,0.28359,0
2,0.17803,-0.00698,907.27,0.27214,0.45948,0.17327,2298.0,360650.0,12245000000000.0,15827.0,0.38164,1230300000.0,0.25807,2.4556,,26.873,7.5463,1.9967,1.9526,817.76,-2948.7,2.0054,1.6826,1.1968,74.624,-32739000000.0,57189000000.0,11058.0,-0.003097,8.0241,1.1318,27940.0,862460.0,-0.002207,58491000000000.0,-897.84,,1.3561,3063.4,0.086232,16.106,0.001481,11.476,5.343,0.012162,4.1018,-0.8827,8.1228,-0.67669,0.3377,-1.0732,4097.0,13.458,159.24,0.3223,0.56009,0.000455,-0.16083,3.5753,0.6097,0.028301,527130000.0,14.454,0.11549,14605.0,36.992,-9.6391,64.267,,0.99278,2.5891,430.4,-44535000000000.0,5144900000000.0,0.099591,6.5516,1887.5,43319.0,4.3931,0.26026,6.1052,101330000000.0,357.27,1476600.0,90.845,1306200000.0,2.3731,391.37,2965.3,,0.49459,43.524,138.52,1.1079,0.91948,47.915,,1510500000000.0,3.4663,0.56095,4.1309,95531.0,39.486,-83.148,0.084881,0.032222,0.001668,14365000.0,0.20102,-5.7688,1.2042,0.2629,8.1312,45119.0,1.1764,321810000000000.0,3838.2,0.4069,1
3,0.15236,0.007259,780.1,0.025179,0.51947,7.4914,112.51,259490.0,77814000000000.0,-36.837,1.1096,1223100000.0,0.30944,10.37,-0.10626,533.84,7.849,1.0379,8.003,12.349,-195.28,2.5598,92.142,0.63789,1054.9,-12041000000.0,5187300000000.0,1475400.0,1.0365,1.1903,0.98941,301200.0,,-7e-06,-92992000000000.0,-10.818,1020.3,2.9553,3342.5,-0.000372,17.011,0.095268,5.7448,15.883,0.037934,4.486,-0.88909,8.4384,-1.1898,0.001391,,175.81,67.133,119.26,0.007034,0.46004,-0.000705,-0.39149,2.0888,0.7979,0.13592,4011100000.0,63.063,0.033075,75194.0,103.97,-15.482,2.9432,1.1804,1.007,2.1572,1251.5,1894700000000000.0,10770000000.0,0.99225,4.5331,14348.0,1575.7,9.8105,0.37283,1.5606,18354000000.0,-3.4298,6485700.0,2120.0,30812000000.0,34.056,157.43,3724.5,8.4211,0.40778,2971.2,204.7,-0.97998,9.9405,12011.0,0.99898,50634000000000.0,1.2261,0.2502,0.72974,373690.0,194.65,120.93,0.26071,0.23424,-0.002794,1442300000.0,-0.01182,-34.858,2.0694,0.79631,-16.336,4952.4,1.1784,4533000000000.0,4889.1,0.51486,1
4,0.11623,0.5029,-109.15,0.29791,0.3449,-0.40932,2538.9,65332.0,1907200000000000.0,144.12,1.0531,2634100000.0,0.29782,2.6548,,1808.9,7.2783,3.9757,,,29520.0,3.4225,96.725,0.79725,215.57,17326000000000.0,2635200000000.0,2161200.0,0.89547,6.8257,0.97413,142620.0,231350.0,0.001257,1.0125e+16,51.508,293.76,1.3351,3042.1,0.006791,94.889,0.91709,8.7369,,0.020281,3.9115,0.65634,6.141,-1.0896,0.24794,7.9704,2063.1,0.80633,131.77,0.17796,0.98938,0.000344,-0.98027,2.361,0.5803,0.46577,5702500000.0,23.738,-0.000847,75843.0,73.737,,64.591,1.1029,0.98985,1.3446,519.2,569320000000000.0,286960000000.0,0.011649,6.0236,1969.8,1967.6,,0.08569,1.5846,38252000000.0,130.7,102100.0,1951.8,11428000000.0,58.566,176.83,1279.0,4.9662,0.47912,-70.278,10.887,1.1434,6.1912,197.47,,15748000000000.0,1.0083,0.33953,13.486,201300.0,38.842,324.0,0.23825,0.14155,0.002208,5830700000.0,0.92739,-13.641,1.5298,1.1464,-0.43124,3856.5,1.483,-8991300000000.0,,0.23049,1


In [4]:
# Preview the first rows of the test split.
test_data.head()

Unnamed: 0,f1,f2,f3,f4,f5,f6,f7,f8,f9,f10,f11,f12,f13,f14,f15,f16,f17,f18,f19,f20,f21,f22,f23,f24,f25,f26,f27,f28,f29,f30,f31,f32,f33,f34,f35,f36,f37,f38,f39,f40,f41,f42,f43,f44,f45,f46,f47,f48,f49,f50,f51,f52,f53,f54,f55,f56,f57,f58,f59,f60,f61,f62,f63,f64,f65,f66,f67,f68,f69,f70,f71,f72,f73,f74,f75,f76,f77,f78,f79,f80,f81,f82,f83,f84,f85,f86,f87,f88,f89,f90,f91,f92,f93,f94,f95,f96,f97,f98,f99,f100,f101,f102,f103,f104,f105,f106,f107,f108,f109,f110,f111,f112,f113,f114,f115,f116,f117,f118
0,0.16585,0.48705,1295.0,0.0231,0.319,0.90188,573.29,3743.7,2705700000000.0,6221.0,1.172,5175000000.0,0.25831,3.4205,0.044983,1001.6,10.104,10.536,19.517,-1.1209,1577.6,2.1847,96.109,1.1535,95.865,2847100000000.0,96421000000.0,6406000.0,0.00299,6.6353,-0.015913,21723.0,67604.0,-0.000227,6.0462e+16,203.58,301.79,1.3461,5524.6,-0.003163,21.883,0.027383,7.2113,24.825,-0.00142,4.895,-1.0871,7.0561,-1.0615,0.0001,1.856,449.99,-0.36286,160.63,0.24801,0.623,0.000116,-0.39384,1.9038,0.068588,0.020439,2506500000.0,48.164,-0.002272,78643.0,112.36,1021.9,11.481,1.1573,0.002995,1.8192,1096.8,300410000000000.0,2042300000.0,0.0855,4.6312,1683.1,9833.6,,0.51041,4.0322,247790000000.0,69.264,5494800.0,1239.0,534930000.0,5.3086,182.59,829.17,5.2319,0.010301,3640.8,112.12,-0.43442,11.161,3755.7,0.99926,53382000000.0,1.3867,-0.001878,58.794,75657.0,187.24,1258.9,0.16334,0.055398,0.020002,795640000.0,0.16253,-22.189,2.0655,0.43088,-10.741,81606.0,1.194,198040000000000.0,2017.1,0.46357
1,0.12965,0.37348,1763.0,0.72884,0.33247,-1.2631,875.55,554370.0,595570000000000.0,934.43,1.8979,4905100000.0,0.28471,2.1387,-0.034328,35.223,6.5873,12.734,29.59,4.1639,31915.0,3.1158,109.43,-0.8522,991.37,4700100000.0,1618200000000.0,967810.0,1.0215,2.9617,0.81031,415570.0,384720.0,0.002243,6712900000000000.0,228.59,33.952,1.4938,2067.5,-0.002343,32.772,0.092283,6.5363,2.0773,0.046237,4.459,-0.84092,4.4473,-1.0012,0.00375,99.647,8146.8,22.504,153.4,0.43076,0.74301,-4.7e-05,-0.11692,1.6544,0.46744,0.12965,444280000.0,38.506,0.39622,74296.0,93.629,-15.691,30.655,1.2311,1.0044,2.2484,780.87,121360000000000.0,348820000000.0,-0.000792,6.9993,2451.6,10483.0,-5.3544,0.067286,5.4044,246260000000.0,810.3,860670.0,2165.2,271150000.0,10.232,515.41,262.71,5.6357,0.37422,420.16,116.23,1.2698,0.78619,1207.0,1.0007,20650000000000.0,1.2888,0.24885,9.9857,16323.0,244.46,647.58,0.25382,0.0088,0.018479,112060000.0,0.81528,-1.6342,1.5736,-1.0712,11.832,90114.0,1.1507,4.388e+16,6638.9,0.28125
2,0.12019,0.44521,736.26,0.04615,0.29605,0.31665,2659.5,317140.0,397780000000000.0,131.81,-0.48404,3800000.0,0.37173,0.40245,0.015119,1991.6,6.005,0.9919,11.949,888.07,887.7,3.5237,108.14,-1.6542,528.14,2463600000000.0,9005900000.0,7259.3,1.0074,2.6123,1.0625,-208010.0,65708.0,0.001391,81298000000000.0,-84.032,,1.7556,4729.2,0.003527,861.66,0.90267,9.3934,58.785,0.007244,5.6645,-0.62747,6.5806,-1.1282,0.3865,56.547,125.36,12.703,147.38,0.41437,0.51998,0.000857,-0.12065,5.4115,0.77253,0.12885,5664900000.0,50.894,0.37871,80045.0,65.224,780.21,14.125,1.1657,-0.001285,1.0663,432.01,-595310000000.0,1383400000000.0,-0.006236,5.6052,866.39,1065.2,-1.4805,0.064203,3.0197,168440000000.0,212.83,7891000.0,277.16,40479000000.0,1.117,393.51,8859.1,8.8098,0.40535,393.65,305.14,1.3266,30.852,2803.7,0.99925,4722600000000.0,1.5003,0.49338,37.047,139070.0,2464.0,4724.8,0.29916,0.093046,0.018516,65193000.0,0.81831,-32.78,2.1364,-1.9312,-3.2804,37739.0,1.1548,171810000000000.0,5844.0,0.13797
3,0.054008,0.39596,996.14,0.85934,0.36678,-0.1706,386.56,325680.0,-34322000000000.0,-26.473,-2.1293,4675400000.0,0.26659,1.0968,-0.083571,1987.5,6.8989,11.123,23.164,133.57,-815.32,2.7295,82.011,3.8374,304.57,-13159000000.0,-8324500000.0,2297700.0,0.099522,4.9249,0.6599,48773.0,199560.0,-0.000621,3.9938e+16,1400.4,503.66,1.9131,2811.6,0.002362,278.2,0.98919,7.4646,33.624,0.025889,4.1921,0.096508,4.8219,-0.010526,0.34624,0.92399,1392.1,1.3866,144.19,0.1475,0.26398,-0.000571,-0.14971,4.8384,0.35774,0.12486,-92544000.0,18.472,0.045596,86713.0,1.0519,1447.8,28.947,1.3372,1.0041,1.4836,483.92,4156700000000000.0,11254000000.0,0.010409,7.268,13656.0,1893.2,-2.3828,0.12858,1.4494,268100000000.0,66.599,-733900.0,843.42,12167000000.0,3.6871,243.59,1199.7,4.5092,0.37703,-36.886,11.401,0.97205,23.642,1882.7,0.99922,15680000000000.0,1.0456,0.54818,27.665,813040.0,1332.0,359.17,0.026553,0.66862,-0.00126,1995100000.0,0.86559,-2.4162,1.5199,-0.011633,1.384,26849.0,1.149,2.1388e+17,6173.3,0.3291
4,0.079947,-0.006919,10574.0,0.34845,0.45008,-1.842,3027.0,428150.0,929150000000.0,5999.4,1.8738,1857300000.0,0.32259,2.2115,-0.1072,661.07,6.5391,6.8495,7.258,468.74,10316.0,0.79638,111.52,1.4098,429.79,4121700000000.0,-394570000.0,7119.4,1.0277,16.121,0.99451,372800.0,12042.0,-0.000659,186920000000000.0,-129.58,933.15,2.7392,490.84,0.012809,5.2358,0.009404,1.3044,0.29176,0.001332,4.0513,0.84652,4.9508,-0.6704,0.43678,36.11,961.45,0.47044,108.67,0.25482,0.27473,-0.001589,-0.99328,2.5776,0.90362,0.24753,1251000000.0,1.1726,0.18456,7429.8,88.79,654.25,27.426,1.0843,-0.004769,1.2764,208.61,382340000000000.0,6267300000000.0,-0.004554,7.0114,45952.0,3695.5,-3.2187,0.50229,6.9219,148730000000.0,9.9686,-35362.0,854.84,26039000000.0,13.943,14.552,675.62,6.8424,0.37685,3452.1,35.434,0.94128,0.95142,-56.004,0.99969,20097000000000.0,1.2255,0.71393,14.182,4362.6,12.007,10653.0,0.1653,0.22709,0.020485,-10504000.0,0.2519,-18.63,3.7387,0.75708,-4.9405,50336.0,1.2488,2.1513e+17,2250.1,0.33796


In [5]:
# Model inputs: every training column whose name differs from the label name.
features = train_data.columns[train_data.columns != target].tolist()

len(features)

118

# Missing Values

In [6]:
# Per-row count of missing inputs, added to both splits as an extra feature.
# NOTE: this has to run before the imputation cell; once the gaps are filled
# every count would be 0.
# The count is taken over the columns in `features` other than `n_missing`
# itself, and the name is appended at most once, so re-running this cell
# cannot leave a duplicate `n_missing` entry in `features`.
counted_cols = [col for col in features if col != 'n_missing']
train_data['n_missing'] = train_data[counted_cols].isna().sum(axis=1)
test_data['n_missing'] = test_data[counted_cols].isna().sum(axis=1)

if 'n_missing' not in features:
    features.append('n_missing')

In [7]:
# Per-column fill values: the first row of `mode()` computed on the training
# split only. The same values are then used to fill gaps in both splits.
# NOTE(review): most inputs look continuous, where the mode can be a fairly
# arbitrary value - confirm this is preferred over e.g. the median.
modes = train_data[features].mode().iloc[0]

for frame in (train_data, test_data):
    frame[features] = frame[features].fillna(modes)

# Scaler 
## Standardize features by removing the mean and scaling to unit variance

In [8]:
# Summary statistics of the training split at this point (after imputation,
# before the scaling cell further down).
train_data.describe()

Unnamed: 0,f1,f2,f3,f4,f5,f6,f7,f8,f9,f10,f11,f12,f13,f14,f15,f16,f17,f18,f19,f20,f21,f22,f23,f24,f25,f26,f27,f28,f29,f30,f31,f32,f33,f34,f35,f36,f37,f38,f39,f40,f41,f42,f43,f44,f45,f46,f47,f48,f49,f50,f51,f52,f53,f54,f55,f56,f57,f58,f59,f60,f61,f62,f63,f64,f65,f66,f67,f68,f69,f70,f71,f72,f73,f74,f75,f76,f77,f78,f79,f80,f81,f82,f83,f84,f85,f86,f87,f88,f89,f90,f91,f92,f93,f94,f95,f96,f97,f98,f99,f100,f101,f102,f103,f104,f105,f106,f107,f108,f109,f110,f111,f112,f113,f114,f115,f116,f117,f118,claim,n_missing
count,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0
mean,0.090361,0.348394,4024.055132,0.200181,0.305243,-0.088305,1629.175187,372787.236353,1808771838939572.0,5254.808445,0.736882,1834241701.218232,0.248605,7.049095,0.020712,468.367326,6.893046,4.436377,22.290407,200.682202,62023.044055,2.269389,87.410766,0.355247,424.728923,3603114521180.719,1267294935213.1648,2244633.225811,0.339991,7.925109,0.404137,134055.630828,368534.059121,-2.1e-05,2.8979198044250788e+16,180.320106,415.657405,1.763374,1966.065066,0.369676,468.807788,0.369887,6.941763,29.499724,0.013411,4.277867,0.045345,6.437406,-0.434872,0.300471,55.947877,2669.793419,11.987613,137.23164,0.251903,0.420606,-7e-06,-0.340153,3.040365,0.552924,0.271104,2446945627.809109,37.854061,0.21109,48344.311096,84.365153,618.529091,28.707851,1.211459,0.427657,1.536854,492.588334,800892494176804.6,1139692875580.188,0.386662,6.878436,10734.007629,10532.830538,1.694608,0.195104,3.204542,105531433077.35307,150.524687,6285035.241819,645.22668,33631074571.287983,26.370013,206.524901,3907.128556,6.789791,0.36893,4806.106043,131.772851,0.828505,13.071178,3964.292198,0.999974,14102679069790.107,1.677109,0.435189,20.051832,332492.51532,582.321467,3810.514783,0.17679,0.160179,0.014146,1670617523.666425,0.396502,-19.848534,2.066367,25.16343,1.881166,63877.509304,1.208017,4.231004897803466e+16,4056.395922,0.566662,0.498492,1.900768
std,0.043234,0.146345,6373.280131,0.210931,0.144199,2.110587,1267.576277,344359.156116,2316641258090114.5,10002.649732,1.484562,2109596231.937814,0.100553,6.580398,0.101573,652.709565,1.701868,3.892431,14.544017,279.788018,89441.64622,0.888829,37.098915,1.633755,321.372738,5876021052637.763,1632665256904.7603,2287506.502147,0.438771,5.901396,0.779315,202028.777759,466337.7829,0.001527,3.542856997624216e+16,697.293529,321.113451,0.585725,1946.22462,0.44555,639.491638,0.412099,1.817529,28.616772,0.014543,1.130644,0.682988,2.139761,0.726995,0.144978,87.63484,2507.208501,21.542606,15.950591,0.109584,0.329655,0.001514,0.291728,1.725701,0.26821,0.254884,2885081672.340553,35.33086,0.223652,35935.556645,35.797764,529.269877,27.230853,0.128495,0.494907,0.442649,384.478533,1182224177820340.0,2073347598107.0608,0.448312,1.694906,14985.537478,10333.002074,9.073303,0.161204,1.995898,98164820020.94173,226.742991,8782953.081941,583.913162,31661361589.182167,25.31387,157.030627,3593.52889,3.163621,0.14621,8374.192894,109.234026,0.709138,12.641935,6448.930279,0.001523,16277984705473.04,0.707833,0.29062,19.501192,336329.810301,896.177006,6626.657925,0.122707,0.140554,0.016133,1860679288.49709,0.296106,18.438926,0.890794,46.30509,10.062351,91861.742362,0.114217,6.686964578071474e+16,3221.481924,0.40933,0.499998,2.026843
min,-0.14991,-0.019044,-9421.7,-0.082122,-0.00699,-12.791,-224.8,-29843.0,-1153300000000000.0,-26404.0,-8.0863,-408100000.0,-0.1038,-0.85376,-0.33566,-116.88,-3.6645,-0.066527,-4.4225,-58.834,-84079.0,-6.0094,-20.514,-5.7352,-71.502,-695670000000.0,-938420000000.0,-470600.0,-0.005659,-0.52999,-3.8135,-349650.0,-605590.0,-0.003881,-2.0689e+16,-2414.3,-40.881,0.5461,-433.7,-0.007641,-107.38,-0.05771,-4.4214,-8.1892,-0.01026,-3.5615,-2.6172,1.0564,-1.7306,-0.006924,-131.95,-721.61,-26.637,98.868,-0.033956,-0.052052,-0.003899,-1.179,0.68364,-0.15099,-0.19692,-1825600000.0,-11.941,-0.13478,-3302.6,-22.021,-68.682,-2.1598,0.84922,-0.009201,0.7742,-64.669,-280280000000000.0,-610670000000.0,-0.013163,-2.9862,-1546.0,-1284.2,-24.288,-0.017615,0.9642,-73457000000.0,-28.752,-2992000.0,-74.545,-5949500000.0,-7.6164,-22.576,-296.78,-0.25757,-0.012238,-12829.0,-12.922,-3.2933,-1.3524,-7764.3,0.9961,-5714600000000.0,0.6082,-0.034559,-4.2949,-227770.0,-222.21,-11581.0,-0.029027,-0.066726,-0.007535,-587700000.0,-0.042355,-105.86,0.27704,-27.691,-26.589,-81977.0,0.90527,-8944400000000000.0,-415.24,-0.15124,0.0,0.0
25%,0.070507,0.28557,428.08,0.036203,0.24232,-1.1112,493.76,93506.0,12498000000000.0,79.6515,0.33885,48386000.0,0.22325,1.5015,-0.03453,11.03,5.9777,1.0315,11.591,5.74185,2732.9,1.8707,76.618,-0.770955,130.52,23613500000.0,29948500000.0,156000.0,0.001604,3.119,-0.012585,12019.0,42375.5,-0.001155,276425000000000.0,-112.86,120.73,1.4109,424.02,0.003143,12.602,0.007002,5.9098,7.0023,0.002052,4.0087,-0.54966,5.0485,-1.0116,0.23275,4.0704,658.815,-0.260535,125.17,0.20397,0.095969,-0.001118,-0.42593,1.7843,0.37489,0.044925,280535000.0,8.95955,0.036771,10700.0,74.873,149.05,7.1412,1.1392,-0.000679,1.2191,155.48,5978100000000.0,2238900000.0,0.004589,5.9342,355.94,2271.4,-3.90655,0.07345,1.5441,22831000000.0,4.649,65718.0,146.605,2849250000.0,6.1885,67.4745,984.79,4.6701,0.33482,79.571,39.678,0.583905,2.4908,209.89,0.99882,184380000000.0,1.2408,0.2319,4.2411,59659.0,14.035,174.85,0.068834,0.06431,0.001568,64900000.0,0.11827,-28.472,1.4906,-0.590745,-4.3656,2596.75,1.1473,245155000000000.0,1335.9,0.28027,0.0,0.0
50%,0.090477,0.39149,1305.3,0.13761,0.32808,-0.41539,1489.3,282540.0,548600000000000.0,1012.8,1.1868,970510000.0,0.27738,5.4647,0.011648,96.403,6.8186,3.9455,19.552,41.941,19909.0,2.276,96.99,1.0971,378.62,844330000000.0,341940000000.0,1506200.0,0.081058,6.9148,0.66941,52011.0,178260.0,-4.5e-05,1.0372e+16,41.275,364.64,1.5486,1362.8,0.087219,124.8,0.097103,6.7247,20.462,0.0087,4.2931,0.17697,6.1363,-0.73288,0.32665,17.711,1953.3,2.0946,133.26,0.27011,0.41124,-2.6e-05,-0.239,2.4384,0.60816,0.17023,1365400000.0,27.913,0.1393,75557.0,92.734,505.64,20.659,1.1799,0.004376,1.4405,440.31,272900000000000.0,106950000000.0,0.091207,6.8141,2699.8,7539.8,0.95583,0.16104,2.5843,82957000000.0,34.656,1045600.0,506.92,26284000000.0,18.804,176.87,2907.4,6.2836,0.41187,1012.8,103.56,1.0517,9.583,1054.3,1.0,7515600000000.0,1.396,0.39569,14.031,221960.0,102.99,1012.9,0.15299,0.12237,0.008063,866290000.0,0.34296,-14.98,1.6557,1.8194,1.0471,20453.0,1.1761,1.4009e+16,3295.5,0.48004,0.0,1.0
75%,0.11551,0.46139,4327.0,0.29347,0.41155,0.904285,2475.5,554590.0,3049300000000000.0,5561.4,1.5012,3431100000.0,0.30951,10.623,0.07019,747.78,7.5272,6.4257,32.092,305.59,90431.0,2.6836,111.05,1.2425,688.605,4180300000000.0,2097600000000.0,3956400.0,0.90219,10.848,0.95348,168900.0,549970.0,0.00114,5.1813e+16,212.83,679.28,1.9714,2906.6,0.90732,720.045,0.89859,7.7407,43.766,0.02207,4.6395,0.60004,7.5082,0.021737,0.40926,70.031,3904.2,14.297,151.35,0.32963,0.724005,0.001142,-0.13947,3.8645,0.78087,0.50487,3565000000.0,55.775,0.31191,80282.0,104.95,964.28,42.469,1.2409,0.99886,1.7404,744.77,1069500000000000.0,727245000000.0,0.90985,7.5072,13373.0,14358.5,6.5625,0.25849,4.0858,156650000000.0,208.59,12561000.0,990.46,54244000000.0,38.9675,330.04,5770.6,8.4687,0.47553,5487.9,203.63,1.2949,20.135,4575.0,1.0011,25344000000000.0,1.7519,0.61042,30.024,514360.0,726.53,4115.9,0.2832,0.22882,0.023076,2957950000.0,0.61774,-5.44415,2.4794,20.8935,7.2235,95024.0,1.2401,5.17395e+16,6290.3,0.76506,1.0,3.0
max,0.41517,0.51899,39544.0,1.3199,0.55475,11.202,5426.6,1913700.0,1.0424e+16,85622.0,8.6505,8473600000.0,0.58977,36.951,0.50963,2335.4,19.189,25.458,80.154,1032.2,523590.0,11.306,160.45,6.96,1220.8,25805000000000.0,5447100000000.0,8960600.0,1.0958,36.744,3.7531,1154000.0,2873200.0,0.003919,1.5905e+17,3728.5,1218.0,4.084,11195.0,1.0435,2335.4,1.0287,19.978,180.97,0.066794,10.066,3.0153,16.87,1.799,0.54832,503.17,14553.0,131.75,175.16,0.49607,1.1866,0.003906,0.071947,7.7346,1.0141,1.0751,18289000000.0,210.43,1.352,91871.0,161.75,1996.7,167.66,1.8917,1.0179,3.7999,1453.9,6087900000000000.0,6694600000000.0,1.0304,18.366,56889.0,47503.0,43.552,1.3572,7.2883,738970000000.0,950.53,34511000.0,2307.5,130970000000.0,147.08,618.13,20675.0,21.994,0.51629,55362.0,448.78,3.9251,65.317,38704.0,1.0039,71701000000000.0,4.1691,1.0613,105.62,2337900.0,3260.9,46876.0,0.49156,0.84855,0.089019,7556500000.0,1.1236,1.6134,4.5659,217.84,47.757,526050.0,1.8867,3.2499e+17,13151.0,2.7436,1.0,14.0


In [9]:
# Row-wise summary statistics appended to both splits as extra features.
# They are computed over the columns currently listed in `features`, which at
# this point have been imputed but not yet scaled.
row_stats = ('min', 'max', 'mean', 'std')
row_stat_cols = [stat + '_row' for stat in row_stats]

# Leave the statistic columns themselves out of the inputs, so that running
# this cell again recomputes the same values instead of folding earlier
# results back into the statistics.
stat_inputs = [col for col in features if col not in row_stat_cols]

for frame in (train_data, test_data):
    inputs = frame[stat_inputs]
    for stat, stat_col in zip(row_stats, row_stat_cols):
        # Dispatches to DataFrame.min / .max / .mean / .std along each row.
        frame[stat_col] = getattr(inputs, stat)(axis=1)

# Extend the existing list object in place, adding only names that are not
# already present (guards against duplicates on re-run).
features += [col for col in row_stat_cols if col not in features]

In [10]:
# Fit the standardiser on the training split only, then apply the fitted
# transformation to both splits so the test data is scaled with the training
# statistics.
scaler = preprocessing.StandardScaler().fit(train_data[features])

train_data[features] = scaler.transform(train_data[features])
test_data[features] = scaler.transform(test_data[features])

In [11]:
# Summary statistics again, now after scaling the columns in `features`
# (the `claim` column is not in `features`, so it is left unscaled).
train_data.describe()

Unnamed: 0,f1,f2,f3,f4,f5,f6,f7,f8,f9,f10,f11,f12,f13,f14,f15,f16,f17,f18,f19,f20,f21,f22,f23,f24,f25,f26,f27,f28,f29,f30,f31,f32,f33,f34,f35,f36,f37,f38,f39,f40,f41,f42,f43,f44,f45,f46,f47,f48,f49,f50,f51,f52,f53,f54,f55,f56,f57,f58,f59,f60,f61,f62,f63,f64,f65,f66,f67,f68,f69,f70,f71,f72,f73,f74,f75,f76,f77,f78,f79,f80,f81,f82,f83,f84,f85,f86,f87,f88,f89,f90,f91,f92,f93,f94,f95,f96,f97,f98,f99,f100,f101,f102,f103,f104,f105,f106,f107,f108,f109,f110,f111,f112,f113,f114,f115,f116,f117,f118,claim,n_missing,min_row,max_row,mean_row,std_row
count,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0
mean,-0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,0.0,-0.0,-0.0,-0.0,0.0,0.0,0.0,-0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,-0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,0.0,0.0,-0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,0.0,-0.0,0.0,0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,0.0,-0.0,0.0,-0.0,-0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,0.0,0.0,0.0,0.0,0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,0.0,0.498492,-0.0,0.0,0.0,0.0,-0.0
std,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,0.499998,1.000001,1.000001,1.000001,1.000001,1.000001
min,-5.557461,-2.510776,-2.109708,-1.338369,-2.165294,-6.018562,-1.462615,-1.169217,-1.278607,-3.165044,-5.943294,-1.062925,-3.504672,-1.20097,-3.508535,-0.896643,-6.203508,-1.156837,-1.836695,-0.927546,-1.633491,-9.314274,-2.90911,-3.727884,-1.544099,-0.731581,-1.350991,-1.186984,-0.787769,-1.432729,-5.411982,-2.394242,-2.088882,-2.527294,-1.401926,-3.720989,-1.421736,-2.078237,-1.233037,-0.846858,-0.90101,-1.037609,-6.251989,-1.317023,-1.627658,-6.933543,-3.898378,-2.514771,-1.782308,-2.120287,-2.144101,-1.352662,-1.792941,-2.405156,-2.608592,-1.433796,-2.571015,-2.875438,-1.365663,-2.624485,-1.836224,-1.480911,-1.409394,-1.546464,-1.43721,-2.971867,-1.298414,-1.133555,-2.819083,-0.882708,-1.722933,-1.449386,-0.914525,-0.844221,-0.891845,-5.820171,-0.819458,-1.143621,-2.863634,-1.319568,-1.122474,-1.823347,-0.790661,-1.056255,-1.23267,-1.250123,-1.342601,-1.458958,-1.169856,-2.227626,-2.606991,-2.105888,-1.324632,-5.812419,-1.140932,-1.818689,-2.544358,-1.217429,-1.510115,-1.61637,-1.248475,-1.665814,-0.897738,-2.322667,-1.677296,-1.614357,-1.343928,-1.213707,-1.482096,-4.66467,-2.008688,-1.141439,-2.829377,-1.587762,-2.650626,-0.766483,-1.388069,-1.753845,0.0,-0.937798,-33.202115,-0.942605,-1.237469,-0.960825
25%,-0.459215,-0.42929,-0.564227,-0.777402,-0.43636,-0.48465,-0.895738,-0.811018,-0.775379,-0.517379,-0.268114,-0.84654,-0.252153,-0.843049,-0.543867,-0.700675,-0.537848,-0.874744,-0.735657,-0.696743,-0.662892,-0.448556,-0.290919,-0.689334,-0.915476,-0.609171,-0.757869,-0.913062,-0.771216,-0.814403,-0.534729,-0.604056,-0.699404,-0.742599,-0.810159,-0.420455,-0.918453,-0.601775,-0.792327,-0.822654,-0.713389,-0.880578,-0.567784,-0.786163,-0.781074,-0.238066,-0.871179,-0.649094,-0.793305,-0.467113,-0.591974,-0.802079,-0.568555,-0.756188,-0.437411,-0.984778,-0.73416,-0.294029,-0.727858,-0.663784,-0.88738,-0.750901,-0.817827,-0.779418,-1.047551,-0.265161,-0.887032,-0.791994,-0.562346,-0.865489,-0.717846,-0.876794,-0.672389,-0.548608,-0.852247,-0.557103,-0.692539,-0.799519,-0.617323,-0.754662,-0.831928,-0.842466,-0.643353,-0.708113,-0.853932,-0.972221,-0.797252,-0.885499,-0.813223,-0.670021,-0.233295,-0.564417,-0.843097,-0.344926,-0.836928,-0.582175,-0.757945,-0.855039,-0.616401,-0.699504,-0.810758,-0.811209,-0.634123,-0.548643,-0.87978,-0.682077,-0.779644,-0.862974,-0.939638,-0.467677,-0.646353,-0.556185,-0.620806,-0.667098,-0.53159,-0.629058,-0.844486,-0.699659,0.0,-0.937798,0.171099,-0.751834,-0.760044,-0.760145
50%,0.002691,0.294481,-0.426587,-0.296642,0.158375,-0.154973,-0.110349,-0.262073,-0.543965,-0.424089,0.303065,-0.40943,0.286171,-0.240775,-0.089238,-0.569878,-0.043744,-0.126111,-0.188284,-0.567363,-0.470855,0.007438,0.258208,0.454079,-0.143475,-0.469499,-0.566776,-0.322812,-0.590133,-0.171198,0.340393,-0.406104,-0.408018,-0.01562,-0.525203,-0.199407,-0.158877,-0.366681,-0.309967,-0.633952,-0.53794,-0.66194,-0.119428,-0.315819,-0.323899,0.013473,0.19272,-0.140719,-0.409918,0.180571,-0.436321,-0.285774,-0.45923,-0.248997,0.166146,-0.028412,-0.012891,0.346738,-0.348824,0.205944,-0.395764,-0.374875,-0.281371,-0.32099,0.757264,0.233781,-0.213292,-0.295579,-0.245603,-0.855275,-0.217675,-0.135972,-0.44661,-0.498104,-0.659038,-0.037958,-0.536131,-0.289658,-0.081423,-0.211312,-0.310758,-0.229965,-0.511014,-0.596546,-0.236862,-0.232052,-0.298888,-0.188848,-0.278203,-0.160004,0.293687,-0.452976,-0.258279,0.314742,-0.275921,-0.451237,0.017042,-0.404662,-0.39714,-0.135915,-0.308742,-0.328643,-0.534863,-0.422176,-0.193954,-0.268999,-0.377026,-0.432277,-0.180821,0.264036,-0.461012,-0.504136,-0.08289,-0.472716,-0.279439,-0.423227,-0.236195,-0.211618,0.0,-0.44442,0.200782,-0.273539,-0.28115,-0.275367
75%,0.581704,0.772122,0.047534,0.442275,0.737229,0.470291,0.667672,0.527945,0.535486,0.030651,0.514845,0.75695,0.605704,0.543114,0.487117,0.428081,0.372623,0.511075,0.673926,0.374955,0.317615,0.466019,0.637195,0.543076,0.821091,0.098227,0.508558,0.748312,1.281305,0.495288,0.704905,0.172472,0.389066,0.760173,0.644503,0.046623,0.820964,0.35516,0.483261,1.206697,0.39287,1.282951,0.439573,0.498529,0.595436,0.319847,0.81216,0.500427,0.628078,0.750381,0.160702,0.492343,0.107201,0.885131,0.709293,0.920352,0.758826,0.687912,0.477566,0.849879,0.917148,0.38753,0.507232,0.450789,0.888749,0.575032,0.65326,0.505352,0.229123,1.154163,0.459838,0.655906,0.227205,-0.198929,1.167018,0.370973,0.176103,0.370238,0.536507,0.393202,0.441535,0.520742,0.256084,0.714562,0.591241,0.651044,0.497652,0.786567,0.518563,0.530692,0.729088,0.081416,0.657828,0.657693,0.558761,0.094699,0.739489,0.690585,0.105662,0.602955,0.511362,0.540742,0.160915,0.046084,0.867189,0.48836,0.553541,0.691862,0.747158,0.781195,0.463669,-0.092213,0.530923,0.339059,0.280898,0.141013,0.69344,0.484691,1.0,0.542337,0.200841,0.324125,0.358762,0.346781
max,7.512842,1.165713,5.573263,5.308475,1.730304,5.349369,2.995817,4.474728,3.718846,8.034594,5.330612,3.147219,3.392896,4.54409,4.813467,2.860436,7.22498,5.400644,3.978517,2.971958,5.16054,10.166882,1.968771,4.042685,2.477097,3.77839,2.560113,2.935935,1.72256,4.883405,4.297318,5.048513,5.370929,2.579437,3.671355,5.088505,2.498628,3.961975,4.741971,1.512342,2.91887,1.598676,7.172511,5.293062,3.670775,5.119325,4.348474,4.875592,3.07275,1.709561,5.103248,4.739619,5.55933,2.377867,2.228132,2.323621,2.584056,1.412617,2.720191,1.719458,3.154362,5.491027,4.884569,5.101268,1.211244,2.161724,2.603911,5.102749,5.293903,1.192635,5.112514,2.500301,4.472088,2.679199,1.435915,6.777705,3.079971,3.577875,4.61325,7.208863,2.046077,6.45281,3.528249,3.213723,2.846783,3.074377,4.768534,2.621179,4.666132,4.805954,1.007865,6.03711,2.902093,4.366706,4.132742,5.386897,2.578443,3.53842,3.520593,2.154401,4.387845,5.962625,2.988896,6.498828,2.565212,4.897544,4.641063,3.163299,2.455534,1.163948,2.805962,4.161026,4.559159,5.031178,5.942048,4.227331,2.823113,5.318297,1.0,5.9695,0.200841,4.105335,5.170658,4.360322


## Setting Parameters

In [12]:
# Keyword arguments for XGBClassifier.
xgb_params = dict(
    n_estimators=1000,
    reg_lambda=3,
    reg_alpha=26,
    subsample=0.6000000000000001,
    colsample_bytree=0.6000000000000001,
    max_depth=9,
    min_child_weight=5,
    gamma=13.054739572819486,
    learning_rate=0.02,
    tree_method='gpu_hist',
    booster='gbtree',
)

# Keyword arguments presumably meant for LGBMClassifier (not used in this cell).
lgbm_params = dict(
    objective="binary",
    learning_rate=0.01,
    n_estimators=1000,
    num_leaves=184,
    min_child_samples=63,
    feature_fraction=0.6864594334728974,
    bagging_fraction=0.9497327922401265,
    bagging_freq=1,
    reg_alpha=19,
    reg_lambda=19,
)

# Keyword arguments presumably meant for CatBoostClassifier (not used in this cell).
# NOTE(review): `od_wait` (1144) is larger than `iterations` (1000) - confirm
# that is intended.
catb_params = dict(
    iterations=1000,
    objective='CrossEntropy',
    bootstrap_type='Bernoulli',
    od_wait=1144,
    learning_rate=0.023575206684596582,
    reg_lambda=36.30433203563295,
    random_strength=43.75597655616195,
    depth=7,
    min_data_in_leaf=11,
    leaf_estimation_iterations=1,
    subsample=0.8227911142845009,
    devices='0',
    verbose=0,
)

# Cross-Validation and Model Training

### XGBClassifier Model

In [13]:
# Instantiate the XGBoost classifier with the hyperparameters from xgb_params.
model = XGBClassifier(**xgb_params)
# Bare expression: shows the estimator's repr as the cell output.
model

XGBClassifier(base_score=None, booster='gbtree', colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=0.6000000000000001,
              gamma=13.054739572819486, gpu_id=None, importance_type='gain',
              interaction_constraints=None, learning_rate=0.02,
              max_delta_step=None, max_depth=9, min_child_weight=5, missing=nan,
              monotone_constraints=None, n_estimators=1000, n_jobs=None,
              num_parallel_tree=None, random_state=None, reg_alpha=26,
              reg_lambda=3, scale_pos_weight=None, subsample=0.6000000000000001,
              tree_method='gpu_hist', validate_parameters=None, verbosity=None)

In [14]:
# Build the modelling inputs used by every cross-validation cell below.
# Both frames are selected with the same `features` list so that train and
# test are guaranteed to share the same columns in the same order; the
# imputer later converts them to plain arrays, where only position matters.
X = train_data[features].copy()
y = TARGET
X_test = test_data[features].copy()

In [15]:
# Summary statistics of the training feature matrix.
# (y is already bound to TARGET in the previous cell, so it is not reassigned here.)
X.describe()

Unnamed: 0,f1,f2,f3,f4,f5,f6,f7,f8,f9,f10,f11,f12,f13,f14,f15,f16,f17,f18,f19,f20,f21,f22,f23,f24,f25,f26,f27,f28,f29,f30,f31,f32,f33,f34,f35,f36,f37,f38,f39,f40,f41,f42,f43,f44,f45,f46,f47,f48,f49,f50,f51,f52,f53,f54,f55,f56,f57,f58,f59,f60,f61,f62,f63,f64,f65,f66,f67,f68,f69,f70,f71,f72,f73,f74,f75,f76,f77,f78,f79,f80,f81,f82,f83,f84,f85,f86,f87,f88,f89,f90,f91,f92,f93,f94,f95,f96,f97,f98,f99,f100,f101,f102,f103,f104,f105,f106,f107,f108,f109,f110,f111,f112,f113,f114,f115,f116,f117,f118,n_missing,min_row,max_row,mean_row,std_row
count,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0,957919.0
mean,-0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,0.0,-0.0,-0.0,-0.0,0.0,0.0,0.0,-0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,-0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,0.0,0.0,-0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,0.0,-0.0,0.0,0.0,-0.0,0.0,0.0,0.0,-0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,0.0,-0.0,0.0,-0.0,-0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.0,0.0,0.0,0.0,0.0,-0.0,0.0,0.0,0.0,0.0,0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,-0.0,0.0,0.0,-0.0,0.0,0.0,0.0,-0.0
std,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001,1.000001
min,-5.557461,-2.510776,-2.109708,-1.338369,-2.165294,-6.018562,-1.462615,-1.169217,-1.278607,-3.165044,-5.943294,-1.062925,-3.504672,-1.20097,-3.508535,-0.896643,-6.203508,-1.156837,-1.836695,-0.927546,-1.633491,-9.314274,-2.90911,-3.727884,-1.544099,-0.731581,-1.350991,-1.186984,-0.787769,-1.432729,-5.411982,-2.394242,-2.088882,-2.527294,-1.401926,-3.720989,-1.421736,-2.078237,-1.233037,-0.846858,-0.90101,-1.037609,-6.251989,-1.317023,-1.627658,-6.933543,-3.898378,-2.514771,-1.782308,-2.120287,-2.144101,-1.352662,-1.792941,-2.405156,-2.608592,-1.433796,-2.571015,-2.875438,-1.365663,-2.624485,-1.836224,-1.480911,-1.409394,-1.546464,-1.43721,-2.971867,-1.298414,-1.133555,-2.819083,-0.882708,-1.722933,-1.449386,-0.914525,-0.844221,-0.891845,-5.820171,-0.819458,-1.143621,-2.863634,-1.319568,-1.122474,-1.823347,-0.790661,-1.056255,-1.23267,-1.250123,-1.342601,-1.458958,-1.169856,-2.227626,-2.606991,-2.105888,-1.324632,-5.812419,-1.140932,-1.818689,-2.544358,-1.217429,-1.510115,-1.61637,-1.248475,-1.665814,-0.897738,-2.322667,-1.677296,-1.614357,-1.343928,-1.213707,-1.482096,-4.66467,-2.008688,-1.141439,-2.829377,-1.587762,-2.650626,-0.766483,-1.388069,-1.753845,-0.937798,-33.202115,-0.942605,-1.237469,-0.960825
25%,-0.459215,-0.42929,-0.564227,-0.777402,-0.43636,-0.48465,-0.895738,-0.811018,-0.775379,-0.517379,-0.268114,-0.84654,-0.252153,-0.843049,-0.543867,-0.700675,-0.537848,-0.874744,-0.735657,-0.696743,-0.662892,-0.448556,-0.290919,-0.689334,-0.915476,-0.609171,-0.757869,-0.913062,-0.771216,-0.814403,-0.534729,-0.604056,-0.699404,-0.742599,-0.810159,-0.420455,-0.918453,-0.601775,-0.792327,-0.822654,-0.713389,-0.880578,-0.567784,-0.786163,-0.781074,-0.238066,-0.871179,-0.649094,-0.793305,-0.467113,-0.591974,-0.802079,-0.568555,-0.756188,-0.437411,-0.984778,-0.73416,-0.294029,-0.727858,-0.663784,-0.88738,-0.750901,-0.817827,-0.779418,-1.047551,-0.265161,-0.887032,-0.791994,-0.562346,-0.865489,-0.717846,-0.876794,-0.672389,-0.548608,-0.852247,-0.557103,-0.692539,-0.799519,-0.617323,-0.754662,-0.831928,-0.842466,-0.643353,-0.708113,-0.853932,-0.972221,-0.797252,-0.885499,-0.813223,-0.670021,-0.233295,-0.564417,-0.843097,-0.344926,-0.836928,-0.582175,-0.757945,-0.855039,-0.616401,-0.699504,-0.810758,-0.811209,-0.634123,-0.548643,-0.87978,-0.682077,-0.779644,-0.862974,-0.939638,-0.467677,-0.646353,-0.556185,-0.620806,-0.667098,-0.53159,-0.629058,-0.844486,-0.699659,-0.937798,0.171099,-0.751834,-0.760044,-0.760145
50%,0.002691,0.294481,-0.426587,-0.296642,0.158375,-0.154973,-0.110349,-0.262073,-0.543965,-0.424089,0.303065,-0.40943,0.286171,-0.240775,-0.089238,-0.569878,-0.043744,-0.126111,-0.188284,-0.567363,-0.470855,0.007438,0.258208,0.454079,-0.143475,-0.469499,-0.566776,-0.322812,-0.590133,-0.171198,0.340393,-0.406104,-0.408018,-0.01562,-0.525203,-0.199407,-0.158877,-0.366681,-0.309967,-0.633952,-0.53794,-0.66194,-0.119428,-0.315819,-0.323899,0.013473,0.19272,-0.140719,-0.409918,0.180571,-0.436321,-0.285774,-0.45923,-0.248997,0.166146,-0.028412,-0.012891,0.346738,-0.348824,0.205944,-0.395764,-0.374875,-0.281371,-0.32099,0.757264,0.233781,-0.213292,-0.295579,-0.245603,-0.855275,-0.217675,-0.135972,-0.44661,-0.498104,-0.659038,-0.037958,-0.536131,-0.289658,-0.081423,-0.211312,-0.310758,-0.229965,-0.511014,-0.596546,-0.236862,-0.232052,-0.298888,-0.188848,-0.278203,-0.160004,0.293687,-0.452976,-0.258279,0.314742,-0.275921,-0.451237,0.017042,-0.404662,-0.39714,-0.135915,-0.308742,-0.328643,-0.534863,-0.422176,-0.193954,-0.268999,-0.377026,-0.432277,-0.180821,0.264036,-0.461012,-0.504136,-0.08289,-0.472716,-0.279439,-0.423227,-0.236195,-0.211618,-0.44442,0.200782,-0.273539,-0.28115,-0.275367
75%,0.581704,0.772122,0.047534,0.442275,0.737229,0.470291,0.667672,0.527945,0.535486,0.030651,0.514845,0.75695,0.605704,0.543114,0.487117,0.428081,0.372623,0.511075,0.673926,0.374955,0.317615,0.466019,0.637195,0.543076,0.821091,0.098227,0.508558,0.748312,1.281305,0.495288,0.704905,0.172472,0.389066,0.760173,0.644503,0.046623,0.820964,0.35516,0.483261,1.206697,0.39287,1.282951,0.439573,0.498529,0.595436,0.319847,0.81216,0.500427,0.628078,0.750381,0.160702,0.492343,0.107201,0.885131,0.709293,0.920352,0.758826,0.687912,0.477566,0.849879,0.917148,0.38753,0.507232,0.450789,0.888749,0.575032,0.65326,0.505352,0.229123,1.154163,0.459838,0.655906,0.227205,-0.198929,1.167018,0.370973,0.176103,0.370238,0.536507,0.393202,0.441535,0.520742,0.256084,0.714562,0.591241,0.651044,0.497652,0.786567,0.518563,0.530692,0.729088,0.081416,0.657828,0.657693,0.558761,0.094699,0.739489,0.690585,0.105662,0.602955,0.511362,0.540742,0.160915,0.046084,0.867189,0.48836,0.553541,0.691862,0.747158,0.781195,0.463669,-0.092213,0.530923,0.339059,0.280898,0.141013,0.69344,0.484691,0.542337,0.200841,0.324125,0.358762,0.346781
max,7.512842,1.165713,5.573263,5.308475,1.730304,5.349369,2.995817,4.474728,3.718846,8.034594,5.330612,3.147219,3.392896,4.54409,4.813467,2.860436,7.22498,5.400644,3.978517,2.971958,5.16054,10.166882,1.968771,4.042685,2.477097,3.77839,2.560113,2.935935,1.72256,4.883405,4.297318,5.048513,5.370929,2.579437,3.671355,5.088505,2.498628,3.961975,4.741971,1.512342,2.91887,1.598676,7.172511,5.293062,3.670775,5.119325,4.348474,4.875592,3.07275,1.709561,5.103248,4.739619,5.55933,2.377867,2.228132,2.323621,2.584056,1.412617,2.720191,1.719458,3.154362,5.491027,4.884569,5.101268,1.211244,2.161724,2.603911,5.102749,5.293903,1.192635,5.112514,2.500301,4.472088,2.679199,1.435915,6.777705,3.079971,3.577875,4.61325,7.208863,2.046077,6.45281,3.528249,3.213723,2.846783,3.074377,4.768534,2.621179,4.666132,4.805954,1.007865,6.03711,2.902093,4.366706,4.132742,5.386897,2.578443,3.53842,3.520593,2.154401,4.387845,5.962625,2.988896,6.498828,2.565212,4.897544,4.641063,3.163299,2.455534,1.163948,2.805962,4.161026,4.559159,5.031178,5.942048,4.227331,2.823113,5.318297,5.9695,0.200841,4.105335,5.170658,4.360322


In [17]:
# Stratified K-fold cross-validation of the current `model` (XGBoost here).
# Per fold: impute with medians learned on the training fold only, fit,
# score the validation fold, and accumulate fold-averaged test predictions.
splits = 5
skf = StratifiedKFold(n_splits=splits, shuffle=True, random_state=42)

oof_preds = np.zeros((X.shape[0],))  # out-of-fold probability per training row
preds = 0                            # test probabilities averaged over folds
model_fi = 0                         # feature importances averaged over folds
total_mean_auc = 0                   # mean of the per-fold validation ROC AUC

for num, (train_idx, valid_idx) in enumerate(skf.split(X, y)):
    # skf.split yields positional indices, so rows are selected with .iloc
    # (.loc would only work while the index is a default RangeIndex).
    X_train, X_valid = X.iloc[train_idx], X.iloc[valid_idx]
    y_train, y_valid = y.iloc[train_idx], y.iloc[valid_idx]

    imputer = SimpleImputer(strategy='median')
    X_train = imputer.fit_transform(X_train)
    X_valid = imputer.transform(X_valid)

    model.fit(X_train, y_train,
              verbose=False,
              eval_set=[(X_train, y_train), (X_valid, y_valid)],
              eval_metric="auc",
              early_stopping_rounds=300,
              )

    # Impute the test set into a fold-local variable. Overwriting X_test here
    # would leave it NaN-free after the first fold, so every later fold (and
    # every later model cell) would silently reuse the first fold's medians.
    X_test_fold = imputer.transform(X_test)

    preds += model.predict_proba(X_test_fold)[:, 1] / splits

    model_fi += model.feature_importances_ / splits

    oof_preds[valid_idx] = model.predict_proba(X_valid)[:, 1]

    fold_auc = roc_auc_score(y_valid, oof_preds[valid_idx])
    print(f"Fold {num} ROC AUC: {fold_auc}")

    total_mean_auc += fold_auc / splits

print(f"\nOverall ROC AUC: {total_mean_auc}")


Fold 0 ROC AUC: 0.8121415899435734
Fold 1 ROC AUC: 0.8140037311039028
Fold 2 ROC AUC: 0.8127198823661544
Fold 3 ROC AUC: 0.8125704520095638
Fold 4 ROC AUC: 0.8121161474994273

Overall ROC AUC: 0.8127103605845243


In [18]:
# Keep the XGBoost mean fold ROC AUC under its own name; total_mean_auc is
# reset to 0 by the cross-validation cells of the later models.
XGBC_score = total_mean_auc
XGBC_score

0.8127103605845243

#### Submission

In [19]:
# Store the fold-averaged test probabilities in the submission frame.
# Item assignment is used rather than attribute assignment: `df.col = ...`
# only updates a column when it already exists and otherwise just sets a
# plain Python attribute without creating the column.
submission["claim"] = preds
submission.head()


Unnamed: 0,id,claim
0,957919,0.616455
1,957920,0.117593
2,957921,0.615548
3,957922,0.13975
4,957923,0.14213


In [20]:
# Write the XGBoost submission file; index=False leaves the row index out of the CSV.
submission.to_csv('submissionXGBC.csv', index=False)

### LGBMC Model

In [21]:
# Rebind `model` to a LightGBM classifier built from lgbm_params.
model = LGBMClassifier(**lgbm_params)
# Bare expression: shows the estimator's repr as the cell output.
model

LGBMClassifier(bagging_fraction=0.9497327922401265, bagging_freq=1,
               feature_fraction=0.6864594334728974, learning_rate=0.01,
               min_child_samples=63, n_estimators=1000, num_leaves=184,
               objective='binary', reg_alpha=19, reg_lambda=19)

In [22]:
# Stratified K-fold cross-validation of the current `model` (LightGBM here).
# Per fold: impute with medians learned on the training fold only, fit,
# score the validation fold, and accumulate fold-averaged test predictions.
splits = 5
skf = StratifiedKFold(n_splits=splits, shuffle=True, random_state=42)

oof_preds = np.zeros((X.shape[0],))  # out-of-fold probability per training row
preds = 0                            # test probabilities averaged over folds
model_fi = 0                         # feature importances averaged over folds
total_mean_auc = 0                   # mean of the per-fold validation ROC AUC

for num, (train_idx, valid_idx) in enumerate(skf.split(X, y)):
    # skf.split yields positional indices, so rows are selected with .iloc
    # (.loc would only work while the index is a default RangeIndex).
    X_train, X_valid = X.iloc[train_idx], X.iloc[valid_idx]
    y_train, y_valid = y.iloc[train_idx], y.iloc[valid_idx]

    imputer = SimpleImputer(strategy='median')
    X_train = imputer.fit_transform(X_train)
    X_valid = imputer.transform(X_valid)

    model.fit(X_train, y_train,
              verbose=False,
              eval_set=[(X_train, y_train), (X_valid, y_valid)],
              eval_metric="auc",
              early_stopping_rounds=300,
              )

    # Impute the test set into a fold-local variable. Overwriting X_test here
    # would leave it NaN-free after the first fold, so every later fold (and
    # every later model cell) would silently reuse the first fold's medians.
    X_test_fold = imputer.transform(X_test)

    preds += model.predict_proba(X_test_fold)[:, 1] / splits

    model_fi += model.feature_importances_ / splits

    oof_preds[valid_idx] = model.predict_proba(X_valid)[:, 1]

    fold_auc = roc_auc_score(y_valid, oof_preds[valid_idx])
    print(f"Fold {num} ROC AUC: {fold_auc}")

    total_mean_auc += fold_auc / splits

print(f"\nOverall ROC AUC: {total_mean_auc}")

Fold 0 ROC AUC: 0.8133090682871394
Fold 1 ROC AUC: 0.8145690700399486
Fold 2 ROC AUC: 0.8134982575316991
Fold 3 ROC AUC: 0.8136227397728083
Fold 4 ROC AUC: 0.8127641606316659

Overall ROC AUC: 0.8135526592526523


In [23]:
# Keep the LightGBM mean fold ROC AUC under its own name before the next
# model's cross-validation cell resets total_mean_auc.
LGB_Score = total_mean_auc

#### Submission

In [24]:
# Reload the sample submission so the LightGBM file starts from a fresh frame
# rather than the one already filled with the previous model's predictions.
submission = pd.read_csv("sample_solution.csv")

In [25]:
# Store the fold-averaged test probabilities in the submission frame.
# Item assignment is used rather than attribute assignment: `df.col = ...`
# only updates a column when it already exists and otherwise just sets a
# plain Python attribute without creating the column.
submission["claim"] = preds
submission.head()

Unnamed: 0,id,claim
0,957919,0.629321
1,957920,0.11628
2,957921,0.62424
3,957922,0.137937
4,957923,0.144077


In [26]:
# Write the LightGBM submission file; index=False leaves the row index out of the CSV.
submission.to_csv('submissionLGBMC.csv', index=False)



### CatBoostClassifier Model

In [27]:
# Rebind `model` to a CatBoost classifier built from catb_params.
model = CatBoostClassifier(**catb_params)
# Bare expression: shows the estimator's repr as the cell output.
model

<catboost.core.CatBoostClassifier at 0x21c31222a90>

In [28]:

# Stratified K-fold cross-validation of the current `model` (CatBoost here).
# Per fold: impute with medians learned on the training fold only, fit,
# score the validation fold, and accumulate fold-averaged test predictions.
# `splits` is defined locally, as in the sibling cells, so this cell does not
# depend on a value left over from an earlier model's cell.
splits = 5
skf = StratifiedKFold(n_splits=splits, shuffle=True, random_state=42)

oof_preds = np.zeros((X.shape[0],))  # out-of-fold probability per training row
preds = 0                            # test probabilities averaged over folds
model_fi = 0                         # feature importances averaged over folds
total_mean_auc = 0                   # mean of the per-fold validation ROC AUC

for num, (train_idx, valid_idx) in enumerate(skf.split(X, y)):
    # skf.split yields positional indices, so rows are selected with .iloc
    # (.loc would only work while the index is a default RangeIndex).
    X_train, X_valid = X.iloc[train_idx], X.iloc[valid_idx]
    y_train, y_valid = y.iloc[train_idx], y.iloc[valid_idx]

    imputer = SimpleImputer(strategy='median')
    X_train = imputer.fit_transform(X_train)
    X_valid = imputer.transform(X_valid)

    model.fit(X_train, y_train,
              verbose=False,
              eval_set=[(X_train, y_train), (X_valid, y_valid)],
              early_stopping_rounds=300,
              )

    # Impute the test set into a fold-local variable. Overwriting X_test here
    # would leave it NaN-free after the first fold, so every later fold would
    # silently reuse the first fold's medians.
    X_test_fold = imputer.transform(X_test)

    preds += model.predict_proba(X_test_fold)[:, 1] / splits

    model_fi += model.feature_importances_ / splits

    oof_preds[valid_idx] = model.predict_proba(X_valid)[:, 1]

    fold_auc = roc_auc_score(y_valid, oof_preds[valid_idx])
    print(f"Fold {num} ROC AUC: {fold_auc}")

    total_mean_auc += fold_auc / splits

print(f"\nOverall ROC AUC: {total_mean_auc}")

Fold 0 ROC AUC: 0.8122416733812063
Fold 1 ROC AUC: 0.8138562050579907
Fold 2 ROC AUC: 0.8125555969368421
Fold 3 ROC AUC: 0.8127739362803434
Fold 4 ROC AUC: 0.8116527092631229

Overall ROC AUC: 0.8126160241839011


In [29]:
# Keep the CatBoost mean fold ROC AUC under its own name.
CAT_Score = total_mean_auc

In [30]:
#### Submission

In [31]:
# Reload the sample submission so the CatBoost file starts from a fresh frame
# rather than the one already filled with the previous model's predictions.
submission = pd.read_csv("sample_solution.csv")

In [32]:
# Store the fold-averaged test probabilities in the submission frame.
# Item assignment is used rather than attribute assignment: `df.col = ...`
# only updates a column when it already exists and otherwise just sets a
# plain Python attribute without creating the column.
submission["claim"] = preds
submission.head()

Unnamed: 0,id,claim
0,957919,0.59737
1,957920,0.122496
2,957921,0.594329
3,957922,0.13565
4,957923,0.143358


In [33]:
# Write the CatBoost submission file; index=False leaves the row index out of the CSV.
submission.to_csv('submissionCAT.csv', index=False)