In [11]:
# Notebook setup: inline plotting backend plus the core numeric, tabular and
# plotting libraries used throughout the notebook.
%matplotlib inline
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

# Enable the autoreload extension in mode 2 so that edits to imported modules
# are picked up without restarting the kernel.
# NOTE(review): re-running this cell prints "The autoreload extension is already
# loaded"; `%reload_ext autoreload` would avoid that message.
%load_ext autoreload
%autoreload 2

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


# Load the data

In [34]:
import datetime
from helpers import *
from plots import *
from implementations import *
from preprocessing import *
from preprocessing_naive import *


# Load the dataset stored under "data/dataset" via the project helper.
# The helper returns six values, unpacked here as: feature names, training
# matrix, test matrix, training labels, training ids and test ids
# (meaning inferred from the variable names — confirm against helpers.load_csv_data).
features, x_train, x_test, y_train, train_ids, test_ids = load_csv_data("data/dataset")

# Split data into train and validation sets
def split_data(x, y, ratio, seed=1):
    """Randomly split a dataset into two disjoint parts.

    The samples are shuffled with a permutation drawn after seeding NumPy's
    global random generator with ``seed``; the first ``int(len(y) * ratio)``
    shuffled samples form the first part and the rest form the second part.

    Args:
        x: array of samples indexed along its first axis; must support NumPy
            integer-array indexing (e.g. ``numpy.ndarray``).
        y: array of labels with the same length as ``x``.
        ratio: fraction of the samples assigned to the first part, in [0, 1].
        seed: seed passed to ``np.random.seed``. Note that this reseeds the
            global NumPy generator as a side effect.

    Returns:
        Tuple ``(x_first, y_first, x_second, y_second)`` where the first part
        holds ``int(len(y) * ratio)`` samples and the second part the rest.

    Raises:
        ValueError: if ``x`` and ``y`` have different lengths, or if ``ratio``
            is not within [0, 1].
    """
    n_samples = len(y)
    if len(x) != n_samples:
        raise ValueError(
            f"x and y must have the same number of samples, got {len(x)} and {n_samples}"
        )
    # A negative ratio would turn into a negative slice index and a ratio above
    # one would silently leave the second part empty, so reject both (and NaN).
    if not 0 <= ratio <= 1:
        raise ValueError(f"ratio must be within [0, 1], got {ratio}")

    # Seed the global generator (kept for reproducibility of downstream code).
    np.random.seed(seed)
    indices = np.random.permutation(n_samples)
    split = int(n_samples * ratio)
    training_idx, test_idx = indices[:split], indices[split:]
    return x[training_idx], y[training_idx], x[test_idx], y[test_idx]

# Keep 80% of the labelled samples for training and hold out the remaining 20%
# for validation. Note that x_train / y_train are rebound to the training part.
ratio = 0.8
x_train, y_train, x_val, y_val = split_data(x=x_train, y=y_train, ratio=ratio, seed=1)

In [35]:
# Sanity check: print the shape of every array produced so far, one per line.
print(
    *(np.shape(arr) for arr in (features, x_train, y_train, x_val, y_val, x_test)),
    sep="\n",
)

(321,)
(262508, 321)
(262508,)
(65627, 321)
(65627,)
(109379, 321)


In [26]:
# Wrap the training matrix in a labelled DataFrame and preview its first five
# rows; the column limit is lifted so that every feature is displayed.
pd.set_option("display.max_columns", None)
data = pd.DataFrame(data=x_train, columns=features)

data.head(5)

Unnamed: 0,_STATE,FMONTH,IDATE,IMONTH,IDAY,IYEAR,DISPCODE,SEQNO,_PSU,CTELENUM,PVTRESD1,COLGHOUS,STATERES,CELLFON3,LADULT,NUMADULT,NUMMEN,NUMWOMEN,CTELNUM1,CELLFON2,CADULT,PVTRESD2,CCLGHOUS,CSTATE,LANDLINE,HHADULT,GENHLTH,PHYSHLTH,MENTHLTH,POORHLTH,HLTHPLN1,PERSDOC2,MEDCOST,CHECKUP1,BPHIGH4,BPMEDS,BLOODCHO,CHOLCHK,TOLDHI2,CVDSTRK3,ASTHMA3,ASTHNOW,CHCSCNCR,CHCOCNCR,CHCCOPD1,HAVARTH3,ADDEPEV2,CHCKIDNY,DIABETE3,DIABAGE2,SEX,MARITAL,EDUCA,RENTHOM1,NUMHHOL2,NUMPHON2,CPDEMO1,VETERAN3,EMPLOY1,CHILDREN,INCOME2,INTERNET,WEIGHT2,HEIGHT3,PREGNANT,QLACTLM2,USEEQUIP,BLIND,DECIDE,DIFFWALK,DIFFDRES,DIFFALON,SMOKE100,SMOKDAY2,STOPSMK2,LASTSMK2,USENOW3,ALCDAY5,AVEDRNK2,DRNK3GE5,MAXDRNKS,FRUITJU1,FRUIT1,FVBEANS,FVGREEN,FVORANG,VEGETAB1,EXERANY2,EXRACT11,EXEROFT1,EXERHMM1,EXRACT21,EXEROFT2,EXERHMM2,STRENGTH,LMTJOIN3,ARTHDIS2,ARTHSOCL,JOINPAIN,SEATBELT,FLUSHOT6,FLSHTMY2,IMFVPLAC,PNEUVAC3,HIVTST6,HIVTSTD3,WHRTST10,PDIABTST,PREDIAB1,INSULIN,BLDSUGAR,FEETCHK2,DOCTDIAB,CHKHEMO3,FEETCHK,EYEEXAM,DIABEYE,DIABEDU,CAREGIV1,CRGVREL1,CRGVLNG1,CRGVHRS1,CRGVPRB1,CRGVPERS,CRGVHOUS,CRGVMST2,CRGVEXPT,VIDFCLT2,VIREDIF3,VIPRFVS2,VINOCRE2,VIEYEXM2,VIINSUR2,VICTRCT4,VIGLUMA2,VIMACDG2,CIMEMLOS,CDHOUSE,CDASSIST,CDHELP,CDSOCIAL,CDDISCUS,WTCHSALT,LONGWTCH,DRADVISE,ASTHMAGE,ASATTACK,ASERVIST,ASDRVIST,ASRCHKUP,ASACTLIM,ASYMPTOM,ASNOSLEP,ASTHMED3,ASINHALR,HAREHAB1,STREHAB1,CVDASPRN,ASPUNSAF,RLIVPAIN,RDUCHART,RDUCSTRK,ARTTODAY,ARTHWGT,ARTHEXER,ARTHEDU,TETANUS,HPVADVC2,HPVADSHT,SHINGLE2,HADMAM,HOWLONG,HADPAP2,LASTPAP2,HPVTEST,HPLSTTST,HADHYST2,PROFEXAM,LENGEXAM,BLDSTOOL,LSTBLDS3,HADSIGM3,HADSGCO1,LASTSIG3,PCPSAAD2,PCPSADI1,PCPSARE1,PSATEST1,PSATIME,PCPSARS1,PCPSADE1,PCDMDECN,SCNTMNY1,SCNTMEL1,SCNTPAID,SCNTWRK1,SCNTLPAD,SCNTLWK1,SXORIENT,TRNSGNDR,RCSGENDR,RCSRLTN2,CASTHDX2,CASTHNO2,EMTSUPRT,LSATISFY,ADPLEASR,ADDOWN,ADSLEEP,ADENERGY,ADEAT1,ADFAIL,ADTHINK,ADMOVE,MISTMNT,ADANXEV,QSTVER,QSTLANG,MSCODE,_STSTR,_STRWT,_RAWRAKE,_WT2RAKE,_CHISPNC,_CRACE1,_CPRACE,_CLLCPWT,_DUALUSE,_DUALCOR,_LLCPWT,_RFHLTH,_HCVU651,_RFHYPE5,_C
HOLCHK,_RFCHOL,_LTASTH1,_CASTHM1,_ASTHMS1,_DRDXAR1,_PRACE1,_MRACE1,_HISPANC,_RACE,_RACEG21,_RACEGR3,_RACE_G1,_AGEG5YR,_AGE65YR,_AGE80,_AGE_G,HTIN4,HTM4,WTKG3,_BMI5,_BMI5CAT,_RFBMI5,_CHLDCNT,_EDUCAG,_INCOMG,_SMOKER3,_RFSMOK3,DRNKANY5,DROCDY3_,_RFBING5,_DRNKWEK,_RFDRHV5,FTJUDA1_,FRUTDA1_,BEANDAY_,GRENDAY_,ORNGDAY_,VEGEDA1_,_MISFRTN,_MISVEGN,_FRTRESP,_VEGRESP,_FRUTSUM,_VEGESUM,_FRTLT1,_VEGLT1,_FRT16,_VEG23,_FRUITEX,_VEGETEX,_TOTINDA,METVL11_,METVL21_,MAXVO2_,FC60_,ACTIN11_,ACTIN21_,PADUR1_,PADUR2_,PAFREQ1_,PAFREQ2_,_MINAC11,_MINAC21,STRFREQ_,PAMISS1_,PAMIN11_,PAMIN21_,PA1MIN_,PAVIG11_,PAVIG21_,PA1VIGM_,_PACAT1,_PAINDX1,_PA150R2,_PA300R2,_PA30021,_PASTRNG,_PAREC1,_PASTAE1,_LMTACT1,_LMTWRK1,_LMTSCL1,_RFSEAT2,_RFSEAT3,_FLSHOT6,_PNEUMO2,_AIDTST3
0,35.0,10.0,10072015.0,10.0,7.0,2015.0,1100.0,2015004000.0,2015004000.0,1.0,1.0,,1.0,2.0,,2.0,1.0,1.0,,,,,,,,,5.0,30.0,88.0,30.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,7.0,2.0,,2.0,2.0,2.0,1.0,2.0,2.0,4.0,,2.0,1.0,6.0,1.0,2.0,,1.0,2.0,7.0,88.0,99.0,1.0,180.0,502.0,,1.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,,,,3.0,888.0,,,,203.0,203.0,203.0,555.0,203.0,201.0,2.0,,,,,,,888.0,1.0,2.0,1.0,10.0,1.0,2.0,,,1.0,2.0,,,2.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10.0,1.0,5.0,351051.0,17.109993,2.0,34.219987,9.0,,,,1.0,0.726059,76.345588,2.0,9.0,2.0,1.0,2.0,1.0,1.0,3.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,12.0,2.0,78.0,6.0,62.0,1.57,81.65,32.92,4.0,2.0,1.0,4.0,9.0,4.0,1.0,2.0,0.0,1.0,0.0,1.0,0.43,0.43,0.43,0.0,0.43,0.14,0.0,0.0,1.0,1.0,0.86,1.0,2.0,1.0,1.0,1.0,0.0,0.0,2.0,,,19.14,3.28,,,,,,,,,0.0,0.0,,,,,,,4.0,2.0,3.0,3.0,2.0,2.0,4.0,2.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,2.0
1,35.0,7.0,7132015.0,7.0,13.0,2015.0,1100.0,2015002000.0,2015002000.0,1.0,1.0,,1.0,2.0,,2.0,0.0,2.0,,,,,,,,,4.0,88.0,88.0,,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,,2.0,2.0,2.0,1.0,2.0,2.0,3.0,,2.0,2.0,5.0,1.0,2.0,,2.0,2.0,7.0,88.0,4.0,1.0,9999.0,505.0,,2.0,2.0,1.0,2.0,1.0,2.0,2.0,1.0,3.0,,7.0,3.0,215.0,2.0,88.0,2.0,555.0,101.0,310.0,101.0,101.0,101.0,1.0,64.0,107.0,100.0,6.0,105.0,20.0,888.0,1.0,2.0,3.0,4.0,1.0,2.0,,,1.0,7.0,,,1.0,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10.0,1.0,5.0,351021.0,20.595798,2.0,41.191595,9.0,,,,9.0,,304.318707,2.0,9.0,2.0,1.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,12.0,2.0,77.0,6.0,65.0,1.65,,,,9.0,1.0,3.0,2.0,3.0,1.0,1.0,50.0,1.0,700.0,1.0,0.0,1.0,0.33,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,3.33,1.0,1.0,1.0,1.0,0.0,0.0,1.0,3.5,6.8,19.51,3.34,2.0,2.0,60.0,20.0,7.0,5.0,420.0,100.0,0.0,0.0,840.0,200.0,1040.0,420.0,100.0,520.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,2.0,3.0,1.0,1.0,2.0,1.0,9.0
2,30.0,4.0,4062015.0,4.0,6.0,2015.0,1100.0,2015002000.0,2015002000.0,1.0,1.0,,1.0,2.0,,2.0,1.0,1.0,,,,,,,,,4.0,88.0,88.0,,1.0,1.0,2.0,1.0,3.0,,2.0,,,2.0,2.0,,1.0,2.0,2.0,1.0,1.0,2.0,3.0,,1.0,1.0,4.0,1.0,2.0,,1.0,2.0,7.0,88.0,6.0,2.0,246.0,600.0,,1.0,2.0,1.0,2.0,1.0,2.0,2.0,1.0,3.0,,5.0,3.0,888.0,,,,202.0,206.0,201.0,206.0,202.0,205.0,1.0,64.0,102.0,20.0,76.0,107.0,300.0,888.0,2.0,2.0,3.0,7.0,1.0,1.0,102014.0,1.0,2.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,2.0,2.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10.0,1.0,5.0,301041.0,8.511576,2.0,17.023151,9.0,,,,1.0,0.710896,47.651656,2.0,9.0,1.0,3.0,,1.0,1.0,3.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,11.0,2.0,71.0,6.0,72.0,1.83,111.58,33.36,4.0,2.0,1.0,2.0,4.0,3.0,1.0,2.0,0.0,1.0,0.0,1.0,0.29,0.86,0.14,0.86,0.29,0.71,0.0,0.0,1.0,1.0,1.15,2.0,1.0,1.0,1.0,1.0,0.0,0.0,1.0,3.5,4.0,20.95,3.59,1.0,2.0,20.0,180.0,2.0,7.0,40.0,1260.0,0.0,0.0,40.0,2520.0,2560.0,0.0,1260.0,1260.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,3.0,1.0,1.0,1.0,2.0,2.0
3,20.0,10.0,11172015.0,11.0,17.0,2015.0,1200.0,2015022000.0,2015022000.0,,,,,,,,,,1.0,1.0,1.0,1.0,,1.0,2.0,3.0,4.0,88.0,88.0,,2.0,1.0,2.0,1.0,3.0,,7.0,,,2.0,2.0,,2.0,2.0,2.0,2.0,2.0,2.0,3.0,,1.0,6.0,5.0,1.0,,,,2.0,1.0,4.0,5.0,1.0,230.0,506.0,,2.0,2.0,2.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,22.0,2.0,,202049.0,23.883669,1.0,23.883669,9.0,,,,9.0,,266.893621,2.0,2.0,1.0,9.0,,1.0,1.0,3.0,2.0,77.0,77.0,1.0,8.0,2.0,5.0,3.0,3.0,1.0,32.0,2.0,66.0,1.68,104.33,37.12,4.0,2.0,5.0,3.0,3.0,9.0,9.0,9.0,900.0,9.0,99900.0,9.0,,,,,,,2.0,4.0,0.0,0.0,,,9.0,9.0,1.0,1.0,1.0,1.0,9.0,,,42.4,7.27,,,,,,,,,,9.0,,,,,,,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,3.0,3.0,4.0,9.0,9.0,,,
4,2.0,9.0,10012015.0,10.0,1.0,2015.0,1200.0,2015002000.0,2015002000.0,1.0,1.0,,1.0,2.0,,2.0,1.0,1.0,,,,,,,,,4.0,15.0,88.0,30.0,1.0,3.0,1.0,3.0,3.0,,2.0,,,2.0,2.0,,2.0,2.0,2.0,2.0,2.0,2.0,3.0,,1.0,1.0,9.0,9.0,2.0,,2.0,2.0,3.0,5.0,1.0,2.0,129.0,505.0,,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,,3.0,888.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10.0,1.0,5.0,21051.0,0.945246,2.0,1.890492,,,,,9.0,,21.773786,2.0,1.0,1.0,3.0,,1.0,1.0,3.0,2.0,3.0,3.0,2.0,3.0,2.0,3.0,4.0,7.0,1.0,50.0,4.0,65.0,1.65,58.51,21.47,2.0,1.0,6.0,9.0,1.0,2.0,2.0,2.0,0.0,1.0,0.0,1.0,,,,,,,2.0,4.0,0.0,0.0,,,9.0,9.0,1.0,1.0,1.0,1.0,9.0,,,32.5,5.57,,,,,,,,,,9.0,,,,,,,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,3.0,3.0,4.0,9.0,9.0,,,


In [20]:
# Per-column summary statistics (count, mean, std, min, quartiles, max) of the
# frame currently bound to `data`; the count row exposes columns with missing values.
data.describe()

Unnamed: 0,_STATE,FMONTH,IDATE,IMONTH,IDAY,IYEAR,DISPCODE,SEQNO,_PSU,CTELENUM,PVTRESD1,COLGHOUS,STATERES,CELLFON3,LADULT,NUMADULT,NUMMEN,NUMWOMEN,CTELNUM1,CELLFON2,CADULT,PVTRESD2,CCLGHOUS,CSTATE,LANDLINE,HHADULT,GENHLTH,PHYSHLTH,MENTHLTH,POORHLTH,HLTHPLN1,PERSDOC2,MEDCOST,CHECKUP1,BPHIGH4,BPMEDS,BLOODCHO,CHOLCHK,TOLDHI2,CVDSTRK3,ASTHMA3,ASTHNOW,CHCSCNCR,CHCOCNCR,CHCCOPD1,HAVARTH3,ADDEPEV2,CHCKIDNY,DIABETE3,DIABAGE2,SEX,MARITAL,EDUCA,RENTHOM1,NUMHHOL2,NUMPHON2,CPDEMO1,VETERAN3,EMPLOY1,CHILDREN,INCOME2,INTERNET,WEIGHT2,HEIGHT3,PREGNANT,QLACTLM2,USEEQUIP,BLIND,DECIDE,DIFFWALK,DIFFDRES,DIFFALON,SMOKE100,SMOKDAY2,STOPSMK2,LASTSMK2,USENOW3,ALCDAY5,AVEDRNK2,DRNK3GE5,MAXDRNKS,FRUITJU1,FRUIT1,FVBEANS,FVGREEN,FVORANG,VEGETAB1,EXERANY2,EXRACT11,EXEROFT1,EXERHMM1,EXRACT21,EXEROFT2,EXERHMM2,STRENGTH,LMTJOIN3,ARTHDIS2,ARTHSOCL,JOINPAIN,SEATBELT,FLUSHOT6,FLSHTMY2,IMFVPLAC,PNEUVAC3,HIVTST6,HIVTSTD3,WHRTST10,PDIABTST,PREDIAB1,INSULIN,BLDSUGAR,FEETCHK2,DOCTDIAB,CHKHEMO3,FEETCHK,EYEEXAM,DIABEYE,DIABEDU,CAREGIV1,CRGVREL1,CRGVLNG1,CRGVHRS1,CRGVPRB1,CRGVPERS,CRGVHOUS,CRGVMST2,CRGVEXPT,VIDFCLT2,VIREDIF3,VIPRFVS2,VINOCRE2,VIEYEXM2,VIINSUR2,VICTRCT4,VIGLUMA2,VIMACDG2,CIMEMLOS,CDHOUSE,CDASSIST,CDHELP,CDSOCIAL,CDDISCUS,WTCHSALT,LONGWTCH,DRADVISE,ASTHMAGE,ASATTACK,ASERVIST,ASDRVIST,ASRCHKUP,ASACTLIM,ASYMPTOM,ASNOSLEP,ASTHMED3,ASINHALR,HAREHAB1,STREHAB1,CVDASPRN,ASPUNSAF,RLIVPAIN,RDUCHART,RDUCSTRK,ARTTODAY,ARTHWGT,ARTHEXER,ARTHEDU,TETANUS,HPVADVC2,HPVADSHT,SHINGLE2,HADMAM,HOWLONG,HADPAP2,LASTPAP2,HPVTEST,HPLSTTST,HADHYST2,PROFEXAM,LENGEXAM,BLDSTOOL,LSTBLDS3,HADSIGM3,HADSGCO1,LASTSIG3,PCPSAAD2,PCPSADI1,PCPSARE1,PSATEST1,PSATIME,PCPSARS1,PCPSADE1,PCDMDECN,SCNTMNY1,SCNTMEL1,SCNTPAID,SCNTWRK1,SCNTLPAD,SCNTLWK1,SXORIENT,TRNSGNDR,RCSGENDR,RCSRLTN2,CASTHDX2,CASTHNO2,EMTSUPRT,LSATISFY,ADPLEASR,ADDOWN,ADSLEEP,ADENERGY,ADEAT1,ADFAIL,ADTHINK,ADMOVE,MISTMNT,ADANXEV,QSTVER,QSTLANG,MSCODE,_STSTR,_STRWT,_RAWRAKE,_WT2RAKE,_CHISPNC,_CRACE1,_CPRACE,_CLLCPWT,_DUALUSE,_DUALCOR,_LLCPWT,_RFHLTH,_HCVU651,_RFHYPE5,_C
HOLCHK,_RFCHOL,_LTASTH1,_CASTHM1,_ASTHMS1,_DRDXAR1,_PRACE1,_MRACE1,_HISPANC,_RACE,_RACEG21,_RACEGR3,_RACE_G1,_AGEG5YR,_AGE65YR,_AGE80,_AGE_G,HTIN4,HTM4,WTKG3,_BMI5,_BMI5CAT,_RFBMI5,_CHLDCNT,_EDUCAG,_INCOMG,_SMOKER3,_RFSMOK3,DRNKANY5,DROCDY3_,_RFBING5,_DRNKWEK,_RFDRHV5,FTJUDA1_,FRUTDA1_,BEANDAY_,GRENDAY_,ORNGDAY_,VEGEDA1_,_MISFRTN,_MISVEGN,_FRTRESP,_VEGRESP,_FRUTSUM,_VEGESUM,_FRTLT1,_VEGLT1,_FRT16,_VEG23,_FRUITEX,_VEGETEX,_TOTINDA,METVL11_,METVL21_,MAXVO2_,FC60_,ACTIN11_,ACTIN21_,PADUR1_,PADUR2_,PAFREQ1_,PAFREQ2_,_MINAC11,_MINAC21,STRFREQ_,PAMISS1_,PAMIN11_,PAMIN21_,PA1MIN_,PAVIG11_,PAVIG21_,PA1VIGM_,_PACAT1,_PAINDX1,_PA150R2,_PA300R2,_PA30021,_PASTRNG,_PAREC1,_PASTAE1,_LMTACT1,_LMTWRK1,_LMTSCL1,_RFSEAT2,_RFSEAT3,_FLSHOT6,_PNEUMO2,_AIDTST3
count,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,151064.0,151064.0,25.0,151063.0,151064.0,25.0,151049.0,150973.0,150972.0,111444.0,111444.0,111443.0,111444.0,629.0,111444.0,110970.0,108376.0,262506.0,262507.0,262508.0,134767.0,262508.0,262508.0,262507.0,262507.0,262507.0,105441.0,262508.0,227414.0,227414.0,262508.0,262508.0,35224.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262503.0,33724.0,262508.0,262508.0,262508.0,262508.0,151064.0,7911.0,151064.0,262507.0,262508.0,262506.0,260543.0,259951.0,259366.0,259003.0,38922.0,256985.0,256338.0,255911.0,255566.0,255228.0,254998.0,254660.0,254118.0,109558.0,36628.0,72645.0,253764.0,253167.0,125866.0,125615.0,125364.0,245968.0,245317.0,244572.0,244014.0,243523.0,242930.0,241574.0,176210.0,175181.0,174986.0,174765.0,117692.0,117582.0,239663.0,81137.0,81026.0,80907.0,79396.0,238656.0,238112.0,113062.0,113661.0,237771.0,236925.0,67967.0,67854.0,49289.0,49289.0,17346.0,17345.0,17344.0,17344.0,17343.0,17189.0,17343.0,17342.0,17342.0,64613.0,14253.0,14237.0,14221.0,14207.0,14189.0,14179.0,14143.0,50191.0,1914.0,1907.0,1907.0,635.0,1501.0,1902.0,1900.0,1900.0,1898.0,69469.0,7756.0,7746.0,2473.0,7737.0,7730.0,24536.0,15123.0,24516.0,617.0,377.0,173.0,173.0,375.0,375.0,374.0,264.0,373.0,373.0,619.0,418.0,11217.0,7888.0,3327.0,3328.0,3327.0,11742.0,11734.0,11731.0,11724.0,24043.0,6470.0,898.0,16597.0,13730.0,11156.0,13726.0,12805.0,13718.0,4170.0,13581.0,3396.0,2996.0,32168.0,11778.0,32146.0,23281.0,23279.0,3905.0,3900.0,3895.0,3895.0,2118.0,2116.0,482.0,145.0,41424.0,43745.0,20805.0,20796.0,15277.0,22839.0,99343.0,99287.0,35549.0,35427.0,31204.0,3852.0,12117.0,12110.0,12236.0,12229.0,12223.0,12220.0,12212.0,12208.0,12198.0,12190.0,12181.0,12174.0,262508.0,262498.0,148601.0,262508.0,262489.0,262508.0,262508.0,190067.0,38792.0,38792.0,35549.0,262508.0,164080.0,262508.0,262508.0,262508.0,262508.0,262508.0,227414.0,262508.0,262508.0,262508.0,261018.0,262508.0,262508.0,262508.0,262508.0,262
508.0,262508.0,258157.0,262508.0,262508.0,262508.0,262508.0,252366.0,253446.0,244095.0,240834.0,240834.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,239866.0,241034.0,239076.0,240240.0,239379.0,238059.0,262508.0,262508.0,262508.0,262508.0,236881.0,232494.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,175517.0,172575.0,262508.0,262508.0,173629.0,170739.0,171449.0,114981.0,173474.0,116374.0,170343.0,169076.0,236592.0,262508.0,168572.0,167310.0,172199.0,171458.0,168910.0,173040.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,261018.0,261018.0,261018.0,262508.0,262508.0,93447.0,93447.0,236925.0
mean,29.992156,6.362587,6563340.0,6.416326,14.499886,2015.024967,1115.01059,2015005000.0,2015005000.0,1.0,1.000165,1.0,1.0,1.544822,1.68,1.794073,0.801249,0.992403,1.0,1.0,1.506366,1.005653,1.0,1.067469,1.63355,2.429689,2.573366,60.671247,64.712134,55.724814,1.099418,1.393367,1.916014,1.574655,2.212135,1.173282,1.240431,1.448979,1.628888,1.971045,1.880857,1.481745,1.918505,1.91193,1.943057,1.694695,1.835011,1.980004,2.75886,54.477672,1.5782,2.261264,4.923294,1.373417,1.972369,1.72001,1.225944,1.881881,3.934692,65.898265,20.132155,1.231182,735.729861,738.511106,2.008247,1.79305,1.898981,1.97301,1.940023,1.85712,1.972666,1.947887,1.613333,2.437312,1.453997,6.768174,2.976561,534.841208,3.456239,67.86133,5.576082,367.632359,212.755243,314.150847,259.104601,301.667358,227.072214,1.309499,52.46957,142.889531,107.322529,62.62421,146.915296,124.402128,602.388783,1.57785,1.861649,2.439875,6.16327,1.278522,1.570572,136488.492898,4.121801,2.068658,1.909212,390118.404226,4.571433,1.622837,2.796709,1.675487,252.579475,268.348881,14.529001,14.650291,24.133457,2.404659,1.882655,1.463441,1.807887,7.533572,3.360258,2.199142,12.76955,1.536613,1.259398,5.50555,2.21217,1.365204,1.713686,2.389617,5.938583,2.817455,1.582019,2.432105,1.959474,1.991043,1.941801,3.978984,4.074232,2.186009,3.997544,1.607374,1.414126,425.923031,1.726831,63.633712,1.594164,62.50289,56.710983,37.261333,680.536,4.259358,5.25,4.453083,5.048257,1.725363,1.657895,1.711064,2.851166,1.811241,1.3122,1.697926,2.23846,1.683058,1.500043,1.897049,3.421536,2.345904,14.68931,1.797313,1.206191,1.846988,1.104255,2.599844,3.138067,2.555396,1.749356,1.137515,1.846128,1.678096,3.260401,1.302339,2.061724,3.257142,1.633803,1.961282,1.679846,1.679846,1.90085,1.677221,2.329876,1.827586,4.120944,4.330735,1.902716,43.753991,1.867448,47.433732,1.253757,4.050853,1.848013,1.709487,2.190296,1.465472,1.832632,1.676053,63.437643,67.011775,51.365213,39.507201,59.859073,74.227392,76.171995,78.991222,1.879156,1.872022,14.882167,1.037036,2.5414
84,301402.956923,104.269853,1.440333,121.585816,7.610753,7.266189,7.266189,804.030444,4.159195,0.619909,569.7162,1.205655,3.937507,1.423945,1.530449,1.488976,1.157892,1.146578,2.822044,1.663843,3.112458,3.195945,1.983025,2.013721,1.353216,1.675648,1.452403,7.791237,1.368038,55.347601,4.439392,66.716927,1.694414,80.87583,28.029993,2.93591,2.264045,1.566554,2.958573,4.675271,3.545949,1.461929,1.844287,58.939747,1.571716,5988.838458,1.509786,0.355684,1.004568,0.280899,0.568871,0.297309,0.804428,0.168056,0.355334,0.902376,0.885664,1.360983,1.952762,2.121067,2.097266,0.999794,0.999867,0.098035,0.114602,1.925408,4.170684,2.889406,40.035164,16.846285,1.279619,0.874621,63.471196,71.934824,4.02446,3.128486,229.772882,131.064699,1.200492,0.816105,313.418255,182.879935,484.504463,82.115282,51.157078,131.300647,3.25016,2.373794,2.627074,2.835331,2.582051,2.441907,3.487101,2.735806,2.715096,2.812296,3.650181,1.818059,1.879924,2.28415,2.402089,1.966994
std,16.034203,3.487616,3489557.0,3.493035,8.34036,0.156024,35.717588,4119.885,4119.885,0.0,0.012863,0.0,0.0,0.497989,0.476095,0.799739,0.62026,0.525346,0.0,0.0,0.499962,0.074974,0.0,0.250833,0.557689,5.169173,1.11537,37.060859,35.832562,38.091392,0.50049,0.828634,0.407138,1.247056,1.032835,0.449445,0.909971,1.034314,0.727832,0.315614,0.443545,1.087207,0.390138,0.382682,0.441484,0.624264,0.544734,0.33617,0.713534,18.227792,0.493848,1.686386,1.072772,0.816543,0.464936,1.194849,0.668328,0.449691,2.871733,37.713332,31.73796,0.571769,2202.25871,1369.391304,0.569615,0.663207,0.452183,0.428456,0.556444,0.569867,0.385369,0.482977,0.743292,0.885656,0.609252,6.4154,0.489413,355.856532,10.460801,35.827391,13.892794,192.209818,141.596279,149.657916,138.448086,143.868637,133.182897,0.718052,23.5876,84.6707,149.478309,28.880006,88.305723,166.83723,365.387258,0.835431,1.140795,0.934896,11.202142,0.953226,0.780284,163070.07157,5.271476,1.666288,1.168047,355738.058695,10.846785,1.284865,0.668479,0.523549,271.302019,282.576131,28.020788,28.893375,36.468501,1.454339,0.691509,0.624099,0.594037,8.55321,1.536601,1.715693,17.516999,0.726586,0.656356,1.347103,1.407842,0.854777,1.055061,1.075706,10.259612,1.32765,1.049713,0.840096,0.443714,0.556198,0.597201,1.362365,1.260735,1.261266,1.401033,0.744965,0.671437,121.775551,0.631668,33.441537,0.748948,39.5709,41.509844,42.115908,363.418607,2.798814,2.881368,2.864516,3.132869,0.9962,0.657148,0.503249,0.676853,0.518874,1.035096,1.557228,0.997839,0.699094,0.828044,0.521052,1.601159,1.571104,27.744943,0.801607,0.545362,1.359127,0.584924,1.719824,2.500601,1.8432,0.629234,0.505283,1.377625,0.70557,1.770868,0.621504,0.738552,1.660982,1.258408,1.237314,1.227966,1.272337,1.511596,1.330234,1.139491,2.585603,1.386946,1.172438,1.081764,16.562044,1.241008,22.806008,1.238984,0.547911,1.679155,1.783994,1.476086,0.978662,1.278701,0.913564,37.494419,35.902667,40.085996,39.836026,38.736606,30.576215,28.640436,25.356835,0.538358,0.575993,5.027423,0.188932,1.7233
15,160347.968296,160.006173,0.702646,167.065042,2.838454,22.250035,22.250035,1346.641076,3.765112,0.20163,992.68448,0.558806,3.794923,0.632581,1.548422,0.86475,0.546747,0.721085,0.789163,0.472394,12.546424,12.554625,0.724159,2.265455,1.075474,1.520396,0.951952,3.494344,0.506664,17.036105,1.553353,4.131547,0.105662,21.654184,6.681245,0.826485,2.071207,1.201628,1.044479,2.407465,1.460241,1.582491,1.630972,191.651088,1.855952,23203.108257,1.862416,0.66908,1.130174,0.496596,0.701184,0.502647,0.842992,0.529791,1.080636,0.296806,0.318219,1.4002,1.657691,2.308944,2.509201,0.014341,0.011546,0.298054,0.31896,2.201525,1.632639,2.646405,106.269566,108.526417,0.549864,0.814786,65.227147,77.595043,2.879916,3.171242,374.131847,374.567596,2.254306,2.508549,532.796114,487.870741,757.001859,234.807556,186.461465,314.778894,2.463857,2.489832,2.489788,2.452412,2.473872,2.211653,2.394127,2.443391,1.314827,1.345389,1.257103,2.35201,2.342812,2.510628,2.767797,1.436966
min,1.0,1.0,1012016.0,1.0,1.0,2015.0,1100.0,2015000000.0,2015000000.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,50.0,205.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,101.0,1.0,1.0,1.0,101.0,101.0,101.0,101.0,101.0,101.0,1.0,1.0,101.0,1.0,1.0,101.0,1.0,101.0,1.0,1.0,1.0,0.0,1.0,1.0,12014.0,1.0,1.0,1.0,11985.0,1.0,1.0,1.0,1.0,101.0,101.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,101.0,1.0,11.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,10.0,1.0,1.0,11011.0,0.945246,0.333333,0.362773,1.0,1.0,1.0,7.81393,1.0,0.079438,1.433505,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,18.0,1.0,36.0,0.91,22.68,12.05,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,5.55,0.95,0.0,0.0,1.0,1.0,0.233,0.233,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0
25%,19.0,3.0,3232015.0,3.0,7.0,2015.0,1100.0,2015002000.0,2015002000.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,15.0,29.0,10.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,44.0,1.0,1.0,4.0,1.0,2.0,1.0,1.0,2.0,1.0,4.0,5.0,1.0,149.0,504.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,1.0,6.0,3.0,202.0,1.0,77.0,1.0,202.0,102.0,202.0,201.0,202.0,102.0,1.0,37.0,103.0,30.0,47.0,102.0,30.0,107.0,1.0,1.0,2.0,3.0,1.0,1.0,102014.0,1.0,1.0,1.0,62008.0,1.0,1.0,3.0,1.0,101.0,101.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,5.0,1.0,1.0,6.0,2.0,1.0,1.0,2.0,4.0,2.0,1.0,2.0,2.0,2.0,2.0,3.0,3.0,1.0,3.0,1.0,1.0,402.0,1.0,30.0,1.0,3.0,3.0,2.0,777.0,2.0,2.0,2.0,1.0,1.0,1.0,1.0,3.0,2.0,1.0,1.0,2.0,1.0,1.0,2.0,3.0,2.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,3.0,4.0,1.0,38.0,1.0,40.0,1.0,4.0,1.0,1.0,2.0,1.0,1.0,1.0,14.0,14.0,7.0,4.0,10.0,88.0,88.0,88.0,2.0,2.0,10.0,1.0,1.0,191021.0,17.829576,1.0,25.385745,9.0,1.0,1.0,135.388317,1.0,0.464705,92.270773,1.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,5.0,1.0,43.0,3.0,64.0,1.63,65.77,23.73,2.0,1.0,1.0,2.0,3.0,3.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.33,0.07,0.14,0.07,0.33,0.0,0.0,1.0,1.0,0.57,1.1,1.0,1.0,1.0,1.0,0.0,0.0,1.0,3.5,0.0,22.47,3.85,1.0,0.0,30.0,30.0,2.0,1.0,70.0,0.0,0.0,0.0,90.0,0.0,120.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,3.0,1.0,1.0,1.0,1.0,1.0
50%,29.0,6.0,6242015.0,6.0,14.0,2015.0,1100.0,2015004000.0,2015004000.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,88.0,88.0,88.0,1.0,1.0,2.0,1.0,3.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,54.0,2.0,1.0,5.0,1.0,2.0,1.0,1.0,2.0,3.0,88.0,7.0,1.0,175.0,507.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,1.0,7.0,3.0,777.0,2.0,88.0,2.0,308.0,202.0,302.0,205.0,302.0,203.0,1.0,64.0,105.0,45.0,67.0,105.0,45.0,888.0,2.0,2.0,3.0,5.0,1.0,2.0,102014.0,4.0,2.0,2.0,112014.0,3.0,1.0,3.0,2.0,103.0,101.0,4.0,3.0,3.0,2.0,2.0,1.0,2.0,6.0,4.0,1.0,11.0,1.0,1.0,6.0,2.0,1.0,1.0,2.0,5.0,2.0,1.0,3.0,2.0,2.0,2.0,4.0,5.0,2.0,5.0,2.0,1.0,407.0,2.0,63.0,2.0,88.0,88.0,4.0,888.0,3.0,5.0,3.0,7.0,2.0,2.0,2.0,3.0,2.0,1.0,1.0,2.0,2.0,1.0,2.0,4.0,2.0,3.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,1.0,1.0,2.0,3.0,1.0,2.0,3.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,5.0,5.0,2.0,40.0,2.0,40.0,1.0,4.0,2.0,1.0,2.0,1.0,1.0,2.0,88.0,88.0,88.0,14.0,88.0,88.0,88.0,88.0,2.0,2.0,12.0,1.0,2.0,292039.0,44.823976,1.0,61.625519,9.0,1.0,1.0,328.164379,2.0,0.669767,232.37252,1.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,2.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,8.0,1.0,58.0,5.0,66.0,1.68,77.11,26.91,3.0,2.0,1.0,3.0,5.0,4.0,1.0,2.0,3.0,1.0,23.0,1.0,0.07,1.0,0.14,0.43,0.17,0.71,0.0,0.0,1.0,1.0,1.0,1.7,1.0,1.0,1.0,1.0,0.0,0.0,1.0,3.5,3.5,27.28,4.68,1.0,1.0,45.0,45.0,3.5,2.333,140.0,35.0,0.0,0.0,180.0,47.0,271.0,0.0,0.0,0.0,3.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,3.0,3.0,4.0,1.0,1.0,1.0,1.0,2.0
75%,44.0,9.0,10022020.0,10.0,21.0,2015.0,1100.0,2015007000.0,2015007000.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,3.0,88.0,88.0,88.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,64.0,2.0,3.0,6.0,2.0,2.0,2.0,1.0,2.0,7.0,88.0,8.0,1.0,210.0,510.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,7.0,3.0,888.0,2.0,88.0,4.0,555.0,305.0,313.0,310.0,310.0,310.0,2.0,64.0,204.0,100.0,88.0,204.0,130.0,888.0,2.0,2.0,3.0,7.0,1.0,2.0,112014.0,5.0,2.0,2.0,772013.0,4.0,2.0,3.0,2.0,204.0,207.0,5.0,4.0,76.0,3.0,2.0,2.0,2.0,12.0,5.0,3.0,13.0,2.0,1.0,6.0,2.0,1.0,2.0,3.0,7.0,4.0,2.0,3.0,2.0,2.0,2.0,5.0,5.0,3.0,5.0,2.0,2.0,420.0,2.0,97.0,2.0,88.0,88.0,88.0,888.0,8.0,8.0,8.0,8.0,2.0,2.0,2.0,3.0,2.0,1.0,2.0,3.0,2.0,2.0,2.0,4.0,2.0,3.0,2.0,1.0,2.0,1.0,4.0,7.0,4.0,2.0,1.0,2.0,2.0,5.0,2.0,2.0,5.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,1.0,5.0,5.0,2.0,50.0,2.0,50.0,1.0,4.0,2.0,1.0,2.0,2.0,2.0,2.0,88.0,88.0,88.0,88.0,88.0,88.0,88.0,88.0,2.0,2.0,20.0,1.0,5.0,441031.0,97.314988,2.0,136.543634,9.0,2.0,2.0,910.109662,9.0,0.766052,621.963797,1.0,9.0,2.0,1.0,2.0,1.0,1.0,3.0,2.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,10.0,2.0,69.0,6.0,70.0,1.78,90.72,30.9,4.0,2.0,2.0,4.0,5.0,4.0,1.0,2.0,27.0,1.0,350.0,1.0,0.5,1.0,0.33,0.83,0.43,1.0,0.0,0.0,1.0,1.0,2.0,2.43,2.0,2.0,1.0,1.0,0.0,0.0,2.0,5.0,5.0,34.15,5.85,2.0,2.0,60.0,90.0,5.833,4.0,252.0,120.0,2.0,0.0,360.0,180.0,546.0,84.0,19.0,140.0,4.0,2.0,3.0,3.0,2.0,2.0,4.0,2.0,3.0,3.0,4.0,1.0,1.0,2.0,2.0,2.0
max,72.0,12.0,12312020.0,12.0,31.0,2016.0,1200.0,2015023000.0,2015023000.0,1.0,2.0,1.0,1.0,2.0,2.0,20.0,18.0,10.0,1.0,1.0,2.0,2.0,1.0,2.0,9.0,99.0,9.0,99.0,99.0,99.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,99.0,2.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,99.0,99.0,9.0,9999.0,9999.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,99.0,9.0,999.0,99.0,99.0,99.0,999.0,999.0,999.0,999.0,999.0,999.0,9.0,99.0,999.0,999.0,99.0,999.0,999.0,999.0,9.0,9.0,9.0,99.0,9.0,9.0,999999.0,99.0,9.0,9.0,999999.0,99.0,9.0,9.0,9.0,999.0,999.0,99.0,99.0,99.0,9.0,9.0,9.0,9.0,99.0,9.0,9.0,99.0,9.0,9.0,9.0,9.0,8.0,7.0,9.0,99.0,9.0,8.0,7.0,7.0,7.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,999.0,9.0,99.0,7.0,98.0,98.0,99.0,999.0,9.0,8.0,9.0,8.0,9.0,9.0,9.0,9.0,9.0,7.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,99.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,21.0,9.0,9.0,9.0,99.0,9.0,99.0,9.0,9.0,9.0,9.0,9.0,7.0,9.0,9.0,99.0,99.0,99.0,99.0,99.0,99.0,99.0,99.0,9.0,9.0,23.0,3.0,5.0,722019.0,1603.286561,5.0,2553.557492,9.0,99.0,99.0,25653.294435,9.0,0.920562,33134.939618,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,2.0,99.0,99.0,9.0,9.0,9.0,9.0,5.0,14.0,3.0,80.0,6.0,95.0,2.41,289.85,97.65,4.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,900.0,9.0,99900.0,9.0,99.0,99.0,99.0,99.0,99.0,99.0,2.0,4.0,1.0,1.0,150.0,199.29,9.0,9.0,1.0,1.0,2.0,2.0,9.0,12.8,12.8,999.0,999.0,2.0,2.0,599.0,599.0,99.0,99.0,53460.0,47520.0,99.0,9.0,53460.0,47520.0,54000.0,14250.0,12600.0,14250.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0


# Preprocess the data

In [61]:
# Run the naive preprocessing pipeline on the training features. It also returns
# `mean` and `std` (presumably the per-feature statistics used for the
# standardization — confirm in preprocessing_naive).
new_x_train, mean, std = preprocessing_dataset_naive(x_train)

# Show NumPy floats with three decimals and without scientific notation.
np.set_printoptions(precision=3, suppress=True)

# No column names are given, so pandas labels the features by integer position.
data = pd.DataFrame(data=new_x_train)

data.describe()
    

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,143,144,145,146,147,148,149,150,151,152,153,154,155,156,157,158,159,160,161,162,163,164,165,166,167,168,169,170,171,172,173,174,175,176,177,178,179,180,181,182,183,184,185,186,187,188,189,190,191,192,193,194,195,196,197,198,199,200,201,202,203,204,205,206,207,208,209,210,211,212,213,214,215,216,217,218,219,220,221,222,223,224,225,226,227,228,229,230,231,232,233,234,235,236,237,238,239,240,241,242,243,244,245,246,247,248,249,250,251,252,253,254,255,256,257,258,259,260,261,262,263,264,265,266,267,268,269,270,271,272,273,274,275,276,277,278,279,280,281,282,283,284,285,286,287,288,289,290,291,292,293,294,295,296,297,298,299,300,301,302,303,304,305,306,307,308,309,310,311,312,313,314,315,316,317,318,319,320
count,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,26250
8.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0,262508.0
mean,-3.938317e-18,-8.259977e-17,-5.2121800000000006e-17,6.0529630000000004e-18,5.524471000000001e-17,-6.330708e-13,-1.393636e-15,-8.388624e-12,-8.388624e-12,0.0,-1.833736e-16,0.0,0.0,-3.131368e-18,1.3533729999999999e-20,-7.507839000000001e-17,-7.183030000000001e-17,2.2418630000000003e-17,0.0,0.0,6.221458e-17,-3.732063e-16,0.0,-1.278803e-16,-9.040535e-18,-3.248096e-18,1.955895e-16,-1.761416e-17,1.850332e-16,2.7392280000000002e-17,-1.322347e-16,-4.478313e-17,-8.991813e-17,7.277766000000001e-17,3.7109500000000004e-17,-6.049579e-18,-1.248352e-16,-6.640327000000001e-17,2.8204300000000003e-17,4.8660540000000006e-17,-1.007181e-16,-5.7653710000000004e-18,5.106278e-17,1.640965e-16,-8.533020000000001e-17,-1.119714e-16,1.943444e-17,2.796306e-16,-1.462049e-16,8.011971e-18,-9.286849000000001e-17,-9.135271000000001e-17,3.099225e-16,1.959685e-17,3.388171e-17,-8.120241e-19,-5.165827000000001e-17,-1.855407e-16,-4.055722e-17,-7.286225e-17,-2.2330660000000002e-17,-2.6424620000000003e-17,-8.214977e-18,-4.8910920000000003e-17,1.0529250000000001e-17,-1.034553e-16,1.943614e-16,-1.748153e-16,5.4568020000000004e-17,1.550154e-16,-1.076203e-16,-1.954813e-16,1.013e-16,1.248352e-16,2.811633e-17,-8.133775e-18,1.277568e-16,1.191104e-16,-1.4670570000000002e-17,-8.760006000000001e-17,-1.151721e-17,-1.325359e-16,6.799348000000001e-17,-1.290306e-16,2.7229870000000003e-17,2.107473e-16,2.0706610000000002e-17,-1.235495e-16,7.247315000000001e-17,-1.13115e-16,2.647875e-17,2.5632890000000004e-17,4.2665100000000006e-17,-4.330795e-18,-1.7688590000000002e-17,1.542592e-17,-2.6796800000000002e-18,-4.554778e-17,4.27666e-18,4.5750790000000003e-17,4.9892110000000004e-17,-8.817228e-18,-2.0814880000000002e-17,-1.145901e-16,-8.516103e-18,1.2166830000000001e-17,5.048083e-18,-6.142624e-18,-1.801932e-17,-8.120241e-20,1.776303e-18,-1.096233e-18,-2.1924650000000002e-18,8.763092999999998e-19,-1.437959e-18,8.763092999999998e-19,-7.8631e-18,1.520853e-18,1.3902530000000002e-17,1.006572e-18,3.5483759999999995e-19,6.293187e-19
,-9.913461e-19,-3.600819e-18,-2.200078e-18,-6.959723e-18,-1.559763e-18,-8.966099e-19,6.124015e-19,2.605244e-19,2.5534349999999998e-20,-6.208600999999999e-19,7.308217e-19,1.94632e-18,9.050684999999999e-19,1.040406e-19,4.8342500000000006e-17,-1.389745e-18,-1.336456e-18,1.8651179999999999e-19,-1.820287e-18,-5.166503e-18,-1.542169e-17,-9.965904e-18,8.482268e-18,-5.413494e-20,-2.343028e-19,-5.413494e-20,2.283818e-20,6.851453e-20,2.0469769999999998e-19,-1.505628e-19,3.637191e-20,1.6578829999999999e-19,2.0935e-19,-7.210943e-20,-1.281476e-19,-4.06012e-18,1.541154e-18,-1.375366e-18,7.578892e-19,1.250179e-18,1.302622e-18,5.0650000000000004e-18,-2.58156e-18,-6.22721e-18,8.353698e-18,2.116338e-18,-4.905979e-20,-2.510508e-18,6.922505e-18,-1.928557e-19,-2.963888e-18,-2.546034e-18,-5.927776e-18,2.7828739999999995e-19,2.652612e-18,-2.134947e-18,-7.257464999999999e-19,-3.532305e-18,1.688333e-18,9.230007e-18,-2.847159e-18,9.419479000000001e-18,-3.7556109999999995e-19,3.062008e-19,-9.486302e-19,-9.693537999999999e-19,5.548831e-19,-4.669139e-19,-2.723664e-19,-3.04509e-20,4.648838e-18,3.447042e-17,6.645064e-18,2.348103e-18,-4.398464e-19,8.316480000000001e-18,-2.7371980000000002e-17,8.001821e-18,-1.2248030000000001e-18,-6.412453e-18,6.892054e-18,1.819864e-18,3.638883e-18,-3.288698e-18,-2.568026e-18,3.308998e-18,-3.456178e-18,-3.219337e-18,3.535688e-18,-2.831934e-18,8.810461e-18,-1.2285250000000002e-17,-2.970655e-18,-2.758344e-18,1.7176e-16,3.357246e-16,7.819792000000001e-17,4.327412e-17,-2.02842e-13,-4.099016e-15,-6.008207e-14,7.343405e-17,6.580778999999999e-19,6.580778999999999e-19,-1.318693e-16,-5.5149970000000005e-17,5.130336e-13,8.000955e-15,1.632304e-16,5.625297000000001e-17,1.007451e-16,3.3015550000000005e-17,-3.456516e-17,-1.040474e-16,1.241991e-16,-1.020173e-16,4.2073e-17,-1.272171e-17,9.270608e-18,-1.205991e-16,4.15215e-17,2.035474e-17,6.117248e-17,-6.323638e-17,1.13433e-16,8.018061e-17,2.3832910000000003e-17,-1.556515e-16,1.377761e-15,-6.023803e-12,3.008788e-12,2.53456e-13,4.93
16930000000004e-17,3.7001230000000004e-17,8.643320000000001e-17,1.413328e-16,-4.181924e-17,9.412713e-18,-4.698913e-17,-3.3699e-18,9.798424000000001e-18,-7.419193e-17,-2.070661e-18,1.099548e-16,8.994472e-14,-2.333162e-13,3.319487e-13,1.304049e-13,3.17453e-13,-1.438979e-13,-1.565853e-17,5.72477e-17,1.104894e-16,-3.13306e-18,-2.619436e-13,-1.034907e-13,-9.978423000000001e-17,-4.4674860000000007e-17,3.853257e-15,1.332261e-15,3.3056150000000004e-17,-6.6924320000000005e-18,3.725161e-17,-3.997644e-13,3.586626e-13,-1.805806e-15,-1.048729e-14,-8.890310000000001e-17,6.983407e-18,1.165255e-17,-6.252586e-18,-2.905605e-15,-7.060288e-14,-1.441343e-17,-1.873069e-17,-1.869127e-14,4.211698e-17,-1.597657e-17,-1.3547270000000001e-17,1.46435e-17,1.975925e-18,3.6541080000000004e-18,-2.7432880000000002e-17,1.042639e-16,-8.895724000000001e-17,7.695282000000001e-17,-1.6240480000000003e-17,1.01503e-17,1.18339e-16,8.146632e-17,-7.18506e-17,-1.765882e-16,5.0832710000000004e-17,7.554531000000001e-17,-4.4823730000000007e-17,-6.85619e-17,2.706747e-17,6.008978e-18,6.6315300000000005e-18
std,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,0.0,0.7585951,0.0,0.0,0.7585951,0.009758871,0.7585575,0.7583666,0.7583641,0.0,0.0,0.6515623,0.6515652,0.0,0.6515652,0.6501781,0.642534,0.9999981,1.0,1.000002,0.7165085,1.000002,1.000002,1.0,1.0,1.0,0.6337738,1.000002,0.9307609,0.9307609,1.000002,1.000002,0.3663101,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,0.9999924,0.3584257,1.000002,1.000002,1.000002,1.000002,0.7585951,0.1735982,0.7585951,1.0,1.000002,0.9999981,0.9962521,0.9951196,0.9939993,0.9933035,0.3850589,0.9894263,0.98818,0.9873566,0.9866908,0.9860381,0.9855938,0.9849403,0.9838916,0.6460284,0.3735392,0.5260565,0.9832061,0.9820489,0.6924426,0.6917518,0.6910604,0.9679855,0.9667037,0.9652347,0.964133,0.9631625,0.9619891,0.9593005,0.8193035,0.8169078,0.816453,0.8159373,0.6695809,0.6692679,0.9554986,0.5559542,0.5555738,0.5551657,0.5499572,0.9534891,0.9524018,0.6562781,0.6580142,0.9517196,0.9500249,0.5088369,0.5084137,0.4333158,0.4333158,0.2570569,0.2570495,0.2570421,0.2570421,0.2570346,0.2558909,0.2570346,0.2570272,0.2570272,0.4961232,0.2330144,0.2328835,0.2327526,0.232638,0.2324906,0.2324087,0.2321135,0.4372627,0.08538872,0.08523244,0.08523244,0.04918316,0.07561708,0.08512063,0.08507586,0.08507586,0.08503107,0.5144286,0.1718891,0.1717783,0.0970603,0.1716785,0.1716008,0.3057253,0.2400206,0.3056007,0.04848106,0.0378966,0.02567158,0.02567158,0.03779594,0.03779594,0.03774552,0.03171258,0.03769502,0.03769502,0.04855958,0.03990412,0.2067131,0.1733457,0.1125786,0.1125955,0.1125786,0.2114952,0.2114232,0.2113961,0.2113331,0.3026383,0.1569935,0.05848813,0.2514458,0.2286993,0.2061502,0.228666,0.2208612,0.2285993,0.1260369,0.227455,0.11374,0.1068318,0.3500593,0.2118192,0.3499395,0.2978039,0.2977911,0.1219664,0.1218883,0.1218101,0.1218101,0.08982403,0.08978161,0.04285022,0.02350247,0.3972424,0.4082195,0.2815227,0.2814618,0.2412396,0.2949634,0.6151743,0.6150009,0.3679961,0.3673641,0.3447741,0.1211359,0.2148459,0.2147839,0.2158983,0
.2158366,0.2157836,0.2157571,0.2156865,0.2156512,0.2155628,0.2154921,0.2154126,0.2153507,1.000002,0.9999829,0.7523855,1.000002,0.9999657,1.000002,1.000002,0.8509086,0.3844153,0.3844153,0.3679961,1.000002,0.790601,1.000002,1.000002,1.000002,1.000002,1.000002,0.9307609,1.000002,1.000002,1.000002,0.9971599,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,0.9916799,1.000002,1.000002,1.000002,1.000002,0.9804941,0.9825899,0.964293,0.95783,0.95783,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,0.9559032,0.9582277,0.9543277,0.9566481,0.9549323,0.9522958,1.000002,1.000002,1.000002,1.000002,0.9499367,0.9410993,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,0.8176909,0.8108089,1.000002,1.000002,0.8132811,0.8064843,0.8081594,0.6618241,0.812918,0.6658211,0.8055485,0.8025471,0.9493571,1.000002,0.8013501,0.7983448,0.8099251,0.8081806,0.802153,0.8119005,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,1.000002,0.9971599,0.9971599,0.9971599,1.000002,1.000002,0.5966398,0.5966398,0.9500249
min,-1.808148,-1.537611,-1.590842,-1.55061,-1.618625,-0.1600193,-0.4202585,-1.261404,-1.261404,0.0,-0.01286546,0.0,0.0,-1.094049,-1.457738,-0.992919,-1.2918,-1.889051,0.0,0.0,-1.012815,-0.07540028,0.0,-0.26898,-1.136031,-0.2765811,-1.410625,-1.610091,-1.778055,-1.436677,-0.1986416,-0.4747186,-2.249889,-0.4608104,-1.173602,-0.3855478,-0.2642185,-0.4340845,-0.8640587,-3.07669,-1.985949,-0.4431099,-2.354313,-2.383004,-2.136109,-1.112825,-1.53288,-2.915208,-2.465003,-2.933897,-1.170807,-0.7479109,-3.657163,-0.4573154,-2.09141,-0.6026332,-0.3380748,-1.961086,-1.021925,-1.720834,-0.6028173,-0.4043282,-0.3113763,-0.389598,-1.770073,-1.195783,-1.988095,-2.270973,-1.689343,-1.504073,-2.52399,-1.962598,-0.8251589,-1.622886,-0.7451817,-0.8991199,-4.038644,-1.219149,-0.2348051,-1.866215,-0.3293866,-1.387197,-0.7892543,-1.424257,-1.14198,-1.394799,-0.9466116,-0.4310274,-2.182067,-0.4947361,-0.7112927,-2.133808,-0.5199605,-0.739659,-1.372215,-0.6916826,-0.7553104,-1.540155,-0.5501902,-0.2921897,-0.731238,-0.7633224,-0.5922089,-0.6413422,-0.7784054,-1.062962,-0.3292643,-0.4847535,-2.687785,-1.290246,-0.5587273,-0.5922429,-0.4828341,-0.4724503,-0.6343592,-0.9658679,-1.276455,-0.7425975,-1.360004,-0.7639005,-1.536079,-0.6989504,-0.6719167,-0.7385662,-0.3952225,-3.344739,-0.8610207,-0.4273618,-0.676618,-1.292158,-0.481741,-1.369382,-0.5546014,-1.705141,-2.162938,-1.782288,-1.577037,-2.186768,-2.438601,-0.9405225,-2.139662,-0.8153585,-0.6167883,-2.668301,-1.150678,-1.575179,-0.7943862,-1.558757,-1.346011,-0.8621393,-1.872342,-1.16611,-1.477795,-1.207087,-1.293924,-0.7287194,-1.002335,-1.413009,-2.735135,-1.5637,-0.3016595,-0.4482522,-1.241195,-0.9771035,-0.6039101,-1.721684,-1.512396,-0.8567277,-0.4936733,-0.9946727,-0.3780945,-0.6232134,-0.1782429,-0.9302733,-0.8550522,-0.8439574,-1.190945,-0.2721939,-0.6142958,-0.9610759,-1.276491,-0.4864715,-1.437605,-1.358949,-0.503719,-0.7770103,-0.5537067,-0.5343972,-0.5961003,-0.5092195,-1.168291,-0.3211841,-2.250255,-2.840896,-0.8345053,-2.581
506,-0.6990093,-2.036075,-0.2048117,-5.568187,-0.5050304,-0.3977015,-0.8063997,-0.4756831,-0.6511814,-0.7400477,-1.66532,-1.838707,-1.256481,-0.9666822,-1.519531,-2.395012,-2.624788,-3.075874,-1.6331,-1.514008,-0.9711092,-0.1960308,-0.8944903,-1.811015,-0.6457551,-1.575476,-0.7256053,-2.329004,-0.2816297,-0.2816297,-0.5912694,-0.8390723,-2.680514,-0.5724717,-0.3680259,-0.7740636,-0.6701842,-0.3425743,-0.5654547,-0.2887858,-0.2032753,-2.308834,-1.405276,-0.1683716,-0.1749115,-1.357474,-0.4474702,-0.3284288,-0.4443904,-0.4752379,-1.943498,-0.7263968,-2.192266,-2.214177,-7.434743,-7.423834,-2.687515,-2.391774,-2.342345,-0.6102953,-0.4714898,-1.875171,-1.526618,-1.743516,-0.2919003,-0.5176595,-0.3075373,-0.3080451,-0.2581055,-0.2737237,-0.531603,-0.8888628,-0.5656496,-0.8113019,-0.5914879,-0.9542556,-0.3172122,-0.3288197,-3.040299,-2.783197,-0.9719944,-1.178004,-0.4855331,-0.4372977,-69.71556,-86.59809,-0.3289183,-0.3593001,-0.4203493,-2.554573,-1.091826,-0.3245071,-0.1464742,-2.327163,-1.07344,-0.9577512,-0.9141709,-1.316521,-0.9130488,-0.6141513,-0.3499104,-0.5325338,-0.32533,-0.5882535,-0.3748544,-0.6400326,-0.3497141,-0.2743582,-0.4171214,-0.9132689,-0.5517629,-0.6535004,-0.7483791,-0.6395052,-0.65196,-1.038836,-0.7104101,-1.30443,-1.347045,-2.108169,-0.3478134,-0.3755851,-0.5114884,-0.5065748,-0.6729425
25%,-0.6855456,-0.9641525,-0.9546576,-0.9780414,-0.8992298,-0.1600193,-0.4202585,-0.7528939,-0.7528939,0.0,-0.01286546,0.0,0.0,-1.094049,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.07540028,0.0,-0.26898,0.0,-0.08312571,-0.5140598,-1.232333,-0.9966411,0.0,-0.1986416,-0.4747186,0.2062851,-0.4608104,-1.173602,-0.3855478,-0.2642185,-0.4340845,-0.8640587,0.09174294,0.2686157,0.0,0.2088871,0.2301387,0.1289811,-1.112825,0.3028808,0.05948062,0.3379525,0.0,-1.170807,-0.7479109,-0.8606634,-0.4573154,0.0,0.0,-0.3380748,0.262667,-1.021925,-1.641287,-0.476785,-0.4043282,-0.2659683,-0.1712524,0.0,0.0,0.2234032,0.0629934,0.1077858,0.2507258,0.07092832,0.107899,-0.8251589,0.0,0.0,0.0,0.04789237,-0.935326,-0.1392097,0.0,-0.2574066,-0.8565259,-0.7821919,-0.7427009,-0.412463,-0.6927678,-0.9391031,-0.4310274,0.0,-0.4593046,-0.5172841,0.0,-0.4633388,-0.1462637,-1.095795,0.0,0.0,0.0,0.0,-0.2921897,-0.731238,-0.2114039,0.0,-0.6413422,-0.7784054,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.2048117,-0.0928123,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.9711092,-0.1960308,-0.8944903,-0.6883914,-0.5402319,-0.6266799,-0.5758252,0.0,0.0,0.0,0.0,-0.8390723,0.0,-0.4809648,-0.3680259,-0.7740636,-0.6701842,-0.3425743,-0.5654547,-0.2887858,-0.2032753,0.2255006,-1.405276,-0.1683716,-0.1749115,0.02344064,-0.4474702,-0.3284288,-0.4443904,-0.4752379,-0.7987887,-0.7263968,-0.7247915,-0.9266374,-0.6576066,-0.6096242,-0.5927656,-0.598691,-1.1324,-0.6102953,-0.4714898,-0.9177537,-0.6958665,-0.3738767,-0.2919003,-0.5176595,-0.3075373,-0.3080451,-0.2581055,-0.2737237,-0.531603,-0.5083897,-0.4246897,-0.5688545,-0.4522249,-0.4441666,-0.3172122,-0.3288197,0.3289151,0.359299,-0.5
434832,-0.472201,-0.4855331,-0.4372977,0.014344,0.0115476,-0.3289183,-0.3593001,-0.4203493,-0.4107988,-1.091826,-0.1652891,-0.1197525,-0.5085258,-1.07344,-0.5131497,-0.1538098,-0.3557265,-0.04051618,-0.3335007,-0.3499104,-0.5325338,-0.32533,-0.3348725,-0.3748544,-0.3758317,-0.3497141,-0.2743582,-0.4171214,-0.9132689,-0.5517629,-0.6535004,-0.7483791,-0.6395052,-0.1998086,-0.6211467,-0.301142,-0.5438722,-0.6037643,-0.5172069,-0.3478134,-0.3755851,-0.1131796,-0.1452747,-0.6729425
50%,-0.06187762,-0.1039644,-0.09208214,-0.1191878,-0.05993586,-0.1600193,-0.4202585,-0.2259365,-0.2259365,0.0,-0.01286546,0.0,0.0,0.0,0.0,0.0,0.0,0.01446182,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.5140598,0.7374034,0.6499092,0.0,-0.1986416,-0.4747186,0.2062851,-0.4608104,0.762819,0.0,-0.2642185,-0.4340845,0.5098876,0.09174294,0.2686157,0.0,0.2088871,0.2301387,0.1289811,0.4890651,0.3028808,0.05948062,0.3379525,0.0,0.8541117,-0.7479109,0.07150297,-0.4573154,0.05942912,0.0,0.0,0.262667,-0.3254805,0.5860468,-0.4137689,-0.4043282,-0.2546163,-0.1690616,0.0,0.3120446,0.2234032,0.0629934,0.1077858,0.2507258,0.07092832,0.107899,0.5202092,0.0,0.0,0.0,0.04789237,0.0,0.0,0.0,0.0,-0.2738282,-0.06889491,-0.07450906,-0.3835713,0.0,-0.1732374,-0.4310274,0.0,0.0,-0.04898737,0.0,0.0,0.0,0.7816688,0.0,0.0,0.0,0.0,-0.2921897,0.0,0.0,0.0,-0.04120455,0.07772671,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.5732903,-0.1960308,0.0,-0.05839784,-0.3715231,-0.6266799,-0.3589046,0.4894392,0.0,0.0,0.0,-0.5734754,0.0,-0.3398304,-0.3680259,-0.7740636,-0.6701842,-0.3425743,0.0,-0.2887858,-0.2032753,0.2255006,0.7116038,-0.1683716,-0.1749115,0.02344064,-0.4474702,-0.3284288,-0.4443904,-0.4752379,0.05974328,-0.7263968,0.1556931,0.3609023,0.0,0.0,-0.06907822,-0.08830607,0.07754513,-0.127484,-0.4714898,0.03966321,0.1348845,0.310943,-0.2919003,0.0954729,-0.2918838,-0.3080451,-0.2571143,-0.2737237,-0.3373059,-0.004041594,-0.2233184,-0.141006,-0.1935936,0.0,-0.3172122,-0.3288197,0.3289151,0.359299,-0.157823,-0.05595853,-0.4855331,-0.4372977,0.014344,0.0115476,-0.3289183,-0.3593001,-0.4203493,0.0,0.0,-0.1200267,-0.112
1046,0.0,0.0,-0.05321719,0.0,0.0,0.0,0.0,0.0,-0.5325338,-0.32533,0.0,0.0,0.0,0.0,-0.08665129,0.0,-0.101532,-0.1501286,-0.251859,-0.3406166,-0.2352798,-0.1998086,-0.2034571,-0.301142,0.2166858,0.1395164,0.2782742,-0.3478134,-0.3755851,0.0,0.0,0.02296943
75%,0.8736243,0.7562238,0.9911521,1.02595,0.779358,-0.1600193,-0.4202585,0.4852498,0.4852498,0.0,0.0,0.0,0.0,0.9140359,0.0,0.257493,0.3204325,0.01446182,0.0,0.0,0.0,0.0,0.0,0.0,0.6570899,0.0,0.3825052,0.7374034,0.6499092,0.8473123,-0.1986416,-0.4747186,0.2062851,0.3410799,0.762819,0.0,-0.2642185,0.0,0.5098876,0.09174294,0.2686157,0.0,0.2088871,0.2301387,0.1289811,0.4890651,0.3028808,0.05948062,0.3379525,0.0,0.8541117,0.4380591,1.003669,0.7673614,0.05942912,0.0,0.0,0.262667,1.067409,0.5860468,-0.3822608,-0.4043282,-0.2387235,-0.1668709,0.0,0.3120446,0.2234032,0.0629934,0.1077858,0.2507258,0.07092832,0.107899,0.5202092,0.6353382,0.0,0.0,0.04789237,0.992421,0.0,0.5621048,0.0,0.9748098,0.6444021,0.0,0.3676144,0.05791852,0.6226622,0.0,0.4888358,0.0,0.0,0.497778,0.0,0.0,0.7816688,0.0,0.0,0.0,0.0,-0.2921897,0.55035,0.0,0.0,-0.04120455,0.07772671,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.017985,-0.1960308,0.0,0.8707832,-0.04346631,0.7965147,0.08953307,0.4894392,0.0,0.0,0.0,1.285703,0.5011022,0.05263273,-0.3680259,1.33402,0.9106433,-0.3425743,0.590951,-0.2887858,-0.2032753,0.2255006,0.7116038,-0.1683716,-0.1749115,0.02344064,-0.4474702,-0.3284288,-0.4443904,-0.4752379,0.6320979,1.247302,0.8013818,1.004672,0.7946369,0.8100028,0.4546092,0.3562228,1.28749,-0.127484,0.3607163,0.9970801,0.1348845,0.310943,-0.2919003,0.0954729,-0.166656,-0.3080451,-0.2430213,-0.2737237,0.1110722,0.0,0.09887574,0.2012727,0.06503775,0.231998,-0.3172122,-0.3288197,0.3289151,0.359299,0.4563764,0.227569,-0.05243393,-0.03876365,0.014344,0.0115476,-0.3289183,-0.3593001,0.03388203,0.0,0.3440881,-0.05537968,-0
.1013238,0.0,0.1538794,0.0,0.0,0.2231115,0.0,0.0,0.0,0.2956608,-0.32533,0.0,0.0,0.0,0.0,0.0,0.0,0.3043364,-0.1501286,0.1497824,0.06714596,-0.2352798,-0.1998086,0.2142324,-0.301142,0.2166858,0.1395164,0.2782742,-0.3478134,-0.3755851,0.0,0.0,0.02296943
max,2.619895,1.616412,1.647397,1.598519,1.978349,6.249248,2.379488,4.378084,4.378084,0.0,77.72747,0.0,0.0,0.9140359,0.6859943,22.76491,27.72839,17.14608,0.0,0.0,0.9873471,13.26255,0.0,3.717748,13.20894,18.68205,5.761895,1.034213,0.9568931,1.136093,15.78573,9.179748,17.3995,5.954312,6.572083,17.41427,8.527287,7.30053,10.12751,22.27077,16.05057,6.915298,18.15129,18.52214,15.98461,11.7023,13.15321,20.8823,8.746818,2.442588,0.8541117,3.995969,3.800168,9.340099,15.1153,6.093197,11.63214,15.82894,1.763854,0.8777214,2.484974,13.58736,4.206267,6.762499,12.27468,10.86684,15.70389,16.40076,12.68768,12.53432,18.23536,14.60138,9.937786,7.410012,12.38586,14.37673,12.3075,1.304345,9.13354,0.8691337,6.724658,3.28479,5.552733,4.576106,5.344219,4.847019,5.79601,10.71025,1.97267,10.11109,5.96528,1.259553,9.649299,5.242245,1.085457,8.884268,6.257384,7.017002,8.287461,8.100383,9.521466,5.295357,17.99849,4.159759,6.070651,1.714422,8.705738,5.741643,9.279807,13.99054,2.751332,2.585753,3.01467,2.919428,2.052969,4.535071,10.29278,12.07624,12.10727,10.69419,3.670399,3.964052,4.922846,10.27222,11.79371,2.594139,4.82149,7.764045,5.011746,6.146771,9.077808,4.658309,6.115645,5.438778,11.36284,9.008089,11.81888,3.685753,3.907312,5.403595,3.570778,9.924103,11.29819,4.706166,11.51446,1.058414,7.227496,0.8996548,0.9975675,1.467881,0.8774715,1.696073,0.9562205,1.589457,0.9434506,7.308293,11.18606,14.48441,9.085023,13.85662,5.495777,4.689853,6.776471,10.46677,9.057827,13.63252,3.484088,4.235627,3.04047,8.985578,14.2916,5.263182,13.49925,3.721547,2.344295,3.496841,11.52339,15.56285,5.193768,10.37744,3.24126,12.38573,9.394627,3.457583,5.854334,5.68944,5.961966,5.754053,4.69757,5.50618,5.85968,7.440766,3.517884,3.982573,6.561004,3.33578,5.747574,2.261132,6.252125,9.032812,4.259337,4.086681,4.613426,5.655933,5.605427,8.017229,0.9485094,0.8910071,1.188364,1.493503,1.010479,0.8102253,0.7970877,0.7891205,13.22752,12.37562,1.614714,10.3898,1.426625,2.62315,9.368511,5.066099,14.55706,0.4894392,4.122915,4.1229
15,18.45303,1.285703,1.491116,32.80527,13.94824,1.33402,11.97644,4.823986,8.685791,14.34325,10.89114,7.828504,0.7116038,7.642634,7.630991,9.689843,3.083837,7.110167,4.817407,3.726661,1.776807,3.221001,1.447071,1.004672,6.845651,6.772436,9.650541,10.42024,1.28749,3.252195,6.186159,5.784165,1.796387,3.735042,4.76343,4.3874,4.388506,4.002419,4.04736,4.021781,147.4332,86.70843,198.7919,140.3787,196.3662,116.4849,3.457869,3.37271,0.3289151,0.359299,106.1558,119.0437,2.979261,2.750974,0.014344,0.0115476,6.381296,5.911087,3.213502,5.285515,3.744938,9.023907,9.049922,1.310111,1.381198,8.210237,6.79254,32.97868,30.23167,142.2771,126.5168,43.38351,3.262408,99.75061,97.02829,70.69421,60.33846,67.30013,44.85288,2.333678,2.661312,2.559631,2.513721,2.594298,2.965251,2.30268,2.563735,4.780034,4.599201,4.25568,3.05354,3.039121,2.674982,2.383826,4.894353


# Build the model

In [62]:
# Hyper-parameters of the gradient descent run.
max_iters = 50
gamma = 0.2

# Start from the all-zero weight vector (one weight per column of new_x_train).
w_initial = np.zeros((new_x_train.shape[1],))

# Run gradient descent and measure its wall-clock duration.
start_time = datetime.datetime.now()
gd_ws, gd_losses = mean_squared_error_gd(y_train, new_x_train, w_initial, max_iters, gamma)
end_time = datetime.datetime.now()

# Report the outcome of the run.
execution_time = (end_time - start_time).total_seconds()
print("Gradient Descent: execution time={t:.3f} seconds".format(t=execution_time))
print("Gradient Descent: loss={l}".format(l=gd_losses))
print("Gradient Descent: w={w}".format(w=gd_ws))

# Fail fast on a diverged / corrupted run. Non-finite weights would otherwise
# flow silently into the evaluation and submission cells, where NaN scores
# fail both the `<= 0` and the `> 0` threshold tests and are never mapped to
# a label.
# NOTE(review): the likely causes are NaN/inf entries in the inputs or a step
# size that is too large for this data; confirm which one applies.
if not np.all(np.isfinite(gd_ws)):
    raise ValueError(
        "Gradient descent produced non-finite weights (NaN/inf). "
        "Check new_x_train and y_train for NaN/inf values and try a smaller "
        "gamma before evaluating the model or creating a submission."
    )

GD iter. 0/49: loss=nan, w0=nan, w1=nan
GD iter. 1/49: loss=nan, w0=nan, w1=nan
GD iter. 2/49: loss=nan, w0=nan, w1=nan
GD iter. 3/49: loss=nan, w0=nan, w1=nan
GD iter. 4/49: loss=nan, w0=nan, w1=nan
GD iter. 5/49: loss=nan, w0=nan, w1=nan
GD iter. 6/49: loss=nan, w0=nan, w1=nan
GD iter. 7/49: loss=nan, w0=nan, w1=nan
GD iter. 8/49: loss=nan, w0=nan, w1=nan
GD iter. 9/49: loss=nan, w0=nan, w1=nan
GD iter. 10/49: loss=nan, w0=nan, w1=nan
GD iter. 11/49: loss=nan, w0=nan, w1=nan
GD iter. 12/49: loss=nan, w0=nan, w1=nan
GD iter. 13/49: loss=nan, w0=nan, w1=nan
GD iter. 14/49: loss=nan, w0=nan, w1=nan
GD iter. 15/49: loss=nan, w0=nan, w1=nan
GD iter. 16/49: loss=nan, w0=nan, w1=nan
GD iter. 17/49: loss=nan, w0=nan, w1=nan
GD iter. 18/49: loss=nan, w0=nan, w1=nan
GD iter. 19/49: loss=nan, w0=nan, w1=nan
GD iter. 20/49: loss=nan, w0=nan, w1=nan
GD iter. 21/49: loss=nan, w0=nan, w1=nan
GD iter. 22/49: loss=nan, w0=nan, w1=nan
GD iter. 23/49: loss=nan, w0=nan, w1=nan
GD iter. 24/49: loss=nan, 

# Test the model

In [58]:
# Preprocess the validation features with the `mean` / `std` statistics from
# an earlier cell (presumably the training-set statistics; verify), then score
# them with the learned weights.
new_x_val = preprocessing_dataset_test_naive(x_val, mean, std)
y_pred = new_x_val @ gd_ws

# Threshold the raw scores at zero to obtain labels in {-1, 1}.
# Both masks are taken from the raw scores before anything is overwritten.
is_non_positive = y_pred <= 0
is_positive = y_pred > 0
y_pred[is_non_positive] = -1
y_pred[is_positive] = 1

def precision(y_pred, y_test):
    """Fraction of the samples predicted positive (label 1) that are truly positive.

    Args:
        y_pred: array-like of predicted labels; 1 marks the positive class.
        y_test: array-like of true labels, expected to have the same shape
            as y_pred.

    Returns:
        TP / (TP + FP). Returns 0.0 when no sample is predicted positive,
        instead of the NaN (and RuntimeWarning) a 0/0 division would produce.
    """
    y_pred = np.asarray(y_pred)
    y_test = np.asarray(y_test)

    predicted_positive = y_pred == 1
    n_predicted_positive = np.sum(predicted_positive)
    if n_predicted_positive == 0:
        # Precision is undefined here; 0.0 keeps downstream scores finite.
        return 0.0

    true_positives = np.sum(y_test[predicted_positive] == 1)
    return true_positives / n_predicted_positive

def recall(y_pred, y_test):
    """Fraction of the truly positive samples (label 1) that are predicted positive.

    Args:
        y_pred: array-like of predicted labels; 1 marks the positive class.
        y_test: array-like of true labels, expected to have the same shape
            as y_pred.

    Returns:
        TP / (TP + FN). Returns 0.0 when y_test contains no positive sample,
        instead of the NaN (and RuntimeWarning) a 0/0 division would produce.
    """
    y_pred = np.asarray(y_pred)
    y_test = np.asarray(y_test)

    actual_positive = y_test == 1
    n_actual_positive = np.sum(actual_positive)
    if n_actual_positive == 0:
        # Recall is undefined here; 0.0 keeps downstream scores finite.
        return 0.0

    true_positives = np.sum(y_pred[actual_positive] == 1)
    return true_positives / n_actual_positive

def accuracy(y_pred, y_test):
    """Share of samples whose predicted label equals the true label.

    Args:
        y_pred: array of predicted labels.
        y_test: array of true labels, compared element-wise with y_pred.

    Returns:
        Number of matching labels divided by len(y_test).
    """
    n_correct = np.sum(y_pred == y_test)
    n_total = len(y_test)
    return n_correct / n_total

def f1_score(y_pred, y_test):
    """Harmonic mean of precision and recall for the positive class (label 1).

    Args:
        y_pred: array of predicted labels; 1 marks the positive class.
        y_test: array of true labels.

    Returns:
        2 * precision * recall / (precision + recall), or 0.0 when that ratio
        is undefined (precision and recall are both zero, or either is NaN).
    """
    prec = precision(y_pred, y_test)
    rec = recall(y_pred, y_test)
    denominator = prec + rec
    # `not (denominator > 0)` is true for 0 and for NaN alike, so a degenerate
    # classifier gets a finite 0.0 instead of NaN.
    if not denominator > 0:
        return 0.0
    return 2 * prec * rec / denominator

# Report each validation metric next to its label.
for metric_label, metric_fn in (
    ("Precision: ", precision),
    ("Recall: ", recall),
    ("Accuracy: ", accuracy),
    ("F1 score: ", f1_score),
):
    print(metric_label, metric_fn(y_pred, y_val))

Precision:  0.12568984946112283
Recall:  0.7681440932368003
Accuracy:  0.5189175187041919
F1 score:  0.21603098927294398


# Create Submission

In [39]:
# Preprocess the test features with the `mean` / `std` statistics from an
# earlier cell (presumably the training-set statistics; verify), then score
# them with the learned weights.
new_x_test = preprocessing_dataset_test_naive(x_test, mean, std)
y_pred = new_x_test @ gd_ws

# Refuse to write a submission from NaN scores: NaN fails both comparisons
# below, so it would never be mapped to a label and would be passed to
# create_csv_submission unchanged.
if np.isnan(y_pred).any():
    raise ValueError(
        "Test predictions contain NaN; the model weights or the preprocessed "
        "test features are not finite. Fix training/preprocessing before "
        "creating a submission."
    )

# Threshold the raw scores at zero to obtain labels in {-1, 1}.
y_pred[y_pred <= 0] = -1
y_pred[y_pred > 0] = 1

create_csv_submission(test_ids, y_pred, "data/submission_gd.csv")