In [72]:
import numpy as np
import pandas as pd

from sklearn.naive_bayes import GaussianNB, BernoulliNB, MultinomialNB
from sklearn.datasets import fetch_olivetti_faces
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, MinMaxScaler
from sklearn.feature_extraction.text import CountVectorizer, HashingVectorizer, TfidfVectorizer
from sklearn import metrics

In [73]:
data = fetch_olivetti_faces()
print(data.DESCR)

.. _olivetti_faces_dataset:

The Olivetti faces dataset
--------------------------

`This dataset contains a set of face images`_ taken between April 1992 and 
April 1994 at AT&T Laboratories Cambridge. The
:func:`sklearn.datasets.fetch_olivetti_faces` function is the data
fetching / caching function that downloads the data
archive from AT&T.

.. _This dataset contains a set of face images: http://www.cl.cam.ac.uk/research/dtg/attarchive/facedatabase.html

As described on the original website:

    There are ten different images of each of 40 distinct subjects. For some
    subjects, the images were taken at different times, varying the lighting,
    facial expressions (open / closed eyes, smiling / not smiling) and facial
    details (glasses / no glasses). All the images were taken against a dark
    homogeneous background with the subjects in an upright, frontal position 
    (with tolerance for some side movement).

**Data Set Characteristics:**

    Classes                        

In [74]:
pd.DataFrame(data.data)

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,...,4056,4057,4058,4059,4060,4061,4062,4063,4064,4065,4066,4067,4068,4069,4070,4071,4072,4073,4074,4075,4076,4077,4078,4079,4080,4081,4082,4083,4084,4085,4086,4087,4088,4089,4090,4091,4092,4093,4094,4095
0,0.309917,0.367769,0.417355,0.442149,0.528926,0.607438,0.657025,0.677686,0.690083,0.685950,0.702479,0.698347,0.694215,0.698347,0.690083,0.694215,0.690083,0.698347,0.702479,0.702479,0.698347,0.706612,0.710744,0.719008,0.727273,0.756198,0.772727,0.776860,0.776860,0.756198,0.760331,0.780992,0.760331,0.768595,0.756198,0.739669,0.743802,0.739669,0.743802,0.719008,...,0.756198,0.752066,0.694215,0.690083,0.681818,0.681818,0.657025,0.648760,0.636364,0.632231,0.636364,0.623967,0.619835,0.644628,0.681818,0.685950,0.677686,0.681818,0.673554,0.665289,0.632231,0.582645,0.541322,0.537190,0.537190,0.553719,0.570248,0.611570,0.632231,0.657025,0.665289,0.669421,0.652893,0.661157,0.475207,0.132231,0.148760,0.152893,0.161157,0.157025
1,0.454545,0.471074,0.512397,0.557851,0.595041,0.640496,0.681818,0.702479,0.710744,0.702479,0.710744,0.698347,0.702479,0.706612,0.706612,0.714876,0.714876,0.706612,0.698347,0.714876,0.698347,0.723140,0.731405,0.743802,0.756198,0.772727,0.768595,0.785124,0.764463,0.756198,0.731405,0.743802,0.735537,0.719008,0.706612,0.714876,0.719008,0.710744,0.710744,0.706612,...,0.673554,0.661157,0.652893,0.628099,0.632231,0.644628,0.640496,0.628099,0.632231,0.636364,0.628099,0.619835,0.619835,0.603306,0.590909,0.561983,0.516529,0.533058,0.578512,0.570248,0.561983,0.557851,0.545455,0.111570,0.095041,0.152893,0.152893,0.128099,0.136364,0.132231,0.136364,0.157025,0.136364,0.148760,0.152893,0.152893,0.152893,0.152893,0.152893,0.152893
2,0.318182,0.400826,0.491736,0.528926,0.586777,0.657025,0.681818,0.685950,0.702479,0.698347,0.702479,0.706612,0.706612,0.714876,0.710744,0.706612,0.706612,0.706612,0.723140,0.719008,0.719008,0.710744,0.710744,0.752066,0.756198,0.764463,0.785124,0.797521,0.838843,0.826446,0.842975,0.847107,0.830579,0.818182,0.793388,0.768595,0.760331,0.756198,0.739669,0.710744,...,0.719008,0.714876,0.706612,0.685950,0.665289,0.652893,0.644628,0.636364,0.623967,0.636364,0.657025,0.644628,0.677686,0.681818,0.690083,0.690083,0.690083,0.681818,0.661157,0.652893,0.636364,0.586777,0.545455,0.570248,0.607438,0.603306,0.595041,0.578512,0.607438,0.413223,0.074380,0.132231,0.181818,0.136364,0.128099,0.148760,0.144628,0.140496,0.148760,0.152893
3,0.198347,0.194215,0.194215,0.194215,0.190083,0.190083,0.243802,0.404959,0.483471,0.516529,0.537190,0.566116,0.574380,0.586777,0.611570,0.632231,0.640496,0.657025,0.673554,0.694215,0.702479,0.719008,0.727273,0.719008,0.723140,0.710744,0.739669,0.747934,0.756198,0.756198,0.764463,0.772727,0.785124,0.785124,0.805785,0.818182,0.805785,0.809917,0.793388,0.789256,...,0.400826,0.442149,0.479339,0.512397,0.537190,0.557851,0.566116,0.586777,0.586777,0.615702,0.632231,0.661157,0.681818,0.673554,0.714876,0.710744,0.706612,0.690083,0.681818,0.623967,0.615702,0.586777,0.582645,0.578512,0.590909,0.590909,0.611570,0.628099,0.644628,0.657025,0.652893,0.636364,0.657025,0.685950,0.727273,0.743802,0.764463,0.752066,0.752066,0.739669
4,0.500000,0.545455,0.582645,0.623967,0.648760,0.690083,0.694215,0.714876,0.723140,0.731405,0.739669,0.739669,0.764463,0.756198,0.764463,0.785124,0.793388,0.797521,0.814050,0.809917,0.809917,0.818182,0.830579,0.830579,0.842975,0.838843,0.838843,0.838843,0.830579,0.818182,0.805785,0.801653,0.797521,0.793388,0.793388,0.785124,0.797521,0.801653,0.793388,0.793388,...,0.561983,0.557851,0.574380,0.595041,0.599174,0.611570,0.623967,0.636364,0.669421,0.681818,0.698347,0.698347,0.714876,0.710744,0.764463,0.756198,0.785124,0.797521,0.739669,0.714876,0.681818,0.619835,0.293388,0.144628,0.152893,0.152893,0.157025,0.148760,0.161157,0.161157,0.190083,0.161157,0.177686,0.173554,0.177686,0.177686,0.177686,0.177686,0.173554,0.173554
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
395,0.400826,0.495868,0.570248,0.632231,0.648760,0.640496,0.661157,0.636364,0.665289,0.698347,0.702479,0.657025,0.665289,0.731405,0.747934,0.768595,0.768595,0.768595,0.780992,0.809917,0.809917,0.814050,0.818182,0.814050,0.809917,0.818182,0.805785,0.809917,0.805785,0.822314,0.814050,0.818182,0.814050,0.805785,0.797521,0.793388,0.789256,0.780992,0.785124,0.772727,...,0.206612,0.231405,0.280992,0.330579,0.330579,0.351240,0.351240,0.347107,0.347107,0.355372,0.376033,0.371901,0.359504,0.342975,0.363636,0.309917,0.301653,0.252066,0.276859,0.314050,0.334711,0.322314,0.330579,0.347107,0.338843,0.351240,0.371901,0.363636,0.351240,0.367769,0.388430,0.396694,0.264463,0.099174,0.181818,0.243802,0.247934,0.161157,0.157025,0.136364
396,0.367769,0.367769,0.351240,0.301653,0.247934,0.247934,0.367769,0.512397,0.574380,0.628099,0.652893,0.669421,0.698347,0.731405,0.760331,0.768595,0.797521,0.801653,0.801653,0.805785,0.809917,0.814050,0.818182,0.826446,0.826446,0.822314,0.826446,0.826446,0.826446,0.822314,0.826446,0.830579,0.826446,0.826446,0.822314,0.830579,0.826446,0.834711,0.834711,0.830579,...,0.772727,0.776860,0.785124,0.797521,0.793388,0.797521,0.805785,0.814050,0.805785,0.809917,0.801653,0.805785,0.801653,0.801653,0.780992,0.752066,0.723140,0.710744,0.690083,0.648760,0.623967,0.599174,0.590909,0.590909,0.582645,0.566116,0.541322,0.520661,0.491736,0.446281,0.380165,0.334711,0.289256,0.285124,0.338843,0.404959,0.458678,0.487603,0.512397,0.549587
397,0.500000,0.533058,0.607438,0.628099,0.657025,0.632231,0.657025,0.669421,0.673554,0.702479,0.719008,0.735537,0.702479,0.698347,0.752066,0.768595,0.785124,0.793388,0.801653,0.805785,0.814050,0.822314,0.822314,0.822314,0.826446,0.814050,0.814050,0.801653,0.805785,0.805785,0.805785,0.805785,0.809917,0.809917,0.801653,0.805785,0.789256,0.789256,0.789256,0.785124,...,0.483471,0.491736,0.537190,0.541322,0.557851,0.561983,0.570248,0.574380,0.557851,0.545455,0.533058,0.549587,0.541322,0.524793,0.512397,0.504132,0.466942,0.450413,0.404959,0.371901,0.342975,0.347107,0.363636,0.367769,0.367769,0.376033,0.417355,0.111570,0.198347,0.239669,0.194215,0.148760,0.152893,0.161157,0.161157,0.173554,0.157025,0.177686,0.148760,0.190083
398,0.214876,0.219008,0.219008,0.223140,0.210744,0.202479,0.276859,0.400826,0.487603,0.549587,0.595041,0.615702,0.648760,0.690083,0.719008,0.752066,0.768595,0.785124,0.785124,0.789256,0.797521,0.793388,0.793388,0.814050,0.814050,0.818182,0.822314,0.818182,0.818182,0.814050,0.818182,0.805785,0.818182,0.809917,0.818182,0.818182,0.826446,0.830579,0.838843,0.822314,...,0.714876,0.723140,0.735537,0.756198,0.764463,0.760331,0.772727,0.793388,0.789256,0.814050,0.805785,0.797521,0.789256,0.793388,0.789256,0.768595,0.756198,0.752066,0.731405,0.698347,0.690083,0.657025,0.652893,0.669421,0.648760,0.611570,0.595041,0.574380,0.549587,0.504132,0.446281,0.392562,0.367769,0.409091,0.479339,0.524793,0.545455,0.574380,0.590909,0.603306


In [75]:
data.target

array([ 0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  1,  1,  1,  1,  1,  1,  1,
        1,  1,  1,  2,  2,  2,  2,  2,  2,  2,  2,  2,  2,  3,  3,  3,  3,
        3,  3,  3,  3,  3,  3,  4,  4,  4,  4,  4,  4,  4,  4,  4,  4,  5,
        5,  5,  5,  5,  5,  5,  5,  5,  5,  6,  6,  6,  6,  6,  6,  6,  6,
        6,  6,  7,  7,  7,  7,  7,  7,  7,  7,  7,  7,  8,  8,  8,  8,  8,
        8,  8,  8,  8,  8,  9,  9,  9,  9,  9,  9,  9,  9,  9,  9, 10, 10,
       10, 10, 10, 10, 10, 10, 10, 10, 11, 11, 11, 11, 11, 11, 11, 11, 11,
       11, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 13, 13, 13, 13, 13, 13,
       13, 13, 13, 13, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 15, 15, 15,
       15, 15, 15, 15, 15, 15, 15, 16, 16, 16, 16, 16, 16, 16, 16, 16, 16,
       17, 17, 17, 17, 17, 17, 17, 17, 17, 17, 18, 18, 18, 18, 18, 18, 18,
       18, 18, 18, 19, 19, 19, 19, 19, 19, 19, 19, 19, 19, 20, 20, 20, 20,
       20, 20, 20, 20, 20, 20, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 22,
       22, 22, 22, 22, 22

In [76]:
X = data.data
y = data.target

In [77]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=.2)

In [78]:
print('전체 데이터 크기: {}'.format(X.shape))
print('학습 데이터 크기: {}'.format(X_train.shape))
print('평가 데이터 크기: {}'.format(X_test.shape))

전체 데이터 크기: (400, 4096)
학습 데이터 크기: (320, 4096)
평가 데이터 크기: (80, 4096)


In [79]:
data_df = pd.DataFrame(data=X)
data_df.describe()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,...,4056,4057,4058,4059,4060,4061,4062,4063,4064,4065,4066,4067,4068,4069,4070,4071,4072,4073,4074,4075,4076,4077,4078,4079,4080,4081,4082,4083,4084,4085,4086,4087,4088,4089,4090,4091,4092,4093,4094,4095
count,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,...,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0,400.0
mean,0.400134,0.434235,0.476281,0.518482,0.554845,0.588729,0.621426,0.647511,0.664814,0.676591,0.686208,0.692572,0.699401,0.704877,0.710155,0.713884,0.718233,0.722345,0.725145,0.727614,0.7297,0.730062,0.730961,0.729907,0.729721,0.730289,0.72841,0.726798,0.725351,0.724111,0.724246,0.725744,0.726353,0.72625,0.726901,0.725816,0.725557,0.724638,0.722118,0.718761,...,0.502634,0.507056,0.507469,0.507428,0.505227,0.501694,0.49718,0.493843,0.490289,0.490176,0.488667,0.488533,0.489256,0.488295,0.4872,0.483698,0.478368,0.471364,0.463719,0.454204,0.442541,0.434453,0.421271,0.409411,0.403667,0.39905,0.391818,0.385361,0.375506,0.366674,0.363079,0.367221,0.363027,0.355506,0.340196,0.338657,0.335909,0.321415,0.313647,0.310455
std,0.180695,0.189504,0.194742,0.193313,0.188593,0.178481,0.167109,0.155024,0.147616,0.143583,0.136356,0.13158,0.12845,0.126246,0.124832,0.125469,0.12609,0.127646,0.129569,0.130954,0.131288,0.13502,0.135711,0.137272,0.13732,0.135546,0.1347,0.134171,0.133041,0.132261,0.129363,0.126623,0.12451,0.123213,0.121916,0.123161,0.121455,0.123242,0.125143,0.125989,...,0.15288,0.150255,0.150632,0.151813,0.150475,0.151989,0.153589,0.156037,0.155301,0.152009,0.152033,0.152803,0.150929,0.14811,0.143041,0.140258,0.138368,0.137675,0.137383,0.134865,0.135484,0.132048,0.133554,0.133768,0.133282,0.134569,0.138198,0.146356,0.152795,0.160557,0.164952,0.181861,0.181611,0.188709,0.186088,0.189256,0.19528,0.187842,0.183616,0.180635
min,0.086777,0.066116,0.090909,0.041322,0.107438,0.107438,0.115702,0.115702,0.119835,0.140496,0.140496,0.14876,0.161157,0.169421,0.181818,0.173554,0.165289,0.18595,0.152893,0.169421,0.157025,0.14876,0.161157,0.152893,0.157025,0.144628,0.144628,0.144628,0.14876,0.165289,0.202479,0.181818,0.214876,0.235537,0.219008,0.243802,0.235537,0.22314,0.190083,0.177686,...,0.049587,0.165289,0.165289,0.165289,0.173554,0.177686,0.169421,0.181818,0.14876,0.181818,0.161157,0.169421,0.152893,0.144628,0.152893,0.123967,0.132231,0.095041,0.066116,0.07438,0.061983,0.078512,0.057851,0.070248,0.070248,0.070248,0.070248,0.028926,0.028926,0.033058,0.049587,0.03719,0.053719,0.049587,0.033058,0.012397,0.049587,0.057851,0.061983,0.033058
25%,0.243802,0.267562,0.31405,0.383264,0.446281,0.515496,0.544421,0.581612,0.599174,0.61157,0.619835,0.628099,0.636364,0.643595,0.64876,0.655992,0.665289,0.669421,0.673554,0.68595,0.694215,0.690083,0.690083,0.68905,0.68595,0.677686,0.681818,0.673554,0.669421,0.669421,0.659091,0.657025,0.665289,0.667355,0.676653,0.68595,0.68595,0.680785,0.67562,0.668388,...,0.38843,0.394628,0.38843,0.380165,0.380165,0.376033,0.370868,0.363636,0.366736,0.363636,0.355372,0.363636,0.363636,0.375,0.383264,0.376033,0.371901,0.363636,0.362603,0.355372,0.35124,0.350207,0.338843,0.326446,0.309917,0.297521,0.289256,0.289256,0.272727,0.252066,0.227273,0.214876,0.219008,0.197314,0.177686,0.177686,0.173554,0.173554,0.173554,0.172521
50%,0.392562,0.458678,0.512397,0.545455,0.584711,0.615702,0.652893,0.669421,0.683884,0.702479,0.714876,0.719008,0.735537,0.743802,0.752066,0.760331,0.768595,0.772727,0.772727,0.768595,0.774793,0.77686,0.778926,0.778926,0.780992,0.780992,0.77686,0.770661,0.764463,0.768595,0.764463,0.766529,0.766529,0.766529,0.764463,0.768595,0.764463,0.764463,0.764463,0.760331,...,0.514463,0.512397,0.510331,0.518595,0.516529,0.510331,0.508264,0.502066,0.491736,0.489669,0.5,0.497934,0.5,0.489669,0.481405,0.483471,0.479339,0.475207,0.458678,0.444215,0.423554,0.421488,0.409091,0.402893,0.404959,0.404959,0.39876,0.38843,0.376033,0.367769,0.367769,0.367769,0.342975,0.334711,0.320248,0.31405,0.299587,0.289256,0.270661,0.272727
75%,0.528926,0.575413,0.636364,0.666322,0.702479,0.714876,0.735537,0.757231,0.772727,0.780992,0.789256,0.789256,0.793388,0.793388,0.793388,0.801653,0.801653,0.805785,0.809917,0.81405,0.818182,0.822314,0.822314,0.822314,0.822314,0.822314,0.822314,0.818182,0.818182,0.818182,0.818182,0.81405,0.81405,0.81405,0.81405,0.81405,0.81405,0.81405,0.809917,0.809917,...,0.619835,0.619835,0.625,0.628099,0.620868,0.61157,0.61157,0.615702,0.608471,0.603306,0.607438,0.603306,0.595041,0.58781,0.586777,0.578512,0.57438,0.566116,0.557851,0.549587,0.541322,0.525826,0.520661,0.512397,0.504132,0.5,0.483471,0.491736,0.483471,0.483471,0.484504,0.496901,0.5,0.5,0.479339,0.46281,0.46281,0.446281,0.414256,0.417355
max,0.805785,0.822314,0.871901,0.892562,0.871901,0.871901,0.871901,0.871901,0.871901,0.871901,0.863636,0.863636,0.859504,0.867769,0.871901,0.876033,0.884298,0.88843,0.892562,0.896694,0.900826,0.900826,0.900826,0.900826,0.904959,0.900826,0.896694,0.900826,0.900826,0.896694,0.896694,0.892562,0.88843,0.88843,0.892562,0.88843,0.88843,0.892562,0.892562,0.896694,...,0.842975,0.834711,0.830579,0.834711,0.830579,0.830579,0.830579,0.830579,0.830579,0.826446,0.826446,0.830579,0.826446,0.826446,0.822314,0.826446,0.822314,0.805785,0.801653,0.789256,0.81405,0.793388,0.801653,0.77686,0.760331,0.772727,0.77686,0.768595,0.789256,0.772727,0.793388,0.904959,0.88843,0.896694,0.826446,0.863636,0.921488,0.929752,0.884298,0.822314


In [80]:
data_train_df = pd.DataFrame(data = X_train)
data_train_df.describe()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,...,4056,4057,4058,4059,4060,4061,4062,4063,4064,4065,4066,4067,4068,4069,4070,4071,4072,4073,4074,4075,4076,4077,4078,4079,4080,4081,4082,4083,4084,4085,4086,4087,4088,4089,4090,4091,4092,4093,4094,4095
count,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,...,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0
mean,0.40195,0.434711,0.475349,0.519757,0.557464,0.592019,0.625426,0.651821,0.669718,0.681663,0.692162,0.698864,0.705385,0.710576,0.715702,0.719912,0.724174,0.728681,0.73134,0.733484,0.73595,0.736945,0.737526,0.736002,0.735718,0.735705,0.73329,0.731418,0.729455,0.728732,0.728835,0.729984,0.729985,0.730269,0.730862,0.729545,0.729313,0.728874,0.726136,0.722327,...,0.504003,0.507593,0.507813,0.507916,0.505385,0.501872,0.498166,0.494796,0.491206,0.490677,0.48865,0.48985,0.49149,0.490625,0.489398,0.484749,0.478357,0.470816,0.4629,0.453758,0.442536,0.43639,0.424019,0.409866,0.403203,0.398631,0.390302,0.383497,0.371255,0.365057,0.362061,0.364773,0.357825,0.351885,0.34162,0.336364,0.328164,0.314889,0.310498,0.310421
std,0.181259,0.187797,0.193708,0.193585,0.189682,0.1793,0.167209,0.153951,0.145762,0.139964,0.131339,0.126461,0.122999,0.121286,0.119382,0.119704,0.120336,0.121931,0.123509,0.12451,0.124054,0.127171,0.128363,0.13039,0.130738,0.128849,0.128599,0.128412,0.128648,0.127667,0.125593,0.123567,0.121535,0.119896,0.118382,0.119685,0.118071,0.119635,0.121601,0.123264,...,0.152274,0.149297,0.149591,0.151572,0.150247,0.153572,0.154708,0.157794,0.157938,0.154354,0.154296,0.155229,0.153057,0.150648,0.144778,0.141102,0.139475,0.138558,0.13831,0.134798,0.135273,0.130738,0.130251,0.131185,0.131593,0.131314,0.135606,0.14425,0.149522,0.15874,0.16137,0.176495,0.174398,0.181493,0.181065,0.185659,0.190987,0.184268,0.181352,0.181981
min,0.086777,0.066116,0.090909,0.041322,0.107438,0.107438,0.115702,0.115702,0.119835,0.140496,0.140496,0.14876,0.161157,0.169421,0.181818,0.173554,0.165289,0.18595,0.152893,0.169421,0.157025,0.14876,0.161157,0.157025,0.157025,0.152893,0.144628,0.144628,0.152893,0.169421,0.202479,0.181818,0.214876,0.239669,0.219008,0.243802,0.235537,0.22314,0.190083,0.177686,...,0.049587,0.165289,0.165289,0.169421,0.177686,0.177686,0.181818,0.181818,0.14876,0.181818,0.173554,0.169421,0.177686,0.144628,0.152893,0.123967,0.132231,0.095041,0.066116,0.07438,0.061983,0.078512,0.07438,0.070248,0.070248,0.070248,0.070248,0.028926,0.028926,0.033058,0.049587,0.03719,0.053719,0.049587,0.066116,0.012397,0.049587,0.061983,0.061983,0.033058
25%,0.246901,0.267562,0.31095,0.386364,0.446281,0.512397,0.556818,0.585744,0.603306,0.615702,0.623967,0.632231,0.640496,0.644628,0.65186,0.661157,0.665289,0.673554,0.680785,0.693182,0.698347,0.694215,0.693182,0.693182,0.690083,0.690083,0.68905,0.684917,0.68595,0.680785,0.680785,0.679752,0.681818,0.68905,0.693182,0.694215,0.693182,0.690083,0.677686,0.676653,...,0.384298,0.387397,0.387397,0.380165,0.376033,0.376033,0.371901,0.363636,0.358471,0.363636,0.354339,0.359504,0.363636,0.383264,0.384298,0.383264,0.366736,0.362603,0.354339,0.355372,0.35124,0.355372,0.347107,0.329545,0.31405,0.297521,0.289256,0.289256,0.271694,0.256198,0.227273,0.22314,0.219008,0.194215,0.181818,0.177686,0.169421,0.172521,0.173554,0.173554
50%,0.394628,0.456612,0.512397,0.551653,0.590909,0.615702,0.657025,0.677686,0.690083,0.706612,0.719008,0.727273,0.739669,0.747934,0.756198,0.764463,0.768595,0.77686,0.77686,0.77686,0.780992,0.780992,0.785124,0.783058,0.780992,0.780992,0.77686,0.772727,0.764463,0.768595,0.764463,0.768595,0.768595,0.768595,0.768595,0.768595,0.768595,0.768595,0.768595,0.764463,...,0.514463,0.514463,0.508264,0.520661,0.516529,0.508264,0.506198,0.5,0.491736,0.487603,0.497934,0.495868,0.5,0.487603,0.481405,0.481405,0.479339,0.475207,0.460744,0.444215,0.431818,0.427686,0.413223,0.407025,0.407025,0.400826,0.400826,0.386364,0.376033,0.367769,0.367769,0.367769,0.338843,0.334711,0.322314,0.318182,0.293388,0.289256,0.270661,0.268595
75%,0.530992,0.583678,0.636364,0.670455,0.703512,0.724174,0.743802,0.764463,0.77686,0.780992,0.789256,0.790289,0.793388,0.793388,0.797521,0.801653,0.801653,0.805785,0.809917,0.81405,0.818182,0.822314,0.822314,0.822314,0.822314,0.822314,0.822314,0.819215,0.818182,0.818182,0.818182,0.818182,0.818182,0.818182,0.818182,0.818182,0.81405,0.81405,0.81095,0.809917,...,0.616736,0.615702,0.623967,0.628099,0.620868,0.61157,0.607438,0.608471,0.607438,0.607438,0.608471,0.604339,0.597107,0.579545,0.586777,0.575413,0.57438,0.561983,0.557851,0.549587,0.541322,0.521694,0.517562,0.512397,0.5,0.491736,0.483471,0.491736,0.479339,0.480372,0.483471,0.492769,0.491736,0.483471,0.467975,0.448347,0.451446,0.42562,0.40186,0.407025
max,0.805785,0.822314,0.871901,0.892562,0.871901,0.871901,0.871901,0.871901,0.871901,0.871901,0.863636,0.863636,0.859504,0.867769,0.871901,0.876033,0.884298,0.88843,0.892562,0.896694,0.900826,0.900826,0.900826,0.900826,0.904959,0.900826,0.896694,0.900826,0.900826,0.896694,0.896694,0.892562,0.88843,0.88843,0.892562,0.88843,0.88843,0.892562,0.892562,0.896694,...,0.842975,0.834711,0.830579,0.834711,0.830579,0.830579,0.830579,0.830579,0.830579,0.826446,0.826446,0.830579,0.826446,0.826446,0.822314,0.826446,0.822314,0.805785,0.801653,0.789256,0.772727,0.760331,0.752066,0.719008,0.710744,0.756198,0.77686,0.768595,0.768595,0.772727,0.793388,0.904959,0.85124,0.838843,0.826446,0.863636,0.921488,0.929752,0.884298,0.822314


In [81]:
data_test_df = pd.DataFrame(data = X_test)
data_test_df.describe()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,...,4056,4057,4058,4059,4060,4061,4062,4063,4064,4065,4066,4067,4068,4069,4070,4071,4072,4073,4074,4075,4076,4077,4078,4079,4080,4081,4082,4083,4084,4085,4086,4087,4088,4089,4090,4091,4092,4093,4094,4095
count,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,...,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0
mean,0.392872,0.432335,0.48001,0.513378,0.54437,0.575568,0.605424,0.630269,0.645196,0.656302,0.662397,0.667407,0.675465,0.682076,0.687965,0.689773,0.694473,0.697004,0.700362,0.704132,0.7047,0.702531,0.7047,0.705527,0.705733,0.708626,0.708884,0.708316,0.708936,0.70563,0.705888,0.708781,0.711829,0.710176,0.711054,0.710899,0.710537,0.707696,0.706043,0.704494,...,0.497159,0.504907,0.506095,0.505475,0.504597,0.500981,0.493234,0.490031,0.486622,0.488171,0.48874,0.483264,0.48032,0.478977,0.478409,0.479494,0.478409,0.473554,0.466994,0.455992,0.442562,0.426705,0.410279,0.407593,0.405527,0.400723,0.397882,0.39282,0.39251,0.37314,0.367149,0.377014,0.383833,0.36999,0.334504,0.347831,0.36689,0.347521,0.32624,0.310589
std,0.179366,0.197386,0.200022,0.19335,0.184976,0.175657,0.166793,0.159058,0.154191,0.156523,0.153408,0.148539,0.146688,0.142964,0.143287,0.144617,0.145296,0.146443,0.149719,0.152693,0.155313,0.160659,0.160041,0.160526,0.159663,0.158626,0.156136,0.154609,0.149078,0.148676,0.142834,0.137696,0.135603,0.135285,0.134773,0.13597,0.133885,0.136215,0.138065,0.136233,...,0.156132,0.154969,0.15568,0.153718,0.152332,0.146425,0.149919,0.149706,0.145159,0.143156,0.143556,0.143497,0.142672,0.137995,0.136396,0.137623,0.134706,0.134918,0.134416,0.135973,0.137182,0.137736,0.146382,0.144498,0.140683,0.147746,0.148864,0.15522,0.165139,0.168507,0.179588,0.202821,0.2079,0.215831,0.206089,0.203985,0.209993,0.200596,0.193077,0.176269
min,0.103306,0.07438,0.099174,0.11157,0.11157,0.123967,0.123967,0.128099,0.132231,0.144628,0.161157,0.161157,0.181818,0.198347,0.210744,0.206612,0.219008,0.206612,0.194215,0.198347,0.190083,0.173554,0.177686,0.152893,0.161157,0.144628,0.144628,0.14876,0.14876,0.165289,0.219008,0.214876,0.239669,0.235537,0.22314,0.260331,0.297521,0.305785,0.297521,0.297521,...,0.144628,0.173554,0.169421,0.165289,0.173554,0.194215,0.169421,0.181818,0.161157,0.210744,0.161157,0.169421,0.152893,0.157025,0.194215,0.198347,0.173554,0.18595,0.169421,0.161157,0.136364,0.128099,0.057851,0.095041,0.107438,0.103306,0.11157,0.049587,0.049587,0.053719,0.049587,0.049587,0.057851,0.070248,0.033058,0.07438,0.078512,0.057851,0.078512,0.053719
25%,0.219008,0.270661,0.335744,0.379132,0.489669,0.527893,0.525826,0.554752,0.582645,0.586777,0.603306,0.607438,0.629132,0.627066,0.647727,0.65186,0.653926,0.660124,0.671488,0.68595,0.677686,0.678719,0.670455,0.672521,0.657025,0.645661,0.639463,0.630165,0.635331,0.599174,0.622934,0.627066,0.626033,0.626033,0.628099,0.626033,0.632231,0.633264,0.639463,0.634298,...,0.396694,0.399793,0.395661,0.39876,0.386364,0.383264,0.367769,0.370868,0.367769,0.369835,0.358471,0.363636,0.363636,0.354339,0.359504,0.362603,0.379132,0.371901,0.366736,0.370868,0.355372,0.338843,0.318182,0.31405,0.304752,0.295455,0.301653,0.286157,0.286157,0.23657,0.22624,0.204545,0.206612,0.202479,0.169421,0.181818,0.196281,0.18595,0.173554,0.168388
50%,0.392562,0.477273,0.516529,0.533058,0.570248,0.60124,0.640496,0.652893,0.665289,0.68595,0.696281,0.698347,0.706612,0.71281,0.727273,0.727273,0.741736,0.747934,0.752066,0.756198,0.756198,0.758264,0.768595,0.768595,0.762397,0.768595,0.774793,0.768595,0.766529,0.766529,0.758264,0.758264,0.760331,0.764463,0.760331,0.766529,0.756198,0.758264,0.762397,0.754132,...,0.504132,0.508264,0.526859,0.5,0.533058,0.524793,0.512397,0.508264,0.495868,0.510331,0.533058,0.514463,0.495868,0.5,0.481405,0.497934,0.487603,0.469008,0.454545,0.440083,0.413223,0.400826,0.392562,0.38843,0.38843,0.404959,0.396694,0.400826,0.39876,0.380165,0.369835,0.376033,0.384298,0.316116,0.295455,0.283058,0.328512,0.299587,0.274793,0.278926
75%,0.521694,0.565083,0.634298,0.661157,0.679752,0.698347,0.721074,0.743802,0.760331,0.777893,0.778926,0.789256,0.785124,0.789256,0.793388,0.794421,0.797521,0.802686,0.806818,0.809917,0.81405,0.81405,0.818182,0.81405,0.809917,0.81405,0.81405,0.81405,0.81405,0.809917,0.806818,0.805785,0.806818,0.805785,0.805785,0.806818,0.801653,0.801653,0.801653,0.797521,...,0.625,0.628099,0.642562,0.629132,0.617769,0.612603,0.616736,0.617769,0.615702,0.603306,0.604339,0.600207,0.588843,0.590909,0.58781,0.583678,0.578512,0.57438,0.567149,0.552686,0.535124,0.534091,0.520661,0.503099,0.520661,0.510331,0.505165,0.5,0.495868,0.491736,0.496901,0.514463,0.538223,0.567149,0.501033,0.540289,0.538223,0.512397,0.457645,0.422521
max,0.780992,0.818182,0.830579,0.834711,0.842975,0.842975,0.863636,0.867769,0.863636,0.859504,0.859504,0.863636,0.855372,0.855372,0.85124,0.859504,0.880165,0.876033,0.884298,0.892562,0.892562,0.880165,0.88843,0.884298,0.892562,0.896694,0.88843,0.871901,0.867769,0.867769,0.867769,0.867769,0.871901,0.871901,0.871901,0.876033,0.880165,0.880165,0.867769,0.871901,...,0.752066,0.743802,0.739669,0.739669,0.747934,0.756198,0.768595,0.772727,0.764463,0.756198,0.739669,0.735537,0.747934,0.747934,0.756198,0.756198,0.768595,0.780992,0.797521,0.780992,0.81405,0.793388,0.801653,0.77686,0.760331,0.772727,0.756198,0.735537,0.789256,0.706612,0.772727,0.847107,0.88843,0.896694,0.822314,0.785124,0.838843,0.913223,0.867769,0.81405


In [82]:
scaler = StandardScaler()
X_train_scale = scaler.fit_transform(X_train)
X_test_scale = scaler.transform(X_test)

In [83]:
data_train_df = pd.DataFrame(data = X_train_scale)
data_train_df.describe()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,...,4056,4057,4058,4059,4060,4061,4062,4063,4064,4065,4066,4067,4068,4069,4070,4071,4072,4073,4074,4075,4076,4077,4078,4079,4080,4081,4082,4083,4084,4085,4086,4087,4088,4089,4090,4091,4092,4093,4094,4095
count,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,...,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0,320.0
mean,5.401671e-09,1.322478e-08,1.080334e-08,-1.145527e-08,-2.235174e-09,1.396984e-10,4.423782e-09,3.49246e-09,1.30909e-08,9.126961e-09,-4.970934e-09,-3.457535e-09,3.096648e-09,-1.508743e-08,5.681068e-09,1.969747e-08,-1.816079e-09,-5.16884e-09,-9.49949e-09,1.536682e-09,-2.514571e-09,-1.464505e-08,1.073349e-08,-4.673347e-09,-5.974289e-09,6.519258e-10,1.18278e-08,-2.980232e-09,6.193295e-09,-1.005828e-08,-8.032657e-09,8.475036e-09,1.043081e-08,4.656613e-10,-6.61239e-09,6.146729e-09,-1.997687e-08,-2.291054e-08,1.587905e-08,2.793968e-10,...,5.029142e-09,7.450581e-10,2.793968e-09,-1.061708e-08,5.960465e-09,-1.024455e-08,-1.788139e-08,-3.129244e-08,1.490116e-09,-1.862645e-09,-8.754432e-09,1.601875e-08,1.247972e-08,1.47149e-08,0.0,7.264316e-09,-7.823109e-09,3.539026e-09,1.639128e-08,1.788139e-08,-3.539026e-09,-1.899898e-08,5.215406e-09,8.195639e-09,3.166497e-09,-2.197921e-08,8.381903e-09,5.029142e-09,-1.117587e-09,5.029142e-09,-1.173466e-08,-8.009374e-09,3.352761e-09,3.72529e-09,1.490116e-08,-1.243316e-08,-2.249144e-08,-8.731149e-09,2.980232e-08,6.332994e-09
std,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001567,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001567,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,...,1.001566,1.001566,1.001567,1.001566,1.001566,1.001566,1.001567,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566,1.001566
min,-1.741519,-1.965801,-1.987738,-2.475319,-2.376248,-2.706864,-3.053196,-3.487845,-3.778381,-3.872519,-4.206897,-4.356792,-4.431576,-4.468776,-4.479076,-4.571406,-4.651641,-4.458089,-4.690781,-4.537361,-4.674037,-4.632395,-4.497189,-4.447316,-4.433303,-4.530319,-4.584676,-4.576752,-4.488708,-4.387878,-4.197543,-4.443138,-4.245007,-4.098279,-4.330535,-4.064874,-4.18856,-4.233922,-4.415221,-4.425402,...,-2.988885,-2.296358,-2.293314,-2.236719,-2.184476,-2.114284,-2.048007,-1.98657,-2.171629,-2.00411,-2.045354,-2.067472,-2.053453,-2.300326,-2.32793,-2.560904,-2.485517,-2.716282,-2.873307,-2.818833,-2.817622,-2.741643,-2.688551,-2.592891,-2.534152,-2.504663,-2.363882,-2.461891,-2.293079,-2.094744,-1.939414,-1.858953,-1.746485,-1.668233,-1.523955,-1.747691,-1.460898,-1.374638,-1.372495,-1.526522
25%,-0.8567388,-0.8914423,-0.8500184,-0.6901495,-0.587073,-0.4447723,-0.4109551,-0.4298794,-0.4563375,-0.4720062,-0.5200399,-0.527724,-0.5283821,-0.5445877,-0.5356169,-0.4916072,-0.4900987,-0.4528203,-0.4099655,-0.3241936,-0.3035956,-0.3365298,-0.3459995,-0.3289164,-0.3496069,-0.3546321,-0.3445596,-0.3626876,-0.3386966,-0.3761501,-0.3831862,-0.4071567,-0.3969384,-0.3443277,-0.3187976,-0.2956586,-0.3064906,-0.3247546,-0.3990629,-0.3711179,...,-0.7873534,-0.8063414,-0.8062264,-0.8441563,-0.8622726,-0.8207009,-0.8174306,-0.8325119,-0.8417426,-0.8243346,-0.8718385,-0.8410196,-0.836642,-0.7137759,-0.727082,-0.7203603,-0.8015522,-0.7822145,-0.7861454,-0.7310219,-0.6759616,-0.6206635,-0.5914097,-0.6132238,-0.6785519,-0.7711958,-0.7463133,-0.6543405,-0.6669046,-0.6868413,-0.8365815,-0.8037291,-0.7972277,-0.8701037,-0.883944,-0.8560121,-0.8324674,-0.7738259,-0.7563163,-0.7532758
50%,-0.04045734,0.1168021,0.1915563,0.1650212,0.176599,0.1322918,0.189273,0.1682723,0.1399271,0.178527,0.2047269,0.2249988,0.2791753,0.3084965,0.3397442,0.3727572,0.3697237,0.3957538,0.3691262,0.3489161,0.3636474,0.3469033,0.3713902,0.361451,0.3468372,0.3520224,0.3393301,0.3221985,0.2725458,0.3127324,0.2841203,0.312956,0.3181893,0.3201646,0.3192347,0.3267806,0.3332182,0.3325386,0.349712,0.3423689,...,0.0687978,0.04608648,0.003026185,0.08421949,0.0742877,0.04168786,0.05199854,0.03303163,0.00335754,-0.01994222,0.06026839,0.03882648,0.055686,-0.02008943,-0.055297,-0.02374007,0.007047513,0.03173664,-0.01561631,-0.07090496,-0.07935625,-0.06667635,-0.08301178,-0.02168965,0.02909198,0.01674378,0.07773108,0.01990461,0.03200457,0.01710986,0.03542522,0.01700079,-0.1090162,-0.09477786,-0.1067876,-0.09808466,-0.1823668,-0.1393238,-0.2200128,-0.2301972
75%,0.7130332,0.7944746,0.8325253,0.7796753,0.7711726,0.7382094,0.709058,0.7328199,0.7361913,0.7107811,0.7404243,0.7240867,0.716602,0.6838538,0.6864218,0.6839283,0.6448671,0.6333542,0.6372005,0.6480758,0.6639066,0.6723475,0.6615704,0.6629907,0.6634026,0.6732289,0.6933433,0.6847853,0.6907638,0.7017484,0.7125142,0.7148793,0.7268338,0.7343937,0.7387627,0.7417401,0.7187963,0.713077,0.698573,0.7117029,...,0.741488,0.7252566,0.7776951,0.7941538,0.7698218,0.7154288,0.7074144,0.7215322,0.7370878,0.7576371,0.7777896,0.738704,0.6911317,0.5911787,0.673661,0.6435487,0.6895351,0.6590018,0.6875851,0.7120243,0.7314152,0.6535071,0.7193035,0.7827969,0.7367361,0.7101306,0.6881341,0.7515321,0.7239937,0.7275793,0.7535484,0.726346,0.7690467,0.7261553,0.6989409,0.6041127,0.6465116,0.6018647,0.5045675,0.531678
max,2.231431,2.067176,2.050366,1.928811,1.660305,1.563411,1.47636,1.431783,1.389242,1.361314,1.307633,1.304992,1.254974,1.298075,1.310442,1.30627,1.332725,1.312213,1.307387,1.312876,1.33115,1.290692,1.274173,1.266071,1.296534,1.283522,1.272638,1.321327,1.334177,1.317691,1.338629,1.317764,1.305747,1.321218,1.368055,1.329599,1.349742,1.37037,1.370769,1.416796,...,2.22956,2.194482,2.161033,2.159412,2.167776,2.14376,2.152004,2.131319,2.152139,2.17873,2.192714,2.198449,2.191865,2.232675,2.303095,2.42543,2.469938,2.421318,2.453069,2.492805,2.444744,2.481664,2.522527,2.360221,2.340729,2.727256,2.855065,2.673847,2.661563,2.572192,2.677093,3.065426,2.833681,2.687274,2.681833,2.844457,3.111477,3.342016,3.168969,2.817303


In [84]:
data_test_df = pd.DataFrame(data=X_test_scale)
data_test_df.describe()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,...,4056,4057,4058,4059,4060,4061,4062,4063,4064,4065,4066,4067,4068,4069,4070,4071,4072,4073,4074,4075,4076,4077,4078,4079,4080,4081,4082,4083,4084,4085,4086,4087,4088,4089,4090,4091,4092,4093,4094,4095
count,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,...,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0,80.0
mean,-0.050161,-0.012672,0.024103,-0.033004,-0.06914,-0.091897,-0.119814,-0.140213,-0.168498,-0.181484,-0.226982,-0.249135,-0.243634,-0.235345,-0.232707,-0.252178,-0.247199,-0.260194,-0.251215,-0.236108,-0.252301,-0.271034,-0.256124,-0.23409,-0.229708,-0.210491,-0.190081,-0.180186,-0.159747,-0.181237,-0.182994,-0.171864,-0.149623,-0.167849,-0.167593,-0.156042,-0.15927,-0.177296,-0.165496,-0.144901,...,-0.045016,-0.018019,-0.011499,-0.016127,-0.005251,-0.005811,-0.031935,-0.030245,-0.029071,-0.016255,0.000587,-0.042493,-0.073093,-0.077439,-0.076022,-0.037306,0.000371,0.019789,0.029643,0.016599,0.000191,-0.074195,-0.105651,-0.017352,0.017691,0.015956,0.055985,0.064735,0.142377,0.051004,0.031578,0.069469,0.14936,0.099909,-0.039358,0.06186,0.203089,0.177366,0.086935,0.000924
std,0.991102,1.052706,1.03421,1.000352,0.976721,0.981218,0.999073,1.034793,1.059482,1.120054,1.169856,1.176424,1.194465,1.180576,1.202117,1.210013,1.20931,1.202914,1.21411,1.228276,1.253938,1.265308,1.248736,1.233051,1.22316,1.23303,1.216031,1.205898,1.160616,1.166389,1.139065,1.116086,1.117501,1.13012,1.140244,1.137843,1.135707,1.14037,1.137178,1.10694,...,1.026948,1.039614,1.042331,1.015744,1.015464,0.954956,0.970558,0.95023,0.920528,0.928908,0.931855,0.925875,0.933606,0.917449,0.943582,0.976872,0.967317,0.975256,0.97337,1.010296,1.015702,1.055176,1.125607,1.103201,1.070753,1.126893,1.099489,1.077737,1.106179,1.063191,1.114635,1.150963,1.193968,1.191065,1.139985,1.100427,1.101234,1.090317,1.066322,0.970132
min,-1.650187,-1.921725,-1.945007,-2.111871,-2.354429,-2.614534,-3.003693,-3.407196,-3.6932,-3.842949,-4.049339,-4.258611,-4.263335,-4.229913,-4.236402,-4.294809,-4.204533,-4.288374,-4.355688,-4.304681,-4.407139,-4.437129,-4.368219,-4.479057,-4.401647,-4.594561,-4.584676,-4.544522,-4.520879,-4.420296,-4.065729,-4.175189,-4.040685,-4.132798,-4.295574,-3.926554,-3.662771,-3.542033,-3.530304,-3.451702,...,-2.363759,-2.240915,-2.265648,-2.264024,-2.212022,-2.006485,-2.128262,-1.98657,-2.093015,-1.816419,-2.125824,-2.067472,-2.215694,-2.217908,-2.042064,-2.03294,-2.188783,-2.059147,-2.12522,-2.174068,-2.26691,-2.361766,-2.815651,-2.403601,-2.251094,-2.252522,-2.05868,-2.318434,-2.154681,-1.964382,-1.939414,-1.788605,-1.722754,-1.554215,-1.706816,-1.413312,-1.309208,-1.397098,-1.281209,-1.41281
25%,-1.010862,-0.874914,-0.721825,-0.727563,-0.357971,-0.358213,-0.596593,-0.631503,-0.598305,-0.678994,-0.677598,-0.724086,-0.620915,-0.689612,-0.570285,-0.5694,-0.584679,-0.563135,-0.485362,-0.382364,-0.470406,-0.458571,-0.523332,-0.487622,-0.602859,-0.699929,-0.730756,-0.789734,-0.732787,-1.016406,-0.844534,-0.8342,-0.856663,-0.870744,-0.869428,-0.866228,-0.823516,-0.800428,-0.713889,-0.71527,...,-0.705815,-0.723178,-0.750893,-0.721283,-0.793408,-0.773539,-0.844182,-0.786612,-0.782782,-0.784115,-0.845015,-0.814358,-0.836642,-0.906085,-0.898601,-0.867017,-0.712532,-0.715008,-0.696375,-0.615885,-0.645367,-0.747289,-0.813834,-0.731531,-0.749316,-0.786955,-0.654753,-0.675859,-0.570026,-0.810685,-0.842993,-0.909251,-0.868422,-0.824496,-0.952517,-0.83372,-0.691612,-0.70083,-0.756316,-0.781704
50%,-0.051874,0.226993,0.212922,0.068814,0.067503,0.051503,0.090266,0.006973,-0.030434,0.030679,0.031413,-0.004091,0.009989,0.018448,0.09707,0.061586,0.14617,0.158153,0.16807,0.182716,0.163475,0.167909,0.242421,0.250357,0.204383,0.25566,0.323238,0.289969,0.288631,0.296524,0.23469,0.229222,0.250082,0.285646,0.249313,0.309491,0.228061,0.246053,0.298659,0.258429,...,0.000849,0.004505,0.127526,-0.052306,0.184471,0.149486,0.092126,0.085489,0.029562,0.12753,0.288266,0.158805,0.028646,0.062329,-0.055297,0.093585,0.066394,-0.013068,-0.060501,-0.101608,-0.217034,-0.272443,-0.241886,-0.163658,-0.112437,0.048261,0.047211,0.120324,0.184242,0.095327,0.048249,0.0639,0.152029,-0.197395,-0.255362,-0.287567,0.001828,-0.083173,-0.197191,-0.173341
75%,0.661659,0.695303,0.821843,0.731572,0.645712,0.593943,0.572924,0.598404,0.622617,0.688604,0.661645,0.715905,0.649305,0.649731,0.651754,0.623423,0.610474,0.607897,0.612069,0.614836,0.630545,0.607259,0.629328,0.599509,0.568433,0.608988,0.628977,0.644498,0.658593,0.636912,0.621892,0.614398,0.633186,0.630836,0.633881,0.646645,0.613639,0.609294,0.621994,0.610975,...,0.795847,0.80842,0.902196,0.80098,0.749162,0.722166,0.767605,0.780546,0.789497,0.730824,0.750966,0.712042,0.637051,0.666729,0.680807,0.702212,0.719208,0.748611,0.754913,0.735052,0.685522,0.748476,0.743135,0.711813,0.89399,0.85196,0.848365,0.808915,0.834712,0.799278,0.836902,0.849456,1.036025,1.18793,0.881801,1.100109,1.101582,1.07353,0.812657,0.616963
max,2.094433,2.045138,1.83671,1.629501,1.507571,1.401833,1.426857,1.4049,1.332456,1.272605,1.276121,1.304992,1.221325,1.195704,1.137103,1.167972,1.298332,1.210385,1.240369,1.279635,1.264425,1.12797,1.177446,1.139107,1.201564,1.251401,1.208272,1.095717,1.076812,1.090765,1.107955,1.116803,1.169532,1.183142,1.193251,1.22586,1.279637,1.266587,1.166558,1.215341,...,1.631614,1.584615,1.552364,1.531393,1.616858,1.658667,1.750729,1.764119,1.732865,1.722908,1.629427,1.585223,1.6781,1.710693,1.84571,1.926797,2.084184,2.2421,2.423145,2.431399,2.750696,2.734916,2.903826,2.8019,2.718139,2.853326,2.702465,2.444317,2.799961,2.155036,2.548856,2.737134,3.047264,3.006526,2.658975,2.420909,2.678076,3.252175,3.077683,2.771819


## 가우시안

In [85]:
model = GaussianNB()
model.fit(X_train_scale, y_train)

GaussianNB(priors=None, var_smoothing=1e-09)

In [86]:
predict = model.predict(X_train_scale)
acc = metrics.accuracy_score(y_train, predict)
f1 = metrics.f1_score(y_train, predict, average=None)

print('Train Accuracy: {}'.format(acc))
print('Train F1 Score: {}'.format(f1.mean()))

Train Accuracy: 1.0
Train F1 Score: 1.0


In [87]:
predict = model.predict(X_test_scale)
acc = metrics.accuracy_score(y_test, predict)
f1 = metrics.f1_score(y_test, predict, average=None)

print('Test Accuracy: {}'.format(acc))
print('Test F1 Score: {}'.format(f1.mean()))

Test Accuracy: 0.9
Test F1 Score: 0.9037323037323038


## 베르누이

In [88]:
model = BernoulliNB()
model.fit(X_train_scale, y_train)

BernoulliNB(alpha=1.0, binarize=0.0, class_prior=None, fit_prior=True)

In [89]:
predict = model.predict(X_train_scale)
acc = metrics.accuracy_score(y_train, predict)
f1 = metrics.f1_score(y_train, predict, average=None)

print('Train Accuracy: {}'.format(acc))
print('Train F1 score: {}'.format(f1.mean()))

Train Accuracy: 0.91875
Train F1 score: 0.9212012530812841


In [90]:
predict = model.predict(X_test_scale)
acc = metrics.accuracy_score(y_test, predict)
f1 = metrics.f1_score(y_test, predict, average=None)

print('Test Accuracy: {}'.format(acc))
print('Test F1 score: {}'.format(f1.mean()))

Test Accuracy: 0.8375
Test F1 score: 0.7774436090225564


## 다항

* Negative value 에러가 떠서 MinMaxScaler를 이용하여 scale함.

In [91]:
scaler = MinMaxScaler()
X_train_scale = scaler.fit_transform(X_train)
X_test_scale = scaler.transform(X_test)

model = MultinomialNB()
model.fit(X_train_scale, y_train)

MultinomialNB(alpha=1.0, class_prior=None, fit_prior=True)

In [92]:
predict = model.predict(X_train_scale)
acc = metrics.accuracy_score(y_train, predict)
f1 = metrics.f1_score(y_train, predict, average=None)

print('Train Accuracy: {}'.format(acc))
print('Train F1 Score: {}'.format(f1.mean()))

Train Accuracy: 0.953125
Train F1 Score: 0.9556062326476414


In [93]:
predict = model.predict(X_test_scale)
acc = metrics.accuracy_score(y_test, predict)
f1 = metrics.f1_score(y_test, predict, average=None)

print('Test Accuracy: {}'.format(acc))
print('Test F1 Score: {}'.format(f1.mean()))

Test Accuracy: 0.9
Test F1 Score: 0.8576576576576576


# 비교 결과
## 정확도 : 가우시안 = 다항 > 베르누이
## F1 점수 : 가우시안 > 다항 > 베르누이
## 결론 : 가우시안이 성능이 가장 뛰어났다.