# Intro

Let's start by loading the important packages and set a bunch of graphic options

In [1]:
%matplotlib inline
import matplotlib
import matplotlib.pyplot as plt
plt.style.use('ggplot')
import pandas as pd
import seaborn as sns
import numpy as np
import pylab
import warnings
from sklearn.preprocessing import LabelEncoder
from sklearn.preprocessing import StandardScaler
import  sklearn.linear_model 
from sklearn.grid_search import GridSearchCV, RandomizedSearchCV
warnings.filterwarnings('ignore')
pylab.rcParams['figure.figsize'] = (12, 8)
plt.style.use('ggplot')
plt.rcParams['image.cmap'] = 'gray'
matplotlib.rcParams.update({'font.size': 14})



# Prepare X,Y arrays. From data to ML arrays

Let's load the training set using the Pandas read_csv option.

In [5]:
train = pd.read_csv('train.csv')

In [6]:
train.head()

Unnamed: 0,id,species,margin1,margin2,margin3,margin4,margin5,margin6,margin7,margin8,...,texture55,texture56,texture57,texture58,texture59,texture60,texture61,texture62,texture63,texture64
0,1,Acer_Opalus,0.007812,0.023438,0.023438,0.003906,0.011719,0.009766,0.027344,0.0,...,0.007812,0.0,0.00293,0.00293,0.035156,0.0,0.0,0.004883,0.0,0.025391
1,2,Pterocarya_Stenoptera,0.005859,0.0,0.03125,0.015625,0.025391,0.001953,0.019531,0.0,...,0.000977,0.0,0.0,0.000977,0.023438,0.0,0.0,0.000977,0.039062,0.022461
2,3,Quercus_Hartwissiana,0.005859,0.009766,0.019531,0.007812,0.003906,0.005859,0.068359,0.0,...,0.1543,0.0,0.005859,0.000977,0.007812,0.0,0.0,0.0,0.020508,0.00293
3,5,Tilia_Tomentosa,0.0,0.003906,0.023438,0.005859,0.021484,0.019531,0.023438,0.0,...,0.0,0.000977,0.0,0.0,0.020508,0.0,0.0,0.017578,0.0,0.047852
4,6,Quercus_Variabilis,0.005859,0.003906,0.048828,0.009766,0.013672,0.015625,0.005859,0.0,...,0.09668,0.0,0.021484,0.0,0.0,0.0,0.0,0.0,0.0,0.03125


As we can see the data set is quite simple and well structured (not a lot of cleaning needed.) We would like to guess the plant's species using the different features presented here.

In machine learning application we prefer to deal with numbers instead of text. So let's turn what we want to predict (the type) from a list of labels to a list of numbers.
So for example Acer_Opalus = 1, Pterocarya_Stenoptera = 2 and so on.

sklearn LabelEncoder() does that for us.

In [10]:
x_train = train.drop(['id', 'species'], axis=1).values
le = LabelEncoder().fit(train['species'])
y_train = le.transform(train['species'])
scaler = StandardScaler().fit(x_train)
x_train = scaler.transform(x_train)

In [11]:
x_train

array([[-0.48661074, -0.13135701, -0.33095592, ..., -0.39487147,
        -0.65214311,  0.26239707],
       [-0.58560191, -0.73488047, -0.02856115, ..., -0.49497401,
         2.18166976,  0.13364087],
       [-0.58560191, -0.48340807, -0.48219201, ..., -0.52001246,
         0.83564129, -0.72463124],
       ..., 
       [-0.78358426, -0.63430181, -1.23821765, ...,  0.1807566 ,
        -0.65214311, -0.76756462],
       [-0.88257543, -0.73488047,  0.5762671 , ..., -0.52001246,
        -0.51045972, -0.72463124],
       [ 0.30542003, -0.23196142, -0.02856115, ...,  0.08065405,
         1.18988604,  0.13364087]])

Let's look at the feauture data types are those all numbers?

In [6]:
train.dtypes

id             int64
species       object
margin1      float64
margin2      float64
margin3      float64
margin4      float64
margin5      float64
margin6      float64
margin7      float64
margin8      float64
margin9      float64
margin10     float64
margin11     float64
margin12     float64
margin13     float64
margin14     float64
margin15     float64
margin16     float64
margin17     float64
margin18     float64
margin19     float64
margin20     float64
margin21     float64
margin22     float64
margin23     float64
margin24     float64
margin25     float64
margin26     float64
margin27     float64
margin28     float64
              ...   
texture35    float64
texture36    float64
texture37    float64
texture38    float64
texture39    float64
texture40    float64
texture41    float64
texture42    float64
texture43    float64
texture44    float64
texture45    float64
texture46    float64
texture47    float64
texture48    float64
texture49    float64
texture50    float64
texture51    

All the data features seems to be numerical. are there any nan etc? 

In [12]:
for feat in train.columns:
    print(feat,np.sum(train[feat].isnull()))

('id', 0)
('species', 0)
('margin1', 0)
('margin2', 0)
('margin3', 0)
('margin4', 0)
('margin5', 0)
('margin6', 0)
('margin7', 0)
('margin8', 0)
('margin9', 0)
('margin10', 0)
('margin11', 0)
('margin12', 0)
('margin13', 0)
('margin14', 0)
('margin15', 0)
('margin16', 0)
('margin17', 0)
('margin18', 0)
('margin19', 0)
('margin20', 0)
('margin21', 0)
('margin22', 0)
('margin23', 0)
('margin24', 0)
('margin25', 0)
('margin26', 0)
('margin27', 0)
('margin28', 0)
('margin29', 0)
('margin30', 0)
('margin31', 0)
('margin32', 0)
('margin33', 0)
('margin34', 0)
('margin35', 0)
('margin36', 0)
('margin37', 0)
('margin38', 0)
('margin39', 0)
('margin40', 0)
('margin41', 0)
('margin42', 0)
('margin43', 0)
('margin44', 0)
('margin45', 0)
('margin46', 0)
('margin47', 0)
('margin48', 0)
('margin49', 0)
('margin50', 0)
('margin51', 0)
('margin52', 0)
('margin53', 0)
('margin54', 0)
('margin55', 0)
('margin56', 0)
('margin57', 0)
('margin58', 0)
('margin59', 0)
('margin60', 0)
('margin61', 0)
('margin

there are no nan, WOW this data set is super clean! pretty good it is ready to be fitted.

## Logistic regression

Let's start from the simplesent algorithm: Logistic regression. It is always good to start from a simple approach to understand data and future improvements.

In [13]:
params = {'C':np.linspace(850,1200,15), 'tol': [0.001, 0.0001, 0.005]}
log_reg = sklearn.linear_model.LogisticRegression(solver='newton-cg', multi_class='multinomial')
clf = GridSearchCV(log_reg, params, scoring='log_loss', n_jobs=-1, cv=5)
clf.fit(x_train, y_train)

print("best params: " + str(clf.best_params_))
for params, mean_score, scores in clf.grid_scores_:
  print("%0.3f (+/-%0.03f) for %r" % (mean_score, scores.std(), params))
  print(scores)

best params: {'C': 950.0, 'tol': 0.001}
-0.043 (+/-0.024) for {'C': 850.0, 'tol': 0.001}
[-0.04959451 -0.0173196  -0.08326873 -0.04577765 -0.02032384]
-0.042 (+/-0.024) for {'C': 850.0, 'tol': 0.0001}
[-0.04469008 -0.02006725 -0.08320248 -0.0433759  -0.01738207]
-0.049 (+/-0.029) for {'C': 850.0, 'tol': 0.005}
[-0.04347863 -0.02278357 -0.10136938 -0.05431205 -0.02351315]
-0.042 (+/-0.024) for {'C': 875.0, 'tol': 0.001}
[-0.04440599 -0.01642818 -0.08301345 -0.04631853 -0.01957703]
-0.042 (+/-0.024) for {'C': 875.0, 'tol': 0.0001}
[-0.04464018 -0.01902781 -0.08340629 -0.04347924 -0.01754161]
-0.046 (+/-0.027) for {'C': 875.0, 'tol': 0.005}
[-0.04519942 -0.01668059 -0.09084301 -0.0545228  -0.02156568]
-0.042 (+/-0.024) for {'C': 900.0, 'tol': 0.001}
[-0.04873539 -0.01611231 -0.08281082 -0.0423985  -0.01992066]
-0.042 (+/-0.024) for {'C': 900.0, 'tol': 0.0001}
[-0.04473058 -0.01935943 -0.08328105 -0.04359346 -0.01746683]
-0.046 (+/-0.024) for {'C': 900.0, 'tol': 0.005}
[-0.04800701 -0.0173

In [14]:
clf.best_score_

-0.04119561321388344

In [16]:
clf.predict(x_train)==y_train

array([ True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,

In [81]:
from scipy.stats import norm
from scipy.stats import uniform

In [82]:
param_dist = {"C": norm(loc=950.0,scale = 200.),
              "tol": uniform(loc=0.0001,scale = 0.008)
             }

In [83]:
random_search = RandomizedSearchCV(log_reg, param_distributions=param_dist,
                                   n_iter=200, scoring='log_loss', n_jobs=-1, cv=5,verbose=10)


In [None]:
random_search.fit(x_train,y_train)

Fitting 5 folds for each of 200 candidates, totalling 1000 fits
[CV] tol=0.00374946306386, C=1041.33042759 ...........................
[CV] tol=0.00374946306386, C=1041.33042759 ...........................
[CV] tol=0.00374946306386, C=1041.33042759 ...........................
[CV] tol=0.00374946306386, C=1041.33042759 ...........................
[CV] tol=0.00374946306386, C=1041.33042759 ...........................
[CV] tol=0.00057111451939, C=1007.78402295 ...........................
[CV] tol=0.00057111451939, C=1007.78402295 ...........................
[CV] tol=0.00057111451939, C=1007.78402295 ...........................
[CV] tol=0.00057111451939, C=1007.78402295 ...........................
[CV] tol=0.00057111451939, C=1007.78402295 ...........................
[CV] tol=0.000829885433192, C=795.656959325 ..........................
[CV] tol=0.000829885433192, C=795.656959325 ..........................
[CV] tol=0.000829885433192, C=795.656959325 ..........................
[CV] tol=0.00

[Parallel(n_jobs=-1)]: Done   9 tasks      | elapsed:    5.8s


[CV] . tol=0.00741458015536, C=1305.72410778, score=-0.080716 -   2.3s
[CV]  tol=0.000829885433192, C=795.656959325, score=-0.082319 -   6.2s
[CV] tol=0.00628698219372, C=973.690614564 ...........................
[CV] tol=0.00628698219372, C=973.690614564 ...........................
[CV] . tol=0.00741458015536, C=1305.72410778, score=-0.094829 -   4.2s
[CV] . tol=0.00374946306386, C=1041.33042759, score=-0.085915 -   6.4s
[CV] tol=0.00628698219372, C=973.690614564 ...........................
[CV] tol=0.00628698219372, C=973.690614564 ...........................
[CV] . tol=0.00057111451939, C=1007.78402295, score=-0.046641 -   6.5s
[CV] . tol=0.00741458015536, C=1305.72410778, score=-0.077211 -   2.4s
[CV] . tol=0.00057111451939, C=1007.78402295, score=-0.082809 -   6.6s
[CV] tol=0.00242889001888, C=929.650495133 ...........................
[CV] tol=0.00242889001888, C=929.650495133 ...........................
[CV] tol=0.00242889001888, C=929.650495133 ...........................
[CV]  

[Parallel(n_jobs=-1)]: Done  18 tasks      | elapsed:    6.7s


[CV] .. tol=0.0062719633376, C=967.200465238, score=-0.058623 -   3.1s
[CV] tol=0.00242889001888, C=929.650495133 ...........................
[CV] . tol=0.00057111451939, C=1007.78402295, score=-0.015665 -   7.9s
[CV] tol=0.0017790045666, C=948.667063989 ............................
[CV] . tol=0.00741458015536, C=1305.72410778, score=-0.162237 -   5.1s
[CV] tol=0.0017790045666, C=948.667063989 ............................
[CV] .. tol=0.0062719633376, C=967.200465238, score=-0.028583 -   3.6s
[CV] tol=0.0017790045666, C=948.667063989 ............................
[CV] .. tol=0.0062719633376, C=967.200465238, score=-0.062156 -   4.2s
[CV] tol=0.0017790045666, C=948.667063989 ............................
[CV] . tol=0.00628698219372, C=973.690614564, score=-0.050965 -   3.7s
[CV] tol=0.0017790045666, C=948.667063989 ............................
[CV] . tol=0.00628698219372, C=973.690614564, score=-0.028517 -   3.5s
[CV] tol=0.00702056994951, C=812.740287771 ...........................
[CV] .

[Parallel(n_jobs=-1)]: Done  29 tasks      | elapsed:   11.0s


[CV] . tol=0.00242889001888, C=929.650495133, score=-0.045016 -   5.4s
[CV] tol=0.00565620067972, C=905.044404435 ...........................
[CV] . tol=0.00628698219372, C=973.690614564, score=-0.090997 -   5.8s
[CV] . tol=0.00628698219372, C=973.690614564, score=-0.019452 -   5.8s
[CV] tol=0.00565620067972, C=905.044404435 ...........................
[CV] tol=0.00565620067972, C=905.044404435 ...........................
[CV] . tol=0.00242889001888, C=929.650495133, score=-0.019580 -   4.9s
[CV] tol=0.00565620067972, C=905.044404435 ...........................
[CV] .. tol=0.0017790045666, C=948.667063989, score=-0.043510 -   5.1s
[CV] tol=0.00565620067972, C=905.044404435 ...........................
[CV] . tol=0.00242889001888, C=929.650495133, score=-0.079316 -   6.6s
[CV] tol=0.00636737577424, C=1401.79841849 ...........................
[CV] . tol=0.00702056994951, C=812.740287771, score=-0.048540 -   3.9s
[CV] tol=0.00636737577424, C=1401.79841849 ...........................
[CV] .

[Parallel(n_jobs=-1)]: Done  40 tasks      | elapsed:   15.3s


[CV] tol=0.00323155898046, C=722.68235754 ............................
[CV] . tol=0.00702056994951, C=812.740287771, score=-0.023461 -   4.7s
[CV] tol=0.00323155898046, C=722.68235754 ............................
[CV] .. tol=0.0017790045666, C=948.667063989, score=-0.082773 -   6.7s
[CV] tol=0.00323155898046, C=722.68235754 ............................
[CV] . tol=0.00565620067972, C=905.044404435, score=-0.048602 -   4.1s
[CV] . tol=0.00702056994951, C=812.740287771, score=-0.122071 -   5.3s
[CV] tol=0.00396775261471, C=1270.62068747 ...........................
[CV] tol=0.00396775261471, C=1270.62068747 ...........................
[CV] . tol=0.00702056994951, C=812.740287771, score=-0.017368 -   6.2s
[CV] tol=0.00396775261471, C=1270.62068747 ...........................
[CV] . tol=0.00636737577424, C=1401.79841849, score=-0.077729 -   2.3s
[CV] . tol=0.00565620067972, C=905.044404435, score=-0.055849 -   4.4s
[CV] tol=0.00396775261471, C=1270.62068747 ...........................
[CV] t

[Parallel(n_jobs=-1)]: Done  53 tasks      | elapsed:   18.5s


[CV] .. tol=0.00323155898046, C=722.68235754, score=-0.046865 -   4.4s
[CV] tol=0.00134643428218, C=810.152057382 ...........................
[CV] .. tol=0.00323155898046, C=722.68235754, score=-0.026027 -   4.1s
[CV] tol=0.00134643428218, C=810.152057382 ...........................
[CV] .. tol=0.00323155898046, C=722.68235754, score=-0.045354 -   4.9s
[CV] tol=0.00134643428218, C=810.152057382 ...........................
[CV] . tol=0.00396775261471, C=1270.62068747, score=-0.042818 -   4.5s
[CV] tol=0.00134643428218, C=810.152057382 ...........................
[CV] . tol=0.00636737577424, C=1401.79841849, score=-0.115075 -   6.5s
[CV] tol=0.00134643428218, C=810.152057382 ...........................
[CV] . tol=0.00396775261471, C=1270.62068747, score=-0.059575 -   4.9s
[CV] tol=0.00316335812935, C=1082.16931814 ...........................
[CV] . tol=0.00510647499563, C=990.277722548, score=-0.045948 -   4.1s
[CV] .. tol=0.00323155898046, C=722.68235754, score=-0.017655 -   6.3s
[CV] t

[Parallel(n_jobs=-1)]: Done  66 tasks      | elapsed:   22.6s


[CV] . tol=0.00396775261471, C=1270.62068747, score=-0.104501 -   6.3s
[CV] tol=0.000397570823275, C=894.27391509 ...........................
[CV] . tol=0.00510647499563, C=990.277722548, score=-0.090748 -   5.6s
[CV] tol=0.00442502828547, C=926.81159149 ............................
[CV] . tol=0.00134643428218, C=810.152057382, score=-0.046069 -   5.1s
[CV] tol=0.00442502828547, C=926.81159149 ............................
[CV] . tol=0.00316335812935, C=1082.16931814, score=-0.043148 -   4.3s
[CV] tol=0.00442502828547, C=926.81159149 ............................
[CV] . tol=0.00134643428218, C=810.152057382, score=-0.045196 -   5.2s
[CV] tol=0.00442502828547, C=926.81159149 ............................
[CV] . tol=0.00316335812935, C=1082.16931814, score=-0.059765 -   4.4s
[CV] tol=0.00442502828547, C=926.81159149 ............................
[CV] . tol=0.00134643428218, C=810.152057382, score=-0.020528 -   5.4s
[CV] tol=0.0026233470704, C=1146.83793396 ............................
[CV] .

[Parallel(n_jobs=-1)]: Done  81 tasks      | elapsed:   27.9s


[CV] .. tol=0.00442502828547, C=926.81159149, score=-0.044240 -   4.6s
[CV] . tol=0.000397570823275, C=894.27391509, score=-0.019379 -   5.3s
[CV] tol=0.00560493928246, C=1023.62668072 ...........................
[CV] tol=0.00560493928246, C=1023.62668072 ...........................
[CV] . tol=0.000397570823275, C=894.27391509, score=-0.043486 -   6.4s
[CV] tol=0.00560493928246, C=1023.62668072 ...........................
[CV] . tol=0.000397570823275, C=894.27391509, score=-0.016008 -   7.2s
[CV] tol=0.000224428962985, C=830.539241097 ..........................
[CV] .. tol=0.00442502828547, C=926.81159149, score=-0.028623 -   3.9s
[CV] tol=0.000224428962985, C=830.539241097 ..........................
[CV] .. tol=0.00442502828547, C=926.81159149, score=-0.063507 -   4.4s
[CV] tol=0.000224428962985, C=830.539241097 ..........................
[CV] . tol=0.000397570823275, C=894.27391509, score=-0.083130 -   8.0s
[CV] tol=0.000224428962985, C=830.539241097 ..........................
[CV] .

[Parallel(n_jobs=-1)]: Done  96 tasks      | elapsed:   32.5s


[CV] . tol=0.00560493928246, C=1023.62668072, score=-0.023629 -   3.7s
[CV] tol=0.00314814531134, C=1110.90511647 ...........................
[CV] .. tol=0.0026233470704, C=1146.83793396, score=-0.015762 -   6.9s
[CV] tol=0.00314814531134, C=1110.90511647 ...........................
[CV] .. tol=0.0026233470704, C=1146.83793396, score=-0.085305 -   7.0s
[CV] tol=0.00314814531134, C=1110.90511647 ...........................
[CV] . tol=0.00560493928246, C=1023.62668072, score=-0.084537 -   6.1s
[CV] tol=0.00424452130643, C=696.87908465 ............................
[CV]  tol=0.000454093418902, C=804.376263513, score=-0.045240 -   5.5s
[CV] tol=0.00424452130643, C=696.87908465 ............................
[CV] . tol=0.00314814531134, C=1110.90511647, score=-0.043676 -   4.4s
[CV] tol=0.00424452130643, C=696.87908465 ............................
[CV]  tol=0.000224428962985, C=830.539241097, score=-0.044703 -   7.4s
[CV] tol=0.00424452130643, C=696.87908465 ............................
[CV]  

[Parallel(n_jobs=-1)]: Done 113 tasks      | elapsed:   39.6s


[CV]  tol=0.000454093418902, C=804.376263513, score=-0.017773 -   8.6s
[CV] tol=0.00668042379265, C=1037.33264208 ...........................
[CV]  tol=0.000454093418902, C=804.376263513, score=-0.017768 -   8.3s
[CV] tol=0.00668042379265, C=1037.33264208 ...........................
[CV] .. tol=0.00424452130643, C=696.87908465, score=-0.069916 -   4.1s
[CV] tol=0.00668042379265, C=1037.33264208 ...........................
[CV] .. tol=0.00424452130643, C=696.87908465, score=-0.022203 -   4.4s
[CV] tol=0.00668042379265, C=1037.33264208 ...........................
[CV] .. tol=0.00424452130643, C=696.87908465, score=-0.017941 -   6.2s
[CV] tol=0.00668042379265, C=1037.33264208 ...........................
[CV] . tol=0.00429714629245, C=1063.46741426, score=-0.044025 -   4.0s
[CV] tol=0.0052884212178, C=814.654632222 ............................
[CV] . tol=0.00429714629245, C=1063.46741426, score=-0.080953 -   3.6s
[CV] tol=0.0052884212178, C=814.654632222 ............................
[CV] .

[Parallel(n_jobs=-1)]: Done 130 tasks      | elapsed:   45.0s


[CV] .. tol=0.0020039645527, C=991.965617641, score=-0.083979 -   6.6s
[CV] tol=0.0016855547379, C=971.62649028 .............................
[CV] . tol=0.00429714629245, C=1063.46741426, score=-0.084740 -   6.4s
[CV] tol=0.0016855547379, C=971.62649028 .............................
[CV] . tol=0.00668042379265, C=1037.33264208, score=-0.023739 -   3.8s
[CV] tol=0.0016855547379, C=971.62649028 .............................
[CV] . tol=0.00668042379265, C=1037.33264208, score=-0.086558 -   6.1s
[CV] .. tol=0.0052884212178, C=814.654632222, score=-0.043365 -   4.5s
[CV] tol=0.00358659786907, C=705.247902704 ...........................
[CV] tol=0.00358659786907, C=705.247902704 ...........................
[CV] .. tol=0.0043296758987, C=1278.15423175, score=-0.043931 -   4.1s
[CV] tol=0.00358659786907, C=705.247902704 ...........................
[CV] .. tol=0.0043296758987, C=1278.15423175, score=-0.071864 -   3.8s
[CV] tol=0.00358659786907, C=705.247902704 ...........................
[CV] .

[Parallel(n_jobs=-1)]: Done 149 tasks      | elapsed:   51.8s


[CV] tol=0.00518385592224, C=613.427229646 ...........................
[CV] . tol=0.00358659786907, C=705.247902704, score=-0.061936 -   4.4s
[CV] tol=0.00518385592224, C=613.427229646 ...........................
[CV] . tol=0.00358659786907, C=705.247902704, score=-0.022901 -   4.8s
[CV] tol=0.00518385592224, C=613.427229646 ...........................
[CV] . tol=0.00762230875287, C=808.558004412, score=-0.049016 -   3.9s
[CV] tol=0.00518385592224, C=613.427229646 ...........................
[CV] . tol=0.00358659786907, C=705.247902704, score=-0.095747 -   6.2s
[CV] tol=0.00679007737117, C=1193.13932429 ...........................
[CV]  tol=0.000949913923912, C=1095.17920893, score=-0.047706 -   5.5s
[CV] tol=0.00679007737117, C=1193.13932429 ...........................
[CV]  tol=0.000949913923912, C=1095.17920893, score=-0.042584 -   5.4s
[CV] tol=0.00679007737117, C=1193.13932429 ...........................
[CV]  tol=0.000949913923912, C=1095.17920893, score=-0.020966 -   5.3s
[CV] t

[Parallel(n_jobs=-1)]: Done 168 tasks      | elapsed:   56.9s


[CV] . tol=0.00679007737117, C=1193.13932429, score=-0.052751 -   3.7s
[CV] tol=0.000964394460267, C=1114.73192607 ..........................
[CV] . tol=0.00518385592224, C=613.427229646, score=-0.049868 -   4.7s
[CV] tol=0.00608454031989, C=864.363351209 ...........................
[CV] . tol=0.00806978276558, C=1164.34090329, score=-0.076218 -   2.3s
[CV] tol=0.00608454031989, C=864.363351209 ...........................
[CV] . tol=0.00518385592224, C=613.427229646, score=-0.019758 -   6.6s
[CV] . tol=0.00679007737117, C=1193.13932429, score=-0.095011 -   4.3s
[CV] . tol=0.00806978276558, C=1164.34090329, score=-0.080423 -   2.5s
[CV] tol=0.00608454031989, C=864.363351209 ...........................
[CV] tol=0.00608454031989, C=864.363351209 ...........................
[CV] . tol=0.00518385592224, C=613.427229646, score=-0.084583 -   5.6s
[CV] tol=0.00608454031989, C=864.363351209 ...........................
[CV] tol=0.00682306583367, C=1003.21577448 ...........................
[CV] .

[Parallel(n_jobs=-1)]: Done 189 tasks      | elapsed:  1.1min


[CV] . tol=0.00608454031989, C=864.363351209, score=-0.019839 -   5.5s
[CV] tol=0.00639179583717, C=933.989781625 ...........................
[CV]  tol=0.000964394460267, C=1114.73192607, score=-0.019580 -   6.1s
[CV] tol=0.00639179583717, C=933.989781625 ...........................
[CV] . tol=0.00608454031989, C=864.363351209, score=-0.099902 -   5.6s
[CV] tol=0.00639179583717, C=933.989781625 ...........................
[CV]  tol=0.000964394460267, C=1114.73192607, score=-0.015901 -   7.7s
[CV] tol=0.00639179583717, C=933.989781625 ...........................
[CV]  tol=0.000964394460267, C=1114.73192607, score=-0.083930 -   7.7s
[CV] tol=0.00639179583717, C=933.989781625 ...........................
[CV] . tol=0.00682306583367, C=1003.21577448, score=-0.087372 -   6.1s
[CV] tol=0.00754484144107, C=847.637766805 ...........................
[CV] .. tol=0.0034146969007, C=751.291845281, score=-0.045778 -   4.2s
[CV] tol=0.00754484144107, C=847.637766805 ...........................
[CV]  

[Parallel(n_jobs=-1)]: Done 210 tasks      | elapsed:  1.2min


[CV] . tol=0.00639179583717, C=933.989781625, score=-0.091154 -   6.5s
[CV] tol=0.00148079645559, C=977.101364634 ...........................
[CV] . tol=0.00754484144107, C=847.637766805, score=-0.033621 -   3.5s
[CV] tol=0.00148079645559, C=977.101364634 ...........................
[CV] . tol=0.00754484144107, C=847.637766805, score=-0.060632 -   4.2s
[CV] tol=0.00148079645559, C=977.101364634 ...........................
[CV] . tol=0.00754484144107, C=847.637766805, score=-0.120469 -   5.1s
[CV] tol=0.00148079645559, C=977.101364634 ...........................
[CV] . tol=0.00754484144107, C=847.637766805, score=-0.021899 -   5.3s
[CV] tol=0.0028084304592, C=597.527734263 ............................
[CV] .. tol=0.0024444855653, C=1184.30657355, score=-0.042046 -   4.5s
[CV] tol=0.0028084304592, C=597.527734263 ............................
[CV] . tol=0.00162216200463, C=833.097330993, score=-0.047390 -   5.3s
[CV] tol=0.0028084304592, C=597.527734263 ............................
[CV] .

[Parallel(n_jobs=-1)]: Done 233 tasks      | elapsed:  1.3min


[CV] . tol=0.00500392837901, C=888.100917005, score=-0.022785 -   4.2s
[CV] tol=0.00336001963361, C=778.599351808 ...........................
[CV] .. tol=0.0028084304592, C=597.527734263, score=-0.021971 -   5.8s
[CV] tol=0.00336001963361, C=778.599351808 ...........................
[CV] .. tol=0.0028084304592, C=597.527734263, score=-0.017227 -   6.7s
[CV] tol=0.00336001963361, C=778.599351808 ...........................
[CV] . tol=0.00500392837901, C=888.100917005, score=-0.055293 -   4.7s
[CV] tol=0.00336001963361, C=778.599351808 ...........................
[CV] . tol=0.00657816344699, C=865.143858572, score=-0.046465 -   4.7s
[CV] tol=0.00336001963361, C=778.599351808 ...........................
[CV] . tol=0.00500392837901, C=888.100917005, score=-0.090220 -   6.2s
[CV] tol=0.00426715428629, C=935.157888193 ...........................
[CV] . tol=0.00657816344699, C=865.143858572, score=-0.060311 -   4.2s
[CV] . tol=0.00500392837901, C=888.100917005, score=-0.017397 -   6.5s
[CV] t

[Parallel(n_jobs=-1)]: Done 256 tasks      | elapsed:  1.5min


[CV] . tol=0.00426715428629, C=935.157888193, score=-0.018619 -   5.7s
[CV] tol=0.00353422479045, C=1337.49344987 ...........................
[CV] . tol=0.00336001963361, C=778.599351808, score=-0.015794 -   7.6s
[CV] . tol=0.00426715428629, C=935.157888193, score=-0.105266 -   6.1s
[CV] tol=0.00353422479045, C=1337.49344987 ...........................
[CV] tol=0.00117841174995, C=854.854607578 ...........................
[CV]  tol=0.000945331528527, C=965.409458174, score=-0.048025 -   5.9s
[CV] tol=0.00117841174995, C=854.854607578 ...........................
[CV] ... tol=0.0064281499948, C=988.14468917, score=-0.052689 -   3.4s
[CV] tol=0.00117841174995, C=854.854607578 ...........................
[CV] ... tol=0.0064281499948, C=988.14468917, score=-0.028455 -   3.3s
[CV] tol=0.00117841174995, C=854.854607578 ...........................
[CV] ... tol=0.0064281499948, C=988.14468917, score=-0.095559 -   4.0s
[CV] tol=0.00117841174995, C=854.854607578 ...........................
[CV] .

[Parallel(n_jobs=-1)]: Done 281 tasks      | elapsed:  1.6min


[CV] . tol=0.00117841174995, C=854.854607578, score=-0.021032 -   5.5s
[CV] tol=0.00790761607287, C=962.716604431 ...........................
[CV] . tol=0.00117841174995, C=854.854607578, score=-0.016212 -   7.6s
[CV] . tol=0.00117841174995, C=854.854607578, score=-0.083559 -   6.3s
[CV] tol=0.00790761607287, C=962.716604431 ...........................
[CV] tol=0.00790761607287, C=962.716604431 ...........................
[CV] . tol=0.00648101018625, C=1171.57380212, score=-0.193714 -   4.9s
[CV] tol=0.00534295130832, C=907.148805754 ...........................
[CV] . tol=0.00138542400205, C=919.029133164, score=-0.048661 -   5.8s
[CV] tol=0.00534295130832, C=907.148805754 ...........................
[CV] . tol=0.00469101845227, C=790.748436378, score=-0.073652 -   3.8s
[CV] tol=0.00534295130832, C=907.148805754 ...........................
[CV] . tol=0.00138542400205, C=919.029133164, score=-0.047215 -   5.1s
[CV] tol=0.00534295130832, C=907.148805754 ...........................
[CV] .

[Parallel(n_jobs=-1)]: Done 306 tasks      | elapsed:  1.7min


[CV] tol=0.000727349025898, C=1164.61161157 ..........................
[CV] . tol=0.00637890184162, C=1001.95690928, score=-0.023721 -   3.9s
[CV] tol=0.000490942301412, C=1055.39697825 ..........................
[CV]  tol=0.000571261194053, C=706.486976985, score=-0.020447 -   5.2s
[CV] tol=0.000490942301412, C=1055.39697825 ..........................
[CV] . tol=0.00568867938126, C=997.245245287, score=-0.046963 -   4.4s
[CV] tol=0.000490942301412, C=1055.39697825 ..........................
[CV] . tol=0.00568867938126, C=997.245245287, score=-0.083372 -   4.5s
[CV] tol=0.000490942301412, C=1055.39697825 ..........................
[CV]  tol=0.000571261194053, C=706.486976985, score=-0.042841 -   5.9s
[CV] tol=0.000490942301412, C=1055.39697825 ..........................
[CV] . tol=0.00637890184162, C=1001.95690928, score=-0.088372 -   5.9s
[CV]  tol=0.000571261194053, C=706.486976985, score=-0.016875 -   7.6s
[CV] tol=0.00048962872256, C=1051.13338026 ...........................
[CV] t

[Parallel(n_jobs=-1)]: Done 333 tasks      | elapsed:  1.9min


[CV] tol=0.00643632967696, C=1022.53214266 ...........................
[CV] . tol=0.00216725548932, C=1245.32794538, score=-0.042926 -   4.3s
[CV] tol=0.00487232490708, C=1017.42930442 ...........................
[CV] . tol=0.00731801875951, C=1180.53920313, score=-0.080461 -   2.4s
[CV] tol=0.00487232490708, C=1017.42930442 ...........................
[CV] . tol=0.00731801875951, C=1180.53920313, score=-0.076349 -   2.5s
[CV] . tol=0.00731801875951, C=1180.53920313, score=-0.060699 -   3.3s
[CV] . tol=0.00048962872256, C=1051.13338026, score=-0.019453 -   6.0s
[CV] tol=0.00487232490708, C=1017.42930442 ...........................
[CV] tol=0.00487232490708, C=1017.42930442 ...........................
[CV] tol=0.00487232490708, C=1017.42930442 ...........................
[CV] . tol=0.00216725548932, C=1245.32794538, score=-0.046558 -   5.2s
[CV] tol=0.00667455409101, C=897.97150179 ............................
[CV] . tol=0.00643632967696, C=1022.53214266, score=-0.053586 -   3.7s
[CV] t

[Parallel(n_jobs=-1)]: Done 360 tasks      | elapsed:  2.0min


[CV] tol=0.000503406437332, C=1160.39686275 ..........................
[CV] .. tol=0.0080915198149, C=1055.72926574, score=-0.095371 -   4.1s
[CV] tol=0.000503406437332, C=1160.39686275 ..........................
[CV] .. tol=0.00667455409101, C=897.97150179, score=-0.023435 -   5.8s
[CV] tol=0.000503406437332, C=1160.39686275 ..........................
[CV] .. tol=0.0080915198149, C=1055.72926574, score=-0.239643 -   4.4s
[CV] tol=0.000503406437332, C=1160.39686275 ..........................
[CV] .. tol=0.00667455409101, C=897.97150179, score=-0.100555 -   5.9s
[CV] tol=0.00376772662271, C=1251.35982435 ...........................
[CV] .. tol=0.0049828363614, C=793.869870262, score=-0.045905 -   4.2s
[CV] tol=0.00376772662271, C=1251.35982435 ...........................
[CV] . tol=0.00315889875163, C=1060.21862299, score=-0.053115 -   3.4s
[CV] tol=0.00376772662271, C=1251.35982435 ...........................
[CV] .. tol=0.0049828363614, C=793.869870262, score=-0.051640 -   5.0s
[CV] t

[Parallel(n_jobs=-1)]: Done 389 tasks      | elapsed:  2.2min


[CV] . tol=0.00582914222876, C=1069.78038695, score=-0.086171 -   6.4s
[CV] tol=0.000427895576338, C=1120.66648752 ..........................
[CV] . tol=0.00449875679507, C=969.790513098, score=-0.062639 -   4.7s
[CV] tol=0.000427895576338, C=1120.66648752 ..........................
[CV] . tol=0.00449875679507, C=969.790513098, score=-0.017016 -   5.8s
[CV] tol=0.000427895576338, C=1120.66648752 ..........................
[CV] . tol=0.00449875679507, C=969.790513098, score=-0.025900 -   4.2s
[CV] tol=0.000427895576338, C=1120.66648752 ..........................
[CV] . tol=0.00449875679507, C=969.790513098, score=-0.091099 -   6.0s
[CV] tol=0.0045105435658, C=852.967702863 ............................
[CV] .. tol=0.00365414303523, C=816.65213007, score=-0.044023 -   4.4s
[CV] tol=0.0045105435658, C=852.967702863 ............................
[CV] . tol=0.00119986656427, C=847.941097905, score=-0.046421 -   4.9s
[CV] tol=0.0045105435658, C=852.967702863 ............................
[CV] .

[Parallel(n_jobs=-1)]: Done 418 tasks      | elapsed:  2.3min


[CV] tol=0.0020067424514, C=841.286640983 ............................
[CV]  tol=0.000636298416502, C=1217.65305347, score=-0.047872 -   5.3s
[CV] tol=0.00209757422791, C=751.298917973 ...........................
[CV] .. tol=0.0056586488636, C=995.782174428, score=-0.083446 -   6.2s
[CV] tol=0.00209757422791, C=751.298917973 ...........................
[CV] . tol=0.00415073059897, C=1069.80029863, score=-0.077586 -   3.3s
[CV] tol=0.00209757422791, C=751.298917973 ...........................
[CV] . tol=0.00415073059897, C=1069.80029863, score=-0.044282 -   4.2s
[CV] tol=0.00209757422791, C=751.298917973 ...........................
[CV]  tol=0.000636298416502, C=1217.65305347, score=-0.015620 -   8.1s
[CV]  tol=0.000636298416502, C=1217.65305347, score=-0.045160 -   5.1s
[CV] tol=0.00435899372111, C=1141.99062017 ...........................
[CV] tol=0.00209757422791, C=751.298917973 ...........................
[CV] . tol=0.00415073059897, C=1069.80029863, score=-0.020709 -   4.6s
[CV] .

[Parallel(n_jobs=-1)]: Done 449 tasks      | elapsed:  2.5min


[CV] . tol=0.00366335067509, C=505.762293074, score=-0.019248 -   6.0s
[CV] tol=0.00761692019851, C=699.212913302 ...........................
[CV] . tol=0.00366335067509, C=505.762293074, score=-0.082911 -   5.8s
[CV] tol=0.00761692019851, C=699.212913302 ...........................
[CV] . tol=0.00163198392352, C=975.302729694, score=-0.024756 -   4.5s
[CV] tol=0.00761692019851, C=699.212913302 ...........................
[CV] . tol=0.00142511501003, C=770.197553629, score=-0.044173 -   4.7s
[CV] tol=0.00761692019851, C=699.212913302 ...........................
[CV] . tol=0.00163198392352, C=975.302729694, score=-0.042997 -   5.1s
[CV] tol=0.00761692019851, C=699.212913302 ...........................
[CV] . tol=0.00163198392352, C=975.302729694, score=-0.015822 -   6.8s
[CV] tol=0.000545175099548, C=891.482710536 ..........................
[CV] . tol=0.00163198392352, C=975.302729694, score=-0.083997 -   6.1s
[CV] tol=0.000545175099548, C=891.482710536 ..........................
[CV] .

[Parallel(n_jobs=-1)]: Done 480 tasks      | elapsed:  2.7min


[CV]  tol=0.000545175099548, C=891.482710536, score=-0.082207 -   7.2s
[CV]  tol=0.000545175099548, C=891.482710536, score=-0.015929 -   7.4s
[CV] . tol=0.00283260203035, C=843.188650933, score=-0.016987 -   6.1s
[CV] tol=0.00684102445522, C=1417.89973541 ...........................
[CV] tol=0.00684102445522, C=1417.89973541 ...........................
[CV] tol=0.00684102445522, C=1417.89973541 ...........................
[CV] . tol=0.00283260203035, C=843.188650933, score=-0.084355 -   6.3s
[CV] tol=0.00684102445522, C=1417.89973541 ...........................
[CV] . tol=0.00677794296655, C=1200.19354357, score=-0.107514 -   5.9s
[CV] tol=0.00053153677675, C=1149.7990691 ............................
[CV] . tol=0.00315008576311, C=1190.21404057, score=-0.041961 -   4.5s
[CV] tol=0.00053153677675, C=1149.7990691 ............................
[CV] . tol=0.00684102445522, C=1417.89973541, score=-0.136589 -   2.3s
[CV] tol=0.00053153677675, C=1149.7990691 ............................
[CV] .

[Parallel(n_jobs=-1)]: Done 513 tasks      | elapsed:  2.9min


[CV] tol=0.00585713834142, C=714.031685635 ...........................
[CV] ... tol=0.00690587578467, C=862.9921283, score=-0.019621 -   5.7s
[CV] tol=0.00585713834142, C=714.031685635 ...........................
[CV] . tol=0.00518193192877, C=895.981969443, score=-0.055638 -   4.9s
[CV] tol=0.00585713834142, C=714.031685635 ...........................
[CV] . tol=0.00518193192877, C=895.981969443, score=-0.023034 -   4.4s
[CV] . tol=0.00518193192877, C=895.981969443, score=-0.017491 -   6.2s
[CV] tol=0.00585713834142, C=714.031685635 ...........................
[CV] tol=0.00585713834142, C=714.031685635 ...........................
[CV] . tol=0.00410876563615, C=721.376531068, score=-0.046700 -   4.4s
[CV] tol=0.00802176147489, C=1047.54595962 ...........................
[CV] . tol=0.00585713834142, C=714.031685635, score=-0.053531 -   3.3s
[CV] tol=0.00802176147489, C=1047.54595962 ...........................
[CV] . tol=0.00410876563615, C=721.376531068, score=-0.026003 -   4.1s
[CV] t

[Parallel(n_jobs=-1)]: Done 546 tasks      | elapsed:  3.1min


[CV] .. tol=0.0031921434081, C=1168.98653782, score=-0.060159 -   4.4s
[CV] tol=0.00118108464728, C=1046.89036324 ...........................
[CV]  tol=0.000764141635668, C=1258.92447076, score=-0.019239 -   6.0s
[CV] tol=0.00118108464728, C=1046.89036324 ...........................
[CV] . tol=0.00305403676483, C=766.086657798, score=-0.044220 -   4.8s
[CV] tol=0.00118108464728, C=1046.89036324 ...........................
[CV]  tol=0.000764141635668, C=1258.92447076, score=-0.084859 -   6.9s
[CV] tol=0.00118108464728, C=1046.89036324 ...........................
[CV]  tol=0.000764141635668, C=1258.92447076, score=-0.015738 -   7.4s
[CV] tol=0.00118108464728, C=1046.89036324 ...........................
[CV] .. tol=0.0031921434081, C=1168.98653782, score=-0.089952 -   6.3s
[CV] tol=0.000594069286188, C=1125.65723748 ..........................
[CV] .. tol=0.0031921434081, C=1168.98653782, score=-0.017106 -   7.3s
[CV] tol=0.000594069286188, C=1125.65723748 ..........................
[CV] .

[Parallel(n_jobs=-1)]: Done 581 tasks      | elapsed:  3.2min


[CV]  tol=0.000594069286188, C=1125.65723748, score=-0.016030 -   8.0s
[CV] tol=0.00664070357871, C=1167.10077853 ...........................
[CV]  tol=0.000594069286188, C=1125.65723748, score=-0.084160 -   7.8s
[CV] tol=0.00664070357871, C=1167.10077853 ...........................
[CV] . tol=0.00639043149059, C=620.368953551, score=-0.053738 -   3.7s
[CV] tol=0.00458742040277, C=1128.73174298 ...........................
[CV] . tol=0.00708423773645, C=1024.32945722, score=-0.086782 -   6.0s
[CV] tol=0.00458742040277, C=1128.73174298 ...........................
[CV] . tol=0.00639043149059, C=620.368953551, score=-0.045413 -   4.9s
[CV] tol=0.00458742040277, C=1128.73174298 ...........................
[CV] . tol=0.00639043149059, C=620.368953551, score=-0.083800 -   5.6s
[CV] . tol=0.00639043149059, C=620.368953551, score=-0.024306 -   4.7s
[CV] . tol=0.00664070357871, C=1167.10077853, score=-0.071280 -   2.6s
[CV] tol=0.00458742040277, C=1128.73174298 ...........................
[CV] t

In [75]:
random_search.best_score_

-0.041110479918746973

In [76]:
random_search.best_params_

{'C': 952.41129537107952, 'tol': 0.00091539811739019511}

---

In [27]:
import sklearn.svm

In [37]:
params = {'C':[1, 10, 50, 100, 500, 1000, 2000], 'tol': [0.001, 0.0001, 0.005]}
clf = sklearn.svm.SVC(probability=True)
grid = GridSearchCV(clf, params, scoring='log_loss', n_jobs=-1, cv=5,verbose=10)

In [38]:
grid.fit(x_train, y_train)

Fitting 5 folds for each of 21 candidates, totalling 105 fits
[CV] tol=0.001, C=1 ..................................................
[CV] tol=0.001, C=1 ..................................................
[CV] tol=0.001, C=1 ..................................................
[CV] tol=0.001, C=1 ..................................................
[CV] tol=0.001, C=1 ..................................................
[CV] tol=0.0001, C=1 .................................................
[CV] tol=0.0001, C=1 .................................................
[CV] tol=0.0001, C=1 .................................................
[CV] tol=0.0001, C=1 .................................................
[CV] tol=0.005, C=1 ..................................................
[CV] tol=0.0001, C=1 .................................................
[CV] tol=0.005, C=1 ..................................................
[CV] tol=0.005, C=1 ..................................................
[CV] tol=0.005,

[Parallel(n_jobs=-1)]: Done   9 tasks      | elapsed:    2.5s


[CV] ....................... tol=0.005, C=10, score=-2.399805 -   2.3s
[CV] tol=0.001, C=50 .................................................
[CV] ....................... tol=0.005, C=10, score=-2.407149 -   2.3s
[CV] tol=0.001, C=50 .................................................
[CV] ....................... tol=0.001, C=10, score=-2.397850 -   2.4s
[CV] ....................... tol=0.001, C=10, score=-2.399774 -   2.4s
[CV] tol=0.0001, C=50 ................................................
[CV] ....................... tol=0.001, C=10, score=-2.404600 -   2.4s
[CV] ....................... tol=0.001, C=10, score=-2.384212 -   2.4s
[CV] tol=0.0001, C=50 ................................................
[CV] tol=0.001, C=50 .................................................
[CV] tol=0.0001, C=50 ................................................
[CV] ....................... tol=0.005, C=10, score=-2.397857 -   2.3s
[CV] tol=0.0001, C=50 ................................................
[CV] .

[Parallel(n_jobs=-1)]: Done  18 tasks      | elapsed:    4.8s
[Parallel(n_jobs=-1)]: Done  29 tasks      | elapsed:    4.9s


[CV] tol=0.001, C=100 ................................................
[CV] ....................... tol=0.001, C=50, score=-2.397415 -   2.3s
[CV] tol=0.001, C=100 ................................................
[CV] ....................... tol=0.005, C=50, score=-2.402342 -   2.3s
[CV] ....................... tol=0.001, C=50, score=-2.403580 -   2.4s
[CV] tol=0.001, C=100 ................................................
[CV] ....................... tol=0.001, C=50, score=-2.383676 -   2.4s
[CV] tol=0.0001, C=100 ...............................................
[CV] tol=0.0001, C=100 ...............................................
[CV] ....................... tol=0.005, C=50, score=-2.402036 -   2.3s
[CV] tol=0.0001, C=100 ...............................................
[CV] ....................... tol=0.005, C=50, score=-2.403654 -   2.3s
[CV] ....................... tol=0.005, C=50, score=-2.397414 -   2.3s
[CV] tol=0.0001, C=100 ...............................................
[CV] t

[Parallel(n_jobs=-1)]: Done  40 tasks      | elapsed:    7.2s


[CV] ...................... tol=0.001, C=100, score=-2.392983 -   2.4s
[CV] tol=0.001, C=500 ................................................
[CV] ...................... tol=0.001, C=100, score=-2.382596 -   2.4s
[CV] tol=0.0001, C=500 ...............................................
[CV] ...................... tol=0.005, C=100, score=-2.395230 -   2.3s
[CV] tol=0.0001, C=500 ...............................................
[CV] ...................... tol=0.005, C=100, score=-2.376936 -   2.3s
[CV] ...................... tol=0.005, C=100, score=-2.383454 -   2.3s
[CV] tol=0.0001, C=500 ...............................................
[CV] tol=0.0001, C=500 ...............................................
[CV] ...................... tol=0.005, C=100, score=-2.382634 -   2.3s
[CV] tol=0.0001, C=500 ...............................................
[CV] ...................... tol=0.005, C=100, score=-2.393056 -   2.3s
[CV] tol=0.005, C=500 ................................................
[CV] .

[Parallel(n_jobs=-1)]: Done  53 tasks      | elapsed:    9.6s


[CV] ...................... tol=0.001, C=500, score=-2.331028 -   2.4s
[CV] tol=0.0001, C=1000 ..............................................
[CV] ...................... tol=0.005, C=500, score=-2.345045 -   2.3s
[CV] tol=0.0001, C=1000 ..............................................
[CV] ...................... tol=0.005, C=500, score=-2.347388 -   2.3s
[CV] tol=0.0001, C=1000 ..............................................
[CV] ...................... tol=0.005, C=500, score=-2.334039 -   2.3s
[CV] tol=0.0001, C=1000 ..............................................
[CV] ...................... tol=0.005, C=500, score=-2.338834 -   2.3s
[CV] tol=0.0001, C=1000 ..............................................
[CV] ...................... tol=0.005, C=500, score=-2.331086 -   2.3s
[CV] tol=0.005, C=1000 ...............................................
[CV] ..................... tol=0.0001, C=500, score=-2.345024 -   2.5s
[CV] tol=0.005, C=1000 ...............................................
[CV] .

[Parallel(n_jobs=-1)]: Done  66 tasks      | elapsed:   11.9s


[CV] ..................... tol=0.001, C=1000, score=-2.331028 -   2.4s
[CV] tol=0.0001, C=2000 ..............................................
[CV] ..................... tol=0.005, C=1000, score=-2.396065 -   2.3s
[CV] tol=0.0001, C=2000 ..............................................
[CV] .................... tol=0.0001, C=1000, score=-2.396043 -   2.5s
[CV] ..................... tol=0.005, C=1000, score=-2.388656 -   2.3s
[CV] tol=0.0001, C=2000 ..............................................
[CV] tol=0.0001, C=2000 ..............................................
[CV] ..................... tol=0.005, C=1000, score=-2.389951 -   2.3s
[CV] tol=0.0001, C=2000 ..............................................
[CV] ..................... tol=0.005, C=1000, score=-2.396199 -   2.3s
[CV] tol=0.005, C=2000 ...............................................
[CV] ..................... tol=0.005, C=1000, score=-2.378698 -   2.3s
[CV] tol=0.005, C=2000 ...............................................
[CV] .

[Parallel(n_jobs=-1)]: Done 105 out of 105 | elapsed:   16.7s finished


GridSearchCV(cv=5, error_score='raise',
       estimator=SVC(C=1.0, cache_size=200, class_weight=None, coef0=0.0,
  decision_function_shape=None, degree=3, gamma='auto', kernel='rbf',
  max_iter=-1, probability=True, random_state=None, shrinking=True,
  tol=0.001, verbose=False),
       fit_params={}, iid=True, n_jobs=-1,
       param_grid={'tol': [0.001, 0.0001, 0.005], 'C': [1, 10, 50, 100, 500, 1000, 2000]},
       pre_dispatch='2*n_jobs', refit=True, scoring='log_loss', verbose=10)

In [39]:
grid.best_score_

-2.3392352530188951

- - - 

In [42]:
from sklearn.feature_selection import SelectFromModel


In [45]:
clf.best_estimator_.coef_.co

(99, 192)

In [80]:
test = pd.read_csv('test.csv')
test_ids = test.pop('id')
x_test = test.values
scaler = StandardScaler().fit(x_test)
x_test = scaler.transform(x_test)

y_test = clf.predict_proba(x_test)

submission = pd.DataFrame(y_test, index=test_ids, columns=le.classes_)
submission.to_csv('submission.csv')