# Loading the data

In [1]:
import pandas as pd
import numpy as np
from sklearn.ensemble import RandomForestClassifier,GradientBoostingClassifier
from sklearn.preprocessing import label_binarize

In [2]:
!ls data

[1m[36mtitanic[m[m [1m[36mwine[m[m


In [3]:
training_data = pd.read_csv('./data/titanic/cleandata.train.csv')
test_data = pd.read_csv('./data/titanic/cleandata.test.csv')

training_data['Training_set'] = 1
test_data['Training_set'] = 0

In [4]:
full_data = pd.concat([training_data, test_data])

In [5]:
full_data

Unnamed: 0,passengerid,survived,pclass,name,sex,age,sibsp,parch,ticket,fare,cabin,embarked,lastName,title,otherName,Training_set
0,522,yes,3,"Vovk, Mr. Janko",male,22.0,0,0,349252,7.8958,,S,Vovk,Mr,Janko,1
1,8,yes,3,"Palsson, Master. Gosta Leonard",male,2.0,3,1,349909,21.0750,,S,Palsson,Master,Gosta Leonard,1
2,262,no,3,"Asplund, Master. Edvin Rojj Felix",male,3.0,4,2,347077,31.3875,,S,Asplund,Master,Edvin Rojj Felix,1
3,247,yes,3,"Lindahl, Miss. Agda Thorilda Viktoria",female,25.0,0,0,347071,7.7750,,S,Lindahl,Miss,Agda Thorilda Viktoria,1
4,722,yes,3,"Jensen, Mr. Svend Lauritz",male,17.0,1,0,350048,7.0542,,S,Jensen,Mr,Svend Lauritz,1
5,231,no,1,"Harris, Mrs. Henry Birkhardt (Irene Wallach)",female,35.0,1,0,36973,83.4750,C83,S,Harris,Mrs,Henry Birkhardt (Irene Wallach),1
6,642,no,1,"Sagesser, Mlle. Emma",female,24.0,0,0,PC 17477,69.3000,B35,C,Sagesser,Miss,Emma,1
7,801,yes,2,"Ponesell, Mr. Martin",male,34.0,0,0,250647,13.0000,,S,Ponesell,Mr,Martin,1
8,839,no,3,"Chip, Mr. Chang",male,32.0,0,0,1601,56.4958,,S,Chip,Mr,Chang,1
9,65,yes,1,"Stewart, Mr. Albert A",male,,0,0,PC 17605,27.7208,,C,Stewart,Mr,Albert A,1


In [6]:
full_data['result'] = label_binarize(full_data['survived'], classes=['no','yes'], neg_label=0, pos_label=1)

In [7]:
full_data

Unnamed: 0,passengerid,survived,pclass,name,sex,age,sibsp,parch,ticket,fare,cabin,embarked,lastName,title,otherName,Training_set,result
0,522,yes,3,"Vovk, Mr. Janko",male,22.0,0,0,349252,7.8958,,S,Vovk,Mr,Janko,1,1
1,8,yes,3,"Palsson, Master. Gosta Leonard",male,2.0,3,1,349909,21.0750,,S,Palsson,Master,Gosta Leonard,1,1
2,262,no,3,"Asplund, Master. Edvin Rojj Felix",male,3.0,4,2,347077,31.3875,,S,Asplund,Master,Edvin Rojj Felix,1,0
3,247,yes,3,"Lindahl, Miss. Agda Thorilda Viktoria",female,25.0,0,0,347071,7.7750,,S,Lindahl,Miss,Agda Thorilda Viktoria,1,1
4,722,yes,3,"Jensen, Mr. Svend Lauritz",male,17.0,1,0,350048,7.0542,,S,Jensen,Mr,Svend Lauritz,1,1
5,231,no,1,"Harris, Mrs. Henry Birkhardt (Irene Wallach)",female,35.0,1,0,36973,83.4750,C83,S,Harris,Mrs,Henry Birkhardt (Irene Wallach),1,0
6,642,no,1,"Sagesser, Mlle. Emma",female,24.0,0,0,PC 17477,69.3000,B35,C,Sagesser,Miss,Emma,1,0
7,801,yes,2,"Ponesell, Mr. Martin",male,34.0,0,0,250647,13.0000,,S,Ponesell,Mr,Martin,1,1
8,839,no,3,"Chip, Mr. Chang",male,32.0,0,0,1601,56.4958,,S,Chip,Mr,Chang,1,0
9,65,yes,1,"Stewart, Mr. Albert A",male,,0,0,PC 17605,27.7208,,C,Stewart,Mr,Albert A,1,1


In [8]:
categories = ['survived', 'pclass', 'sex', 'embarked', 'title']

In [9]:
for variable in categories:
    full_data[variable] = full_data[variable].astype('category')

# Creating dummy variables and cleaning up data

In [10]:
dummy_sex = pd.get_dummies(full_data['sex'], prefix='sex')
dummy_embarked = pd.get_dummies(full_data['embarked'], prefix='embarked')
dummy_title = pd.get_dummies(full_data['title'],prefix='title')
dummy_pclass = pd.get_dummies(full_data['pclass'],prefix='pclass')

In [11]:
# Add missing ages
full_data.age.fillna(value=full_data.age.mean(), inplace=True)

In [12]:
full_data = pd.concat([full_data, dummy_sex, dummy_embarked, dummy_title, dummy_pclass], axis=1)

In [13]:
full_data

Unnamed: 0,passengerid,survived,pclass,name,sex,age,sibsp,parch,ticket,fare,...,embarked_Q,embarked_S,title_Master,title_Miss,title_Mr,title_Mrs,title_Rev,pclass_1,pclass_2,pclass_3
0,522,yes,3,"Vovk, Mr. Janko",male,22.000000,0,0,349252,7.8958,...,0,1,0,0,1,0,0,0,0,1
1,8,yes,3,"Palsson, Master. Gosta Leonard",male,2.000000,3,1,349909,21.0750,...,0,1,1,0,0,0,0,0,0,1
2,262,no,3,"Asplund, Master. Edvin Rojj Felix",male,3.000000,4,2,347077,31.3875,...,0,1,1,0,0,0,0,0,0,1
3,247,yes,3,"Lindahl, Miss. Agda Thorilda Viktoria",female,25.000000,0,0,347071,7.7750,...,0,1,0,1,0,0,0,0,0,1
4,722,yes,3,"Jensen, Mr. Svend Lauritz",male,17.000000,1,0,350048,7.0542,...,0,1,0,0,1,0,0,0,0,1
5,231,no,1,"Harris, Mrs. Henry Birkhardt (Irene Wallach)",female,35.000000,1,0,36973,83.4750,...,0,1,0,0,0,1,0,1,0,0
6,642,no,1,"Sagesser, Mlle. Emma",female,24.000000,0,0,PC 17477,69.3000,...,0,0,0,1,0,0,0,1,0,0
7,801,yes,2,"Ponesell, Mr. Martin",male,34.000000,0,0,250647,13.0000,...,0,1,0,0,1,0,0,0,1,0
8,839,no,3,"Chip, Mr. Chang",male,32.000000,0,0,1601,56.4958,...,0,1,0,0,1,0,0,0,0,1
9,65,yes,1,"Stewart, Mr. Albert A",male,29.699118,0,0,PC 17605,27.7208,...,0,0,0,0,1,0,0,1,0,0


In [14]:
full_data.drop(["sex", "embarked", "title", "pclass", "otherName", "lastName", "name", "passengerid"], inplace=True, axis=1)

In [15]:
full_data.head(10)

Unnamed: 0,survived,age,sibsp,parch,ticket,fare,cabin,Training_set,result,sex_female,...,embarked_Q,embarked_S,title_Master,title_Miss,title_Mr,title_Mrs,title_Rev,pclass_1,pclass_2,pclass_3
0,yes,22.0,0,0,349252,7.8958,,1,1,0,...,0,1,0,0,1,0,0,0,0,1
1,yes,2.0,3,1,349909,21.075,,1,1,0,...,0,1,1,0,0,0,0,0,0,1
2,no,3.0,4,2,347077,31.3875,,1,0,0,...,0,1,1,0,0,0,0,0,0,1
3,yes,25.0,0,0,347071,7.775,,1,1,1,...,0,1,0,1,0,0,0,0,0,1
4,yes,17.0,1,0,350048,7.0542,,1,1,0,...,0,1,0,0,1,0,0,0,0,1
5,no,35.0,1,0,36973,83.475,C83,1,0,1,...,0,1,0,0,0,1,0,1,0,0
6,no,24.0,0,0,PC 17477,69.3,B35,1,0,1,...,0,0,0,1,0,0,0,1,0,0
7,yes,34.0,0,0,250647,13.0,,1,1,0,...,0,1,0,0,1,0,0,0,1,0
8,no,32.0,0,0,1601,56.4958,,1,0,0,...,0,1,0,0,1,0,0,0,0,1
9,yes,29.699118,0,0,PC 17605,27.7208,,1,1,0,...,0,0,0,0,1,0,0,1,0,0


In [16]:
full_data.survived = full_data.survived.apply(lambda label: 1 if label == "yes" else 0)

In [17]:
full_data.survived.value_counts()

1    549
0    342
Name: survived, dtype: int64

# Splitting data into training and test

In [18]:
training_data = full_data[full_data['Training_set'] == 1]
test_data = full_data[full_data['Training_set'] == 0]

In [19]:
training_data

Unnamed: 0,survived,age,sibsp,parch,ticket,fare,cabin,Training_set,result,sex_female,...,embarked_Q,embarked_S,title_Master,title_Miss,title_Mr,title_Mrs,title_Rev,pclass_1,pclass_2,pclass_3
0,1,22.000000,0,0,349252,7.8958,,1,1,0,...,0,1,0,0,1,0,0,0,0,1
1,1,2.000000,3,1,349909,21.0750,,1,1,0,...,0,1,1,0,0,0,0,0,0,1
2,0,3.000000,4,2,347077,31.3875,,1,0,0,...,0,1,1,0,0,0,0,0,0,1
3,1,25.000000,0,0,347071,7.7750,,1,1,1,...,0,1,0,1,0,0,0,0,0,1
4,1,17.000000,1,0,350048,7.0542,,1,1,0,...,0,1,0,0,1,0,0,0,0,1
5,0,35.000000,1,0,36973,83.4750,C83,1,0,1,...,0,1,0,0,0,1,0,1,0,0
6,0,24.000000,0,0,PC 17477,69.3000,B35,1,0,1,...,0,0,0,1,0,0,0,1,0,0
7,1,34.000000,0,0,250647,13.0000,,1,1,0,...,0,1,0,0,1,0,0,0,1,0
8,0,32.000000,0,0,1601,56.4958,,1,0,0,...,0,1,0,0,1,0,0,0,0,1
9,1,29.699118,0,0,PC 17605,27.7208,,1,1,0,...,0,0,0,0,1,0,0,1,0,0


# Random Forest implementation

In [20]:
rf = RandomForestClassifier(max_features=10,n_estimators=1000)

In [21]:
full_data.columns.values

array(['survived', 'age', 'sibsp', 'parch', 'ticket', 'fare', 'cabin',
       'Training_set', 'result', 'sex_female', 'sex_male', 'embarked_C',
       'embarked_Q', 'embarked_S', 'title_Master', 'title_Miss',
       'title_Mr', 'title_Mrs', 'title_Rev', 'pclass_1', 'pclass_2',
       'pclass_3'], dtype=object)

In [22]:
relevant_x_columns = ['age','sibsp','parch','fare',
                     'sex_female', 'sex_male', 'embarked_C',
                     'embarked_Q', 'embarked_S', 'title_Master',
                     'title_Miss', 'title_Mr', 'title_Rev', 'pclass_1',
                     'pclass_2', 'pclass_3']

In [23]:
X_train = np.array(training_data[relevant_x_columns])
y_train = np.array(training_data['survived'])

In [24]:
X_test = np.array(test_data[relevant_x_columns])
y_test = np.array(test_data['result'])

In [25]:
print(X_train.shape)
print(X_test.shape)
print(y_test.shape)
print(y_train.shape)

(712, 16)
(179, 16)
(179,)
(712,)


In [26]:
rf.fit(X_train,y_train)

RandomForestClassifier(bootstrap=True, class_weight=None, criterion='gini',
            max_depth=None, max_features=10, max_leaf_nodes=None,
            min_impurity_split=1e-07, min_samples_leaf=1,
            min_samples_split=2, min_weight_fraction_leaf=0.0,
            n_estimators=1000, n_jobs=1, oob_score=False,
            random_state=None, verbose=0, warm_start=False)

In [27]:
y_pred = rf.predict(X_test)

In [28]:
rf.score(X_test, y_test)

0.81005586592178769

In [29]:
rf.feature_importances_

array([ 0.22023559,  0.04817397,  0.02422236,  0.2295941 ,  0.09616498,
        0.09117046,  0.01099272,  0.00913498,  0.01607898,  0.01182036,
        0.0084982 ,  0.11985606,  0.0066148 ,  0.02385303,  0.01268124,
        0.07090818])

# GradientBoostedTrees Implementation

In [30]:
from sklearn.ensemble import GradientBoostingClassifier

In [31]:
GBC = GradientBoostingClassifier(n_estimators=1000, max_depth=5)

In [32]:
GBC.fit(X_train,y_train)

GradientBoostingClassifier(criterion='friedman_mse', init=None,
              learning_rate=0.1, loss='deviance', max_depth=5,
              max_features=None, max_leaf_nodes=None,
              min_impurity_split=1e-07, min_samples_leaf=1,
              min_samples_split=2, min_weight_fraction_leaf=0.0,
              n_estimators=1000, presort='auto', random_state=None,
              subsample=1.0, verbose=0, warm_start=False)

In [33]:
GBC.predict(X_test)

array([0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0,
       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1,
       0, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0,
       0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1,
       0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 0,
       1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1,
       1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0,
       1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1])

In [34]:
GBC.score(X_test,y_test)

0.78770949720670391

# GridSearch

In [38]:
from sklearn.grid_search import GridSearchCV
from sklearn.svm import SVC

In [39]:
parameters = {'kernel':['rbf','linear'], 'C':np.logspace(-3,3,5), 'gamma':np.logspace(-3,3,5)}

In [40]:
GridsearchSVM = GridSearchCV(SVC(), parameters, cv=5, verbose=10, scoring='roc_auc', n_jobs=2)

In [None]:
GridsearchSVM.fit(X_train, y_train)

Fitting 5 folds for each of 50 candidates, totalling 250 fits
[CV] kernel=rbf, C=0.001, gamma=0.001 ................................
[CV] kernel=rbf, C=0.001, gamma=0.001 ................................
[CV] kernel=rbf, C=0.001, gamma=0.001 ................................
[CV] ....... kernel=rbf, C=0.001, gamma=0.001, score=0.698847 -   0.0s
[CV] kernel=rbf, C=0.001, gamma=0.001 ................................
[CV] kernel=rbf, C=0.001, gamma=0.001 ................................
[CV] kernel=linear, C=0.001, gamma=0.001 .............................
[CV] kernel=linear, C=0.001, gamma=0.001 .............................
[CV] ....... kernel=rbf, C=0.001, gamma=0.001, score=0.708910 -   0.1s
[CV] kernel=linear, C=0.001, gamma=0.001 .............................
[CV] ....... kernel=rbf, C=0.001, gamma=0.001, score=0.655289 -   0.1s
[CV] ....... kernel=rbf, C=0.001, gamma=0.001, score=0.696417 -   0.0s
[CV] ....... kernel=rbf, C=0.001, gamma=0.001, score=0.749629 -   0.0s
[CV] .... kerne

[Parallel(n_jobs=7)]: Batch computation too fast (0.1103s.) Setting batch_size=2.
[Parallel(n_jobs=7)]: Done   5 tasks      | elapsed:    0.2s
[Parallel(n_jobs=7)]: Done  12 tasks      | elapsed:    0.2s
[Parallel(n_jobs=7)]: Batch computation too fast (0.1708s.) Setting batch_size=4.


[CV] kernel=rbf, C=0.001, gamma=31.6227766017 ........................
[CV] kernel=linear, C=0.001, gamma=1.0 ...............................
[CV] kernel=linear, C=0.001, gamma=1.0 ...............................
[CV] kernel=linear, C=0.001, gamma=1.0 ...............................
[CV]  kernel=linear, C=0.001, gamma=0.0316227766017, score=0.753021 -   0.0s
[CV]  kernel=rbf, C=0.001, gamma=31.6227766017, score=0.727044 -   0.0s
[CV] kernel=rbf, C=0.001, gamma=31.6227766017 ........................
[CV] ......... kernel=rbf, C=0.001, gamma=1.0, score=0.764256 -   0.1s
[CV] kernel=rbf, C=0.001, gamma=31.6227766017 ........................
[CV] ...... kernel=linear, C=0.001, gamma=1.0, score=0.766143 -   0.0s
[CV] ...... kernel=linear, C=0.001, gamma=1.0, score=0.822769 -   0.0s
[CV] ......... kernel=rbf, C=0.001, gamma=1.0, score=0.754717 -   0.1s
[CV] ...... kernel=linear, C=0.001, gamma=1.0, score=0.818344 -   0.0s
[CV] kernel=rbf, C=0.001, gamma=31.6227766017 ........................

[Parallel(n_jobs=7)]: Done  26 tasks      | elapsed:    0.4s


[CV]  kernel=rbf, C=0.0316227766017, gamma=0.0316227766017, score=0.749205 -   0.0s
[CV]  kernel=rbf, C=0.0316227766017, gamma=0.001, score=0.715618 -   0.0s
[CV] kernel=rbf, C=0.0316227766017, gamma=0.001 ......................
[CV] kernel=rbf, C=0.001, gamma=1000.0 ...............................
[CV] kernel=rbf, C=0.0316227766017, gamma=0.0316227766017 ............
[CV] kernel=linear, C=0.001, gamma=1000.0 ............................
[CV] ...... kernel=rbf, C=0.001, gamma=1000.0, score=0.641403 -   0.0s
[CV] kernel=linear, C=0.001, gamma=1000.0 ............................
[CV] ... kernel=linear, C=0.001, gamma=1000.0, score=0.822769 -   0.0s
[CV]  kernel=rbf, C=0.0316227766017, gamma=0.001, score=0.658045 -   0.0s
[CV]  kernel=rbf, C=0.0316227766017, gamma=0.0316227766017, score=0.780369 -   0.0s
[CV] kernel=linear, C=0.001, gamma=1000.0 ............................
[CV] kernel=rbf, C=0.0316227766017, gamma=0.001 ......................
[CV] kernel=rbf, C=0.0316227766017, gamma=0.0

[Parallel(n_jobs=7)]: Done  50 tasks      | elapsed:    0.7s


[CV] kernel=rbf, C=0.0316227766017, gamma=31.6227766017 ..............
[CV] kernel=rbf, C=0.0316227766017, gamma=1.0 ........................
[CV]  kernel=rbf, C=0.0316227766017, gamma=31.6227766017, score=0.695357 -   0.0s
[CV]  kernel=rbf, C=0.0316227766017, gamma=1.0, score=0.760653 -   0.0s
[CV] kernel=rbf, C=0.0316227766017, gamma=31.6227766017 ..............
[CV] kernel=linear, C=0.0316227766017, gamma=31.6227766017 ...........
[CV]  kernel=rbf, C=0.0316227766017, gamma=31.6227766017, score=0.708713 -   0.0s
[CV]  kernel=linear, C=0.0316227766017, gamma=0.0316227766017, score=0.819165 -   0.1s
[CV]  kernel=linear, C=0.0316227766017, gamma=0.001, score=0.819165 -   0.1s
[CV] kernel=rbf, C=0.0316227766017, gamma=31.6227766017 ..............
[CV] kernel=linear, C=0.0316227766017, gamma=0.0316227766017 .........
[CV] kernel=rbf, C=0.0316227766017, gamma=1000.0 .....................
[CV]  kernel=linear, C=0.0316227766017, gamma=0.001, score=0.856477 -   0.1s
[CV] kernel=rbf, C=0.03162

[Parallel(n_jobs=7)]: Done  86 tasks      | elapsed:    1.4s


[CV] kernel=rbf, C=1.0, gamma=0.0316227766017 ........................
[CV] kernel=linear, C=0.0316227766017, gamma=1000.0 ..................
[CV] kernel=linear, C=1.0, gamma=0.0316227766017 .....................
[CV]  kernel=rbf, C=1.0, gamma=0.0316227766017, score=0.778673 -   0.0s
[CV] kernel=linear, C=1.0, gamma=0.0316227766017 .....................
[CV]  kernel=linear, C=0.0316227766017, gamma=1000.0, score=0.820649 -   0.4s
[CV] kernel=linear, C=0.0316227766017, gamma=1000.0 ..................
[CV]  kernel=linear, C=0.0316227766017, gamma=31.6227766017, score=0.820649 -   0.4s
[CV] kernel=linear, C=0.0316227766017, gamma=31.6227766017 ...........
[CV]  kernel=linear, C=0.0316227766017, gamma=1000.0, score=0.819165 -   0.1s
[CV] kernel=rbf, C=1.0, gamma=1.0 ....................................
[CV]  kernel=linear, C=0.0316227766017, gamma=1000.0, score=0.856477 -   0.1s
[CV] kernel=rbf, C=1.0, gamma=0.001 ..................................
[CV] ........... kernel=rbf, C=1.0, gamma

[Parallel(n_jobs=7)]: Batch computation too slow (2.6094s.) Setting batch_size=2.


[CV]  kernel=linear, C=1.0, gamma=31.6227766017, score=0.905765 -   4.8s
[CV] kernel=linear, C=1.0, gamma=31.6227766017 .......................
[CV] ...... kernel=linear, C=1.0, gamma=0.001, score=0.803053 -   3.9s
[CV] kernel=linear, C=1.0, gamma=0.001 ...............................
[CV] ........ kernel=linear, C=1.0, gamma=1.0, score=0.803053 -   3.8s
[CV] kernel=linear, C=1.0, gamma=1.0 .................................
[CV]  kernel=linear, C=1.0, gamma=31.6227766017, score=0.835913 -   1.2s
[CV] kernel=linear, C=1.0, gamma=31.6227766017 .......................
[CV]  kernel=linear, C=1.0, gamma=0.0316227766017, score=0.822537 -   1.8s
[CV] kernel=linear, C=1.0, gamma=0.0316227766017 .....................
[CV] ...... kernel=linear, C=1.0, gamma=0.001, score=0.835913 -   1.1s
[CV] kernel=linear, C=1.0, gamma=0.001 ...............................
[CV]  kernel=linear, C=1.0, gamma=31.6227766017, score=0.822537 -   1.7s
[CV] ........ kernel=linear, C=1.0, gamma=1.0, score=0.835913 -   1

[Parallel(n_jobs=7)]: Done 130 tasks      | elapsed:   12.1s


[CV]  kernel=linear, C=1.0, gamma=0.0316227766017, score=0.803053 -   4.1s
[CV] kernel=linear, C=31.6227766017, gamma=0.001 .....................
[CV]  kernel=linear, C=1.0, gamma=31.6227766017, score=0.803053 -   4.1s
[CV] kernel=rbf, C=31.6227766017, gamma=0.0316227766017 ..............
[CV]  kernel=rbf, C=31.6227766017, gamma=0.0316227766017, score=0.787789 -   0.1s
[CV] kernel=rbf, C=31.6227766017, gamma=0.0316227766017 ..............
[CV]  kernel=rbf, C=31.6227766017, gamma=0.0316227766017, score=0.774009 -   0.0s
[CV] kernel=rbf, C=31.6227766017, gamma=0.0316227766017 ..............
[CV]  kernel=rbf, C=31.6227766017, gamma=0.0316227766017, score=0.799661 -   0.0s
[CV] kernel=linear, C=31.6227766017, gamma=0.0316227766017 ...........
[CV]  kernel=linear, C=1.0, gamma=31.6227766017, score=0.850329 -   6.4s
[CV] kernel=rbf, C=1.0, gamma=1000.0 .................................
[CV] ........ kernel=rbf, C=1.0, gamma=1000.0, score=0.695912 -   0.0s
[CV] kernel=rbf, C=1.0, gamma=1000.0

[Parallel(n_jobs=7)]: Batch computation too slow (3.5466s.) Setting batch_size=1.


[CV] . kernel=rbf, C=31.6227766017, gamma=1.0, score=0.785457 -   0.1s
[CV] kernel=linear, C=31.6227766017, gamma=1.0 .......................
[CV] ..... kernel=linear, C=1.0, gamma=1000.0, score=0.835913 -   1.5s
[CV] kernel=linear, C=1.0, gamma=1000.0 ..............................
[CV] ..... kernel=linear, C=1.0, gamma=1000.0, score=0.850329 -   6.5s
[CV] kernel=linear, C=31.6227766017, gamma=1.0 .......................
[CV]  kernel=linear, C=31.6227766017, gamma=0.001, score=0.905136 - 1.2min
[CV] kernel=linear, C=31.6227766017, gamma=0.001 .....................
[CV]  kernel=linear, C=31.6227766017, gamma=0.0316227766017, score=0.905136 - 1.2min
[CV] kernel=linear, C=31.6227766017, gamma=1.0 .......................
[CV]  kernel=linear, C=31.6227766017, gamma=1.0, score=0.905136 - 1.2min
[CV] kernel=rbf, C=31.6227766017, gamma=31.6227766017 ................
[CV]  kernel=rbf, C=31.6227766017, gamma=31.6227766017, score=0.754822 -   0.0s
[CV] kernel=rbf, C=31.6227766017, gamma=31.62277

[Parallel(n_jobs=7)]: Done 166 tasks      | elapsed:  1.5min


[CV]  kernel=linear, C=31.6227766017, gamma=0.001, score=0.834429 - 1.4min
[CV] kernel=linear, C=31.6227766017, gamma=0.001 .....................
[CV]  kernel=linear, C=31.6227766017, gamma=0.0316227766017, score=0.834429 - 1.4min
[CV] kernel=linear, C=31.6227766017, gamma=0.0316227766017 ...........
[CV]  kernel=linear, C=31.6227766017, gamma=0.0316227766017, score=0.826101 - 1.5min
[CV] kernel=linear, C=31.6227766017, gamma=0.0316227766017 ...........
[CV]  kernel=linear, C=31.6227766017, gamma=1.0, score=0.826101 - 1.5min
[CV] kernel=linear, C=31.6227766017, gamma=1.0 .......................
[CV]  kernel=linear, C=31.6227766017, gamma=31.6227766017, score=0.905136 - 1.1min
[CV] kernel=linear, C=31.6227766017, gamma=31.6227766017 .............
[CV]  kernel=linear, C=31.6227766017, gamma=0.001, score=0.852449 -  58.8s
[CV] kernel=rbf, C=31.6227766017, gamma=0.0316227766017 ..............
[CV]  kernel=rbf, C=31.6227766017, gamma=0.0316227766017, score=0.822956 -   0.0s
[CV] kernel=rbf,

[Parallel(n_jobs=7)]: Done 187 tasks      | elapsed:  3.7min


[CV]  kernel=linear, C=31.6227766017, gamma=31.6227766017, score=0.826101 - 1.3min
[CV] kernel=linear, C=31.6227766017, gamma=1000.0 ....................
[CV]  kernel=linear, C=31.6227766017, gamma=31.6227766017, score=0.834429 - 1.2min
[CV] kernel=linear, C=31.6227766017, gamma=1000.0 ....................
[CV]  kernel=linear, C=31.6227766017, gamma=31.6227766017, score=0.804325 - 1.7min
[CV] kernel=linear, C=31.6227766017, gamma=1000.0 ....................
[CV]  kernel=linear, C=31.6227766017, gamma=31.6227766017, score=0.852449 - 1.0min
[CV] kernel=rbf, C=1000.0, gamma=0.001 ...............................
[CV] ...... kernel=rbf, C=1000.0, gamma=0.001, score=0.836583 -   0.3s
[CV] kernel=rbf, C=1000.0, gamma=0.001 ...............................
[CV] ...... kernel=rbf, C=1000.0, gamma=0.001, score=0.829245 -   0.3s
[CV] kernel=rbf, C=1000.0, gamma=0.001 ...............................
[CV] ...... kernel=rbf, C=1000.0, gamma=0.001, score=0.811957 -   0.4s
[CV] kernel=rbf, C=1000.0, ga

[Parallel(n_jobs=7)]: Done 203 tasks      | elapsed:  5.3min


[CV]  kernel=linear, C=31.6227766017, gamma=1000.0, score=0.852449 - 1.0min
[CV] kernel=rbf, C=1000.0, gamma=0.0316227766017 .....................
[CV]  kernel=rbf, C=1000.0, gamma=0.0316227766017, score=0.808910 -   0.2s
[CV] kernel=rbf, C=1000.0, gamma=0.0316227766017 .....................
[CV]  kernel=rbf, C=1000.0, gamma=0.0316227766017, score=0.740147 -   0.2s
[CV] kernel=rbf, C=1000.0, gamma=0.0316227766017 .....................
[CV]  kernel=rbf, C=1000.0, gamma=0.0316227766017, score=0.736909 -   0.2s
[CV] kernel=rbf, C=1000.0, gamma=0.0316227766017 .....................
[CV]  kernel=rbf, C=1000.0, gamma=0.0316227766017, score=0.748569 -   0.3s
[CV] kernel=rbf, C=1000.0, gamma=0.0316227766017 .....................
[CV]  kernel=rbf, C=1000.0, gamma=0.0316227766017, score=0.742209 -   1.0s
[CV] kernel=linear, C=1000.0, gamma=0.0316227766017 ..................
[CV]  kernel=linear, C=31.6227766017, gamma=1000.0, score=0.804325 - 1.7min
[CV] kernel=linear, C=1000.0, gamma=0.031622776

[Parallel(n_jobs=7)]: Done 218 tasks      | elapsed: 14.1min


[CV]  kernel=linear, C=1000.0, gamma=0.0316227766017, score=0.856689 - 4.6min
[CV] kernel=linear, C=1000.0, gamma=1.0 ..............................
[CV] ... kernel=linear, C=1000.0, gamma=0.001, score=0.890671 -11.3min
[CV] kernel=linear, C=1000.0, gamma=1.0 ..............................
[CV]  kernel=linear, C=1000.0, gamma=0.0316227766017, score=0.890671 -11.5min
[CV] kernel=linear, C=1000.0, gamma=1.0 ..............................
[CV]  kernel=linear, C=1000.0, gamma=0.0316227766017, score=0.824677 - 9.5min
[CV] kernel=linear, C=1000.0, gamma=1.0 ..............................
[CV] ..... kernel=linear, C=1000.0, gamma=1.0, score=0.856689 - 4.4min
[CV] kernel=rbf, C=1000.0, gamma=31.6227766017 .......................
[CV]  kernel=rbf, C=1000.0, gamma=31.6227766017, score=0.754298 -   0.0s
[CV] kernel=rbf, C=1000.0, gamma=31.6227766017 .......................
[CV]  kernel=rbf, C=1000.0, gamma=31.6227766017, score=0.660377 -   0.1s
[CV] kernel=rbf, C=1000.0, gamma=31.6227766017 .....

[Parallel(n_jobs=7)]: Done 233 tasks      | elapsed: 27.8min


[CV]  kernel=linear, C=1000.0, gamma=31.6227766017, score=0.804507 - 6.4min
[CV] kernel=rbf, C=1000.0, gamma=1000.0 ..............................
[CV] ..... kernel=rbf, C=1000.0, gamma=1000.0, score=0.692767 -   0.0s
[CV] kernel=rbf, C=1000.0, gamma=1000.0 ..............................
[CV] ..... kernel=rbf, C=1000.0, gamma=1000.0, score=0.623166 -   0.0s
[CV] kernel=rbf, C=1000.0, gamma=1000.0 ..............................
[CV] ..... kernel=rbf, C=1000.0, gamma=1000.0, score=0.607272 -   0.0s
[CV] kernel=rbf, C=1000.0, gamma=1000.0 ..............................
[CV] ..... kernel=rbf, C=1000.0, gamma=1000.0, score=0.636845 -   0.0s
[CV] kernel=rbf, C=1000.0, gamma=1000.0 ..............................
[CV] ..... kernel=rbf, C=1000.0, gamma=1000.0, score=0.640237 -   0.0s
[CV] kernel=linear, C=1000.0, gamma=1000.0 ...........................
[CV]  kernel=linear, C=1000.0, gamma=31.6227766017, score=0.856689 - 4.6min
[CV] kernel=linear, C=1000.0, gamma=1000.0 ........................

[Parallel(n_jobs=7)]: Done 250 out of 250 | elapsed: 46.6min finished


In [None]:
GridsearchSVM.best_params_

In [None]:
GridsearchSVM.best_score_

In [None]:
GridsearchSVM.predict(X_test)

In [None]:
GridsearchSVM.score(X_test,y_test)