# Set Up

## Load libraries

In [87]:
import pandas as pd
import sklearn

from sklearn.model_selection import cross_val_score, GridSearchCV
from sklearn.linear_model import LogisticRegression
from sklearn import svm
from sklearn.tree import DecisionTreeClassifier
from sklearn.ensemble import RandomForestClassifier, AdaBoostClassifier, GradientBoostingClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn.neural_network import MLPClassifier
from sklearn.naive_bayes import GaussianNB
from sklearn.decomposition import PCA

## Read in data

In [5]:
df = pd.read_csv("voice.csv")
df.head()

Unnamed: 0,meanfreq,sd,median,Q25,Q75,IQR,skew,kurt,sp.ent,sfm,...,centroid,meanfun,minfun,maxfun,meandom,mindom,maxdom,dfrange,modindx,label
0,0.059781,0.064241,0.032027,0.015071,0.090193,0.075122,12.863462,274.402906,0.893369,0.491918,...,0.059781,0.084279,0.015702,0.275862,0.007812,0.007812,0.007812,0.0,0.0,male
1,0.066009,0.06731,0.040229,0.019414,0.092666,0.073252,22.423285,634.613855,0.892193,0.513724,...,0.066009,0.107937,0.015826,0.25,0.009014,0.007812,0.054688,0.046875,0.052632,male
2,0.077316,0.083829,0.036718,0.008701,0.131908,0.123207,30.757155,1024.927705,0.846389,0.478905,...,0.077316,0.098706,0.015656,0.271186,0.00799,0.007812,0.015625,0.007812,0.046512,male
3,0.151228,0.072111,0.158011,0.096582,0.207955,0.111374,1.232831,4.177296,0.963322,0.727232,...,0.151228,0.088965,0.017798,0.25,0.201497,0.007812,0.5625,0.554688,0.247119,male
4,0.13512,0.079146,0.124656,0.07872,0.206045,0.127325,1.101174,4.333713,0.971955,0.783568,...,0.13512,0.106398,0.016931,0.266667,0.712812,0.007812,5.484375,5.476562,0.208274,male


In [23]:
X = df.loc[:, df.columns != 'label']
X.head()

Unnamed: 0,meanfreq,sd,median,Q25,Q75,IQR,skew,kurt,sp.ent,sfm,mode,centroid,meanfun,minfun,maxfun,meandom,mindom,maxdom,dfrange,modindx
0,0.059781,0.064241,0.032027,0.015071,0.090193,0.075122,12.863462,274.402906,0.893369,0.491918,0.0,0.059781,0.084279,0.015702,0.275862,0.007812,0.007812,0.007812,0.0,0.0
1,0.066009,0.06731,0.040229,0.019414,0.092666,0.073252,22.423285,634.613855,0.892193,0.513724,0.0,0.066009,0.107937,0.015826,0.25,0.009014,0.007812,0.054688,0.046875,0.052632
2,0.077316,0.083829,0.036718,0.008701,0.131908,0.123207,30.757155,1024.927705,0.846389,0.478905,0.0,0.077316,0.098706,0.015656,0.271186,0.00799,0.007812,0.015625,0.007812,0.046512
3,0.151228,0.072111,0.158011,0.096582,0.207955,0.111374,1.232831,4.177296,0.963322,0.727232,0.083878,0.151228,0.088965,0.017798,0.25,0.201497,0.007812,0.5625,0.554688,0.247119
4,0.13512,0.079146,0.124656,0.07872,0.206045,0.127325,1.101174,4.333713,0.971955,0.783568,0.104261,0.13512,0.106398,0.016931,0.266667,0.712812,0.007812,5.484375,5.476562,0.208274


In [22]:
y = df['label']
y.head()

0    male
1    male
2    male
3    male
4    male
Name: label, dtype: object

### Test/train split for grid searches

In [54]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.20, random_state=101)

# Model Comparisons

## Logistic Regression

In [30]:
lm_model = LogisticRegression()
lm_scores = cross_val_score(lm_model, X, y, cv=10)
print("Logistic Regression CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (lm_scores.mean()*100, lm_scores.std() * 2*100))

Logistic Regression CV Accuracy: 89.44% (+/- 18.25%)


## SVM

In [37]:
svm_model = svm.SVC(kernel='linear')
svm_scores = cross_val_score(svm_model, X, y, cv=10)
print("Support Vector Machine CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (svm_scores.mean()*100, svm_scores.std() * 2*100))

Support Vector Machine CV Accuracy: 91.93% (+/- 15.34%)


## CART

In [41]:
CART_model = DecisionTreeClassifier(random_state=0)
CART_scores = cross_val_score(CART_model, X, y, cv=10)
print("CART CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (CART_scores.mean()*100, CART_scores.std() * 2*100))

CART CV Accuracy: 94.99% (+/- 6.51%)


## Random Forest

** Modify once we cover Random Forest **

In [55]:
param_grid = {'max_depth': [3,5,7],
              'n_estimators':[3,5,10,20,30,40],
              'criterion': ['gini', 'entropy']}
random_forest_model = GridSearchCV(RandomForestClassifier(),param_grid,refit=True,verbose=4)
random_forest_model = random_forest_model.fit(X_train, y_train)
print("Best score: %s" % (random_forest_model.best_score_))
print("Best parameter set: %s" % (random_forest_model.best_params_))

Fitting 3 folds for each of 36 candidates, totalling 108 fits
[CV] criterion=gini, max_depth=3, n_estimators=3 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=3, score=0.936094674556213, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=3 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=3, score=0.9633136094674556, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=3 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=3, score=0.9597156398104265, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=5 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=5, score=0.9526627218934911, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=5 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=5, score=0.9644970414201184, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=5 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=5, score=0

[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.1s remaining:    0.0s


[CV]  criterion=gini, max_depth=3, n_estimators=10, score=0.9514218009478673, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=20 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=20, score=0.9633136094674556, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=20 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=20, score=0.9751479289940829, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=20 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=20, score=0.9609004739336493, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=30 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=30, score=0.9668639053254438, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=30 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=30, score=0.9763313609467456, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=30 ....................
[CV]  criterion=gini, 

[CV] criterion=entropy, max_depth=3, n_estimators=10 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=10, score=0.8708530805687204, total=   0.0s
[CV] criterion=entropy, max_depth=3, n_estimators=20 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=20, score=0.9633136094674556, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=20 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=20, score=0.9822485207100592, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=20 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=20, score=0.9620853080568721, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=30 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=30, score=0.9609467455621302, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=30 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=30, score=0.9739644970414201, total=   0.1s
[CV]

[Parallel(n_jobs=1)]: Done 108 out of 108 | elapsed:    7.9s finished


In [56]:
random_forest_model = RandomForestClassifier(max_depth=7, criterion='entropy', n_estimators=10, random_state=0)
random_forest_scores = cross_val_score(random_forest_model, X, y, cv=10)
print("Random Forest CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (random_forest_scores.mean()*100, random_forest_scores.std() * 2*100))

Random Forest CV Accuracy: 96.18% (+/- 5.30%)


## Nearest Neighbors

In [59]:
param_grid = {'n_neighbors': [3,5,7,9,11,13,15]}
nearest_neighbors_model = GridSearchCV(KNeighborsClassifier(),param_grid,refit=True,verbose=4)
nearest_neighbors_model = nearest_neighbors_model.fit(X_train, y_train)
print("Best score: %s" % (nearest_neighbors_model.best_score_))
print("Best parameter set: %s" % (nearest_neighbors_model.best_params_))

Fitting 3 folds for each of 7 candidates, totalling 21 fits
[CV] n_neighbors=3 ...................................................
[CV] .......... n_neighbors=3, score=0.7124260355029586, total=   0.0s
[CV] n_neighbors=3 ...................................................
[CV] .......... n_neighbors=3, score=0.7159763313609467, total=   0.0s
[CV] n_neighbors=3 ...................................................
[CV] .......... n_neighbors=3, score=0.7002369668246445, total=   0.0s
[CV] n_neighbors=5 ...................................................
[CV] .......... n_neighbors=5, score=0.6946745562130178, total=   0.0s
[CV] n_neighbors=5 ...................................................
[CV] .......... n_neighbors=5, score=0.7112426035502959, total=   0.0s
[CV] n_neighbors=5 ...................................................
[CV] .......... n_neighbors=5, score=0.6990521327014217, total=   0.0s
[CV] n_neighbors=7 ...................................................
[CV] .......... n

[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.1s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.1s remaining:    0.0s


[CV] .......... n_neighbors=7, score=0.7041420118343196, total=   0.0s
[CV] n_neighbors=7 ...................................................
[CV] .......... n_neighbors=7, score=0.6883886255924171, total=   0.0s
[CV] n_neighbors=9 ...................................................
[CV] .......... n_neighbors=9, score=0.6994082840236686, total=   0.0s
[CV] n_neighbors=9 ...................................................
[CV] ........... n_neighbors=9, score=0.714792899408284, total=   0.0s
[CV] n_neighbors=9 ...................................................
[CV] .......... n_neighbors=9, score=0.6883886255924171, total=   0.0s
[CV] n_neighbors=11 ..................................................
[CV] ......... n_neighbors=11, score=0.7005917159763314, total=   0.0s
[CV] n_neighbors=11 ..................................................
[CV] ......... n_neighbors=11, score=0.7017751479289941, total=   0.0s
[CV] n_neighbors=11 ..................................................
[CV] .

[Parallel(n_jobs=1)]: Done  21 out of  21 | elapsed:    0.6s finished


In [60]:
nearest_neighbors_model = KNeighborsClassifier(n_neighbors=3)
nearest_neighbors_scores = cross_val_score(nearest_neighbors_model, X, y, cv=10)
print("Nearest Neighbors CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (nearest_neighbors_scores.mean()*100, nearest_neighbors_scores.std() * 2*100))

Nearest Neighbors CV Accuracy: 68.79% (+/- 11.95%)


## Neural Network

In [73]:
param_grid = {'hidden_layer_sizes': [2, 4, 8, 16, 32, 64],
              'alpha': [0.0001, 0.001,0.01,0.1,1,10],
              'solver' : ['lbfgs', 'adam'],
              'activation': ['logistic']}

neural_network_model = GridSearchCV(MLPClassifier(random_state=0),param_grid,refit=True,verbose=4)
neural_network_model = neural_network_model.fit(X_train, y_train)
print("Best score: %s" % (neural_network_model.best_score_))
print("Best parameter set: %s" % (neural_network_model.best_params_))

Fitting 3 folds for each of 72 candidates, totalling 216 fits
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs, score=0.8355029585798817, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs 


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.2s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.4s remaining:    0.0s


[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs, score=0.919526627218935, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs, score=0.8649289099526066, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam 


[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.5s remaining:    0.0s


[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam, score=0.7905325443786982, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam, score=0.7751479289940828, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam, score=0.7665876777251185, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs, score=0.9183431952662722, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs, score=0.9396449704142011, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs, score=0.8696682464454977, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam, score=0.7739644970414201, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam, score=0.7550295857988165, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam, score=0.7322274881516587, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs, score=0.8319526627218935, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs, score=0.9325443786982248, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs, score=0.943127962085308, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam, score=0.8130177514792899, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam, score=0.7893491124260354, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam, score=0.7914691943127962, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=lbfgs, score=0.8899408284023669, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=lbfgs, score=0.9266272189349113, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=lbfgs, score=0.8637440758293838, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=adam, score=0.8248520710059172, total=   0.8s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=adam, score=0.8035502958579882, total=   0.8s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=16, solver=adam, score=0.8199052132701422, total=   0.8s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=lbfgs, score=0.808284023668639, total=   0.4s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=lbfgs, score=0.9230769230769231, total=   0.4s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=lbfgs, score=0.8151658767772512, total=   0.3s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=adam, score=0.8579881656804734, total=   0.9s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=adam, score=0.8473372781065088, total=   0.8s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=32, solver=adam, score=0.8483412322274881, total=   0.9s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=lbfgs, score=0.808284023668639, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=lbfgs, score=0.8532544378698225, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=lbfgs, score=0.8258293838862559, total=   0.6s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=adam, score=0.8994082840236687, total=   1.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=adam, score=0.8804733727810651, total=   1.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=64, solver=adam, score=0.8838862559241706, total=   1.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=lbfgs, score=0.8520710059171598, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=lbfgs, score=0.914792899408284, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=lbfgs, score=0.8969194312796208, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam, score=0.7905325443786982, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam, score=0.7751479289940828, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam, score=0.7665876777251185, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs, score=0.9230769230769231, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs, score=0.9183431952662722, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs, score=0.8862559241706162, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam, score=0.7727810650887574, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam, score=0.7550295857988165, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam, score=0.7322274881516587, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs, score=0.8579881656804734, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs, score=0.9337278106508876, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs, score=0.8471563981042654, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam, score=0.8130177514792899, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam, score=0.7893491124260354, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam, score=0.7914691943127962, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=lbfgs, score=0.8698224852071006, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=lbfgs, score=0.9076923076923077, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=lbfgs, score=0.7879146919431279, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=adam, score=0.821301775147929, total=   0.7s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=adam, score=0.8059171597633136, total=   0.7s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=16, solver=adam, score=0.8199052132701422, total=   0.7s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=lbfgs, score=0.8721893491124261, total=   0.3s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=lbfgs, score=0.906508875739645, total=   0.3s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=lbfgs, score=0.7748815165876777, total=   0.3s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=adam, score=0.8579881656804734, total=   0.8s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=adam, score=0.8461538461538461, total=   0.8s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=32, solver=adam, score=0.8483412322274881, total=   0.8s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=lbfgs, score=0.7940828402366864, total=   0.6s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=lbfgs, score=0.8497041420118343, total=   0.7s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=lbfgs, score=0.8139810426540285, total=   0.6s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=adam, score=0.8970414201183432, total=   1.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=adam, score=0.8804733727810651, total=   1.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=64, solver=adam, score=0.8838862559241706, total=   1.4s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=lbfgs, score=0.7917159763313609, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=lbfgs, score=0.9230769230769231, total=   0.1s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=lbfgs, score=0.7784360189573459, total=   0.1s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam, score=0.7893491124260354, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam, score=0.7727810650887574, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam, score=0.7654028436018957, total=   0.7s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs, score=0.9230769230769231, total=   0.3s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs, score=0.9242603550295858, total=   0.3s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs, score=0.9016587677725119, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam, score=0.7668639053254438, total=   0.8s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam, score=0.7562130177514793, total=   0.8s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam, score=0.7345971563981043, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs, score=0.8710059171597633, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs, score=0.914792899408284, total=   0.3s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs, score=0.8459715639810427, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam, score=0.8130177514792899, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam, score=0.7881656804733728, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam, score=0.7914691943127962, total=   0.8s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=lbfgs, score=0.8544378698224852, total=   0.4s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=lbfgs, score=0.9159763313609467, total=   0.4s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=lbfgs, score=0.830568720379147, total=   0.4s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=adam, score=0.8189349112426035, total=   0.8s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=adam, score=0.8047337278106509, total=   0.9s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=16, solver=adam, score=0.8116113744075829, total=   0.9s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=lbfgs, score=0.8568047337278106, total=   0.4s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=lbfgs, score=0.7692307692307693, total=   0.3s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=lbfgs, score=0.9241706161137441, total=   0.3s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=adam, score=0.855621301775148, total=   0.8s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=adam, score=0.8437869822485207, total=   1.0s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=32, solver=adam, score=0.8459715639810427, total=   0.9s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=lbfgs, score=0.8023668639053254, total=   0.7s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=lbfgs, score=0.8189349112426035, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=lbfgs, score=0.8447867298578199, total=   0.7s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=adam, score=0.8875739644970414, total=   1.1s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=adam, score=0.8769230769230769, total=   1.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=64, solver=adam, score=0.8779620853080569, total=   1.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=lbfgs, score=0.9171597633136095, total=   0.1s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=lbfgs, score=0.9396449704142011, total=   0.1s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=lbfgs, score=0.8270142180094787, total=   0.1s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam, score=0.778698224852071, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam, score=0.7597633136094675, total=   0.5s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam, score=0.7582938388625592, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs, score=0.9550295857988166, total=   0.1s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs, score=0.8532544378698225, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs, score=0.8459715639810427, total=   0.1s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam, score=0.7502958579881657, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam, score=0.7479289940828402, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam, score=0.7215639810426541, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs, score=0.9325443786982248, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs, score=0.9159763313609467, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs, score=0.8270142180094787, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam, score=0.7869822485207101, total=   0.5s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam, score=0.7715976331360946, total=   0.5s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam, score=0.7654028436018957, total=   0.5s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=lbfgs, score=0.8615384615384616, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=lbfgs, score=0.8627218934911243, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=lbfgs, score=0.8507109004739336, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=adam, score=0.7988165680473372, total=   0.7s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=adam, score=0.7928994082840237, total=   0.7s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=16, solver=adam, score=0.7701421800947867, total=   0.7s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=lbfgs, score=0.7976331360946746, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=lbfgs, score=0.8260355029585799, total=   0.3s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=lbfgs, score=0.8495260663507109, total=   0.3s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=adam, score=0.8236686390532545, total=   0.8s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=adam, score=0.8153846153846154, total=   0.8s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=32, solver=adam, score=0.8127962085308057, total=   0.8s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=lbfgs, score=0.8402366863905325, total=   0.6s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=lbfgs, score=0.850887573964497, total=   0.6s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=lbfgs, score=0.8045023696682464, total=   0.7s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=adam 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=adam, score=0.7005917159763314, total=   0.6s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=64, solver=adam 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=64,



[CV]  activation=logistic, alpha=1, hidden_layer_sizes=2, solver=adam, score=0.6982248520710059, total=   0.7s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=2, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=2, solver=adam, score=0.6895734597156398, total=   0.7s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=lbfgs, score=0.8402366863905325, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=lbfgs, score=0.9029585798816568, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=lbfgs, score=0.8483412322274881, total=   0.1s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam, score=0.6686390532544378, total=   0.5s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam, score=0.6710059171597633, total=   0.6s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam, score=0.6421800947867299, total=   0.7s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs, score=0.8355029585798817, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs, score=0.8710059171597633, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs, score=0.8933649289099526, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam, score=0.7076923076923077, total=   0.5s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam, score=0.7076923076923077, total=   0.5s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam, score=0.6943127962085308, total=   0.5s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=16, solver=lbfgs, score=0.7905325443786982, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=16, solver=lbfgs, score=0.7751479289940828, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=16, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=16, solver=lbfgs, score=0.8045023696682464, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=16, solver=adam 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=16, solver=adam, score=0.685207100591716, total=   0.5s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=16, solver=adam 




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=16, solver=adam, score=0.6994082840236686, total=   0.7s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=16, solver=adam 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=16, solver=adam, score=0.6729857819905213, total=   0.7s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=32, solver=lbfgs, score=0.7751479289940828, total=   0.4s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=32, solver=lbfgs, score=0.8650887573964497, total=   0.3s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=32, solver=lbfgs, score=0.7819905213270142, total=   0.3s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=32, solver=adam 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=32, solver=adam, score=0

[CV]  activation=logistic, alpha=10, hidden_layer_sizes=64, solver=lbfgs, score=0.7171597633136094, total=   0.6s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=64, solver=lbfgs 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=64, solver=lbfgs, score=0.7049763033175356, total=   0.6s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=64, solver=adam 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=64, solver=adam, score=0.6497041420118344, total=   0.2s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=64, solver=adam 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=64, solver=adam, score=0.6792899408284023, total=   0.2s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=64, solver=adam 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=64, solver=adam, score=0.6670616113744076, total=   0.2s
Best score: 0.9163378058405682
Best parameter set: {'activation': 'logistic', 'alpha': 0.01, 'hidden_layer_sizes': 4, 'solver': 'lbfgs'}


[Parallel(n_jobs=1)]: Done 216 out of 216 | elapsed:  1.6min finished


In [75]:
neural_network_model = MLPClassifier(activation='logistic', solver='lbfgs', alpha=0.01, hidden_layer_sizes=4, random_state=0)
neural_network_scores = cross_val_score(neural_network_model, X, y, cv=10)
print("Neural Network CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (neural_network_scores.mean()*100, neural_network_scores.std() * 2*100))

Neural Network CV Accuracy: 87.04% (+/- 18.04%)


## Boosted Trees

### AdaBoost Tree

In [79]:
param_grid = {'n_estimators': [10,50,100,150,200,250,300,350,400]}
adaboost_model = GridSearchCV(AdaBoostClassifier(),param_grid,refit=True,verbose=4)
adaboost_model = adaboost_model.fit(X_train, y_train)
print("Best score: %s" % (adaboost_model.best_score_))
print("Best parameter set: %s" % (adaboost_model.best_params_))

Fitting 3 folds for each of 9 candidates, totalling 27 fits
[CV] n_estimators=10 .................................................
[CV] ........ n_estimators=10, score=0.9633136094674556, total=   0.1s
[CV] n_estimators=10 .................................................
[CV] ........ n_estimators=10, score=0.9680473372781065, total=   0.1s
[CV] n_estimators=10 .................................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.1s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.2s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.3s remaining:    0.0s


[CV] ........ n_estimators=10, score=0.9644549763033176, total=   0.1s
[CV] n_estimators=50 .................................................
[CV] ........ n_estimators=50, score=0.9727810650887574, total=   0.3s
[CV] n_estimators=50 .................................................
[CV] ......... n_estimators=50, score=0.978698224852071, total=   0.4s
[CV] n_estimators=50 .................................................
[CV] ........ n_estimators=50, score=0.9715639810426541, total=   0.4s
[CV] n_estimators=100 ................................................
[CV] ....... n_estimators=100, score=0.9775147928994082, total=   0.6s
[CV] n_estimators=100 ................................................
[CV] ....... n_estimators=100, score=0.9810650887573964, total=   0.6s
[CV] n_estimators=100 ................................................
[CV] ....... n_estimators=100, score=0.9774881516587678, total=   0.5s
[CV] n_estimators=150 ................................................
[CV] .

[Parallel(n_jobs=1)]: Done  27 out of  27 | elapsed:   32.2s finished


Best score: 0.9818468823993686
Best parameter set: {'n_estimators': 400}


In [81]:
adaboost_model = AdaBoostClassifier(n_estimators=200)
adaboost_model_scores = cross_val_score(adaboost_model, X, y, cv=10)
print("AdaBoost Tree CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (adaboost_model_scores.mean()*100, adaboost_model_scores.std() * 2*100))

AdaBoost Tree CV Accuracy: 96.06% (+/- 6.21%)


### Gradient Boosted Tree

In [83]:
param_grid = {'n_estimators': [10,50,100,150,200,250,300,350,400],
             'learning_rate': [0.001, 0.01, 0.1, 1, 10],
             'max_depth': [1,2,3,4,5]}
gb_tree_model = GridSearchCV(GradientBoostingClassifier(random_state=0),param_grid,refit=True,verbose=4)
gb_tree_model = gb_tree_model.fit(X_train, y_train)
print("Best score: %s" % (gb_tree_model.best_score_))
print("Best parameter set: %s" % (gb_tree_model.best_params_))

Fitting 3 folds for each of 225 candidates, totalling 675 fits
[CV] learning_rate=0.001, max_depth=1, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=10, score=0.9562130177514793, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=10, score=0.9538461538461539, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=10, score=0.9490521327014217, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=50, score=0.9562130177514793, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=50 ...............


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.1s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.1s remaining:    0.0s


[CV]  learning_rate=0.001, max_depth=1, n_estimators=50, score=0.9538461538461539, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=50, score=0.9490521327014217, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=100, score=0.9562130177514793, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=100, score=0.9538461538461539, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=100, score=0.9490521327014217, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=150 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=150, score=0.9562130177514793, total=   0.2s
[CV] learning_rate=0.001, max_depth=1, n_estimators=150 ...

[CV]  learning_rate=0.001, max_depth=2, n_estimators=400, score=0.9597156398104265, total=   0.9s
[CV] learning_rate=0.001, max_depth=3, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=10, score=0.9644970414201184, total=   0.0s
[CV] learning_rate=0.001, max_depth=3, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=10, score=0.9313609467455621, total=   0.0s
[CV] learning_rate=0.001, max_depth=3, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=10, score=0.9443127962085308, total=   0.0s
[CV] learning_rate=0.001, max_depth=3, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=50, score=0.9609467455621302, total=   0.2s
[CV] learning_rate=0.001, max_depth=3, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=50, score=0.9739644970414201, total=   0.2s
[CV] learning_rate=0.001, max_depth=3, n_estimators=50 .......

[CV]  learning_rate=0.001, max_depth=4, n_estimators=350, score=0.9656804733727811, total=   1.5s
[CV] learning_rate=0.001, max_depth=4, n_estimators=350 ..............
[CV]  learning_rate=0.001, max_depth=4, n_estimators=350, score=0.978698224852071, total=   1.7s
[CV] learning_rate=0.001, max_depth=4, n_estimators=350 ..............
[CV]  learning_rate=0.001, max_depth=4, n_estimators=350, score=0.9644549763033176, total=   1.6s
[CV] learning_rate=0.001, max_depth=4, n_estimators=400 ..............
[CV]  learning_rate=0.001, max_depth=4, n_estimators=400, score=0.9656804733727811, total=   1.9s
[CV] learning_rate=0.001, max_depth=4, n_estimators=400 ..............
[CV]  learning_rate=0.001, max_depth=4, n_estimators=400, score=0.978698224852071, total=   1.9s
[CV] learning_rate=0.001, max_depth=4, n_estimators=400 ..............
[CV]  learning_rate=0.001, max_depth=4, n_estimators=400, score=0.9632701421800948, total=   1.8s
[CV] learning_rate=0.001, max_depth=5, n_estimators=10 ....

[CV]  learning_rate=0.01, max_depth=1, n_estimators=250, score=0.9656804733727811, total=   0.3s
[CV] learning_rate=0.01, max_depth=1, n_estimators=250 ...............
[CV]  learning_rate=0.01, max_depth=1, n_estimators=250, score=0.9561611374407583, total=   0.3s
[CV] learning_rate=0.01, max_depth=1, n_estimators=300 ...............
[CV]  learning_rate=0.01, max_depth=1, n_estimators=300, score=0.9621301775147929, total=   0.3s
[CV] learning_rate=0.01, max_depth=1, n_estimators=300 ...............
[CV]  learning_rate=0.01, max_depth=1, n_estimators=300, score=0.9656804733727811, total=   0.3s
[CV] learning_rate=0.01, max_depth=1, n_estimators=300 ...............
[CV]  learning_rate=0.01, max_depth=1, n_estimators=300, score=0.9585308056872038, total=   0.3s
[CV] learning_rate=0.01, max_depth=1, n_estimators=350 ...............
[CV]  learning_rate=0.01, max_depth=1, n_estimators=350, score=0.9621301775147929, total=   0.4s
[CV] learning_rate=0.01, max_depth=1, n_estimators=350 ........

[CV]  learning_rate=0.01, max_depth=3, n_estimators=150, score=0.966824644549763, total=   0.5s
[CV] learning_rate=0.01, max_depth=3, n_estimators=200 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=200, score=0.9668639053254438, total=   0.6s
[CV] learning_rate=0.01, max_depth=3, n_estimators=200 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=200, score=0.9798816568047337, total=   0.7s
[CV] learning_rate=0.01, max_depth=3, n_estimators=200 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=200, score=0.966824644549763, total=   0.7s
[CV] learning_rate=0.01, max_depth=3, n_estimators=250 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=250, score=0.9704142011834319, total=   0.9s
[CV] learning_rate=0.01, max_depth=3, n_estimators=250 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=250, score=0.9798816568047337, total=   0.8s
[CV] learning_rate=0.01, max_depth=3, n_estimators=250 ..........

[CV]  learning_rate=0.01, max_depth=5, n_estimators=100, score=0.9692307692307692, total=   0.5s
[CV] learning_rate=0.01, max_depth=5, n_estimators=100 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=100, score=0.9822485207100592, total=   0.6s
[CV] learning_rate=0.01, max_depth=5, n_estimators=100 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=100, score=0.9620853080568721, total=   0.6s
[CV] learning_rate=0.01, max_depth=5, n_estimators=150 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=150, score=0.9692307692307692, total=   0.8s
[CV] learning_rate=0.01, max_depth=5, n_estimators=150 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=150, score=0.9810650887573964, total=   0.9s
[CV] learning_rate=0.01, max_depth=5, n_estimators=150 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=150, score=0.9680094786729858, total=   0.9s
[CV] learning_rate=0.01, max_depth=5, n_estimators=200 ........

[CV]  learning_rate=0.1, max_depth=2, n_estimators=50, score=0.9692307692307692, total=   0.1s
[CV] learning_rate=0.1, max_depth=2, n_estimators=50 .................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=50, score=0.9798816568047337, total=   0.1s
[CV] learning_rate=0.1, max_depth=2, n_estimators=50 .................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=50, score=0.9691943127962085, total=   0.1s
[CV] learning_rate=0.1, max_depth=2, n_estimators=100 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=100, score=0.9739644970414201, total=   0.2s
[CV] learning_rate=0.1, max_depth=2, n_estimators=100 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=100, score=0.9834319526627219, total=   0.3s
[CV] learning_rate=0.1, max_depth=2, n_estimators=100 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=100, score=0.9715639810426541, total=   0.2s
[CV] learning_rate=0.1, max_depth=2, n_estimators=150 ................
[

[CV]  learning_rate=0.1, max_depth=3, n_estimators=400, score=0.9727488151658767, total=   1.4s
[CV] learning_rate=0.1, max_depth=4, n_estimators=10 .................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=10, score=0.9704142011834319, total=   0.1s
[CV] learning_rate=0.1, max_depth=4, n_estimators=10 .................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=10, score=0.9798816568047337, total=   0.1s
[CV] learning_rate=0.1, max_depth=4, n_estimators=10 .................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=10, score=0.966824644549763, total=   0.0s
[CV] learning_rate=0.1, max_depth=4, n_estimators=50 .................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=50, score=0.9715976331360947, total=   0.2s
[CV] learning_rate=0.1, max_depth=4, n_estimators=50 .................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=50, score=0.9798816568047337, total=   0.2s
[CV] learning_rate=0.1, max_depth=4, n_estimators=50 .................
[CV]

[CV]  learning_rate=0.1, max_depth=5, n_estimators=350, score=0.9846153846153847, total=   1.1s
[CV] learning_rate=0.1, max_depth=5, n_estimators=350 ................
[CV]  learning_rate=0.1, max_depth=5, n_estimators=350, score=0.9715639810426541, total=   1.0s
[CV] learning_rate=0.1, max_depth=5, n_estimators=400 ................
[CV]  learning_rate=0.1, max_depth=5, n_estimators=400, score=0.9775147928994082, total=   1.2s
[CV] learning_rate=0.1, max_depth=5, n_estimators=400 ................
[CV]  learning_rate=0.1, max_depth=5, n_estimators=400, score=0.9846153846153847, total=   1.1s
[CV] learning_rate=0.1, max_depth=5, n_estimators=400 ................
[CV]  learning_rate=0.1, max_depth=5, n_estimators=400, score=0.9715639810426541, total=   1.0s
[CV] learning_rate=1, max_depth=1, n_estimators=10 ...................
[CV]  learning_rate=1, max_depth=1, n_estimators=10, score=0.9727810650887574, total=   0.0s
[CV] learning_rate=1, max_depth=1, n_estimators=10 ...................
[

[CV]  learning_rate=1, max_depth=2, n_estimators=300, score=0.9727810650887574, total=   0.3s
[CV] learning_rate=1, max_depth=2, n_estimators=300 ..................
[CV]  learning_rate=1, max_depth=2, n_estimators=300, score=0.9822485207100592, total=   0.3s
[CV] learning_rate=1, max_depth=2, n_estimators=300 ..................
[CV]  learning_rate=1, max_depth=2, n_estimators=300, score=0.9751184834123223, total=   0.3s
[CV] learning_rate=1, max_depth=2, n_estimators=350 ..................
[CV]  learning_rate=1, max_depth=2, n_estimators=350, score=0.9727810650887574, total=   0.3s
[CV] learning_rate=1, max_depth=2, n_estimators=350 ..................
[CV]  learning_rate=1, max_depth=2, n_estimators=350, score=0.9822485207100592, total=   0.3s
[CV] learning_rate=1, max_depth=2, n_estimators=350 ..................
[CV]  learning_rate=1, max_depth=2, n_estimators=350, score=0.9751184834123223, total=   0.2s
[CV] learning_rate=1, max_depth=2, n_estimators=400 ..................
[CV]  lear

[CV]  learning_rate=1, max_depth=4, n_estimators=200, score=0.9656398104265402, total=   0.2s
[CV] learning_rate=1, max_depth=4, n_estimators=250 ..................
[CV]  learning_rate=1, max_depth=4, n_estimators=250, score=0.9775147928994082, total=   0.3s
[CV] learning_rate=1, max_depth=4, n_estimators=250 ..................
[CV]  learning_rate=1, max_depth=4, n_estimators=250, score=0.9739644970414201, total=   0.3s
[CV] learning_rate=1, max_depth=4, n_estimators=250 ..................
[CV]  learning_rate=1, max_depth=4, n_estimators=250, score=0.9656398104265402, total=   0.2s
[CV] learning_rate=1, max_depth=4, n_estimators=300 ..................
[CV]  learning_rate=1, max_depth=4, n_estimators=300, score=0.9775147928994082, total=   0.3s
[CV] learning_rate=1, max_depth=4, n_estimators=300 ..................
[CV]  learning_rate=1, max_depth=4, n_estimators=300, score=0.9739644970414201, total=   0.3s
[CV] learning_rate=1, max_depth=4, n_estimators=300 ..................
[CV]  lear

[CV]  learning_rate=10, max_depth=1, n_estimators=150, score=0.0509478672985782, total=   0.2s
[CV] learning_rate=10, max_depth=1, n_estimators=200 .................
[CV]  learning_rate=10, max_depth=1, n_estimators=200, score=0.04497041420118343, total=   0.2s
[CV] learning_rate=10, max_depth=1, n_estimators=200 .................
[CV]  learning_rate=10, max_depth=1, n_estimators=200, score=0.046153846153846156, total=   0.2s
[CV] learning_rate=10, max_depth=1, n_estimators=200 .................
[CV]  learning_rate=10, max_depth=1, n_estimators=200, score=0.0509478672985782, total=   0.2s
[CV] learning_rate=10, max_depth=1, n_estimators=250 .................
[CV]  learning_rate=10, max_depth=1, n_estimators=250, score=0.04497041420118343, total=   0.3s
[CV] learning_rate=10, max_depth=1, n_estimators=250 .................
[CV]  learning_rate=10, max_depth=1, n_estimators=250, score=0.046153846153846156, total=   0.3s
[CV] learning_rate=10, max_depth=1, n_estimators=250 ................

[CV]  learning_rate=10, max_depth=3, n_estimators=100, score=0.1408284023668639, total=   0.3s
[CV] learning_rate=10, max_depth=3, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=3, n_estimators=100, score=0.5035545023696683, total=   0.3s
[CV] learning_rate=10, max_depth=3, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=3, n_estimators=150, score=0.41893491124260357, total=   0.5s
[CV] learning_rate=10, max_depth=3, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=3, n_estimators=150, score=0.1408284023668639, total=   0.5s
[CV] learning_rate=10, max_depth=3, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=3, n_estimators=150, score=0.5035545023696683, total=   0.5s
[CV] learning_rate=10, max_depth=3, n_estimators=200 .................
[CV]  learning_rate=10, max_depth=3, n_estimators=200, score=0.41893491124260357, total=   0.6s
[CV] learning_rate=10, max_depth=3, n_estimators=200 .................
[C

[CV]  learning_rate=10, max_depth=5, n_estimators=50, score=0.3408284023668639, total=   0.3s
[CV] learning_rate=10, max_depth=5, n_estimators=50 ..................
[CV]  learning_rate=10, max_depth=5, n_estimators=50, score=0.41183431952662725, total=   0.3s
[CV] learning_rate=10, max_depth=5, n_estimators=50 ..................
[CV]  learning_rate=10, max_depth=5, n_estimators=50, score=0.07464454976303317, total=   0.3s
[CV] learning_rate=10, max_depth=5, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=5, n_estimators=100, score=0.3408284023668639, total=   0.6s
[CV] learning_rate=10, max_depth=5, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=5, n_estimators=100, score=0.41183431952662725, total=   0.7s
[CV] learning_rate=10, max_depth=5, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=5, n_estimators=100, score=0.07464454976303317, total=   0.6s
[CV] learning_rate=10, max_depth=5, n_estimators=150 .................
[CV

[Parallel(n_jobs=1)]: Done 675 out of 675 | elapsed:  6.6min finished


Best score: 0.9806629834254144
Best parameter set: {'learning_rate': 0.1, 'max_depth': 2, 'n_estimators': 400}


In [85]:
gb_tree_model = GradientBoostingClassifier(n_estimators=400, learning_rate=0.1, max_depth=2, random_state=0)
gb_tree_scores = cross_val_score(gb_tree_model, X, y, cv=10)
print("Gradient Boosted Tree CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (gb_tree_scores.mean()*100, gb_tree_scores.std() * 2*100))

Gradient Boosted Tree CV Accuracy: 97.00% (+/- 4.75%)


## Naive Bayes

In [86]:
naive_bayes_model = GaussianNB()
naive_bayes_scores = cross_val_score(naive_bayes_model, X, y, cv=10)
print("Naive Bayes CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (naive_bayes_scores.mean()*100, naive_bayes_scores.std() * 2*100))

Naive Bayes CV Accuracy: 85.67% (+/- 15.46%)


# Model Comparison Using Principal Component Analysis

## PCA

In [91]:
param_grid = {'n_components': [1,2,3,4,5,6,7,8]}
pca_model = GridSearchCV(PCA(),param_grid,refit=True,verbose=4)
pca_model = pca_model.fit(X_train, y_train)
print("Best score: %s" % (pca_model.best_score_))
print("Best parameter set: %s" % (pca_model.best_params_))

Fitting 3 folds for each of 8 candidates, totalling 24 fits
[CV] n_components=1 ..................................................
[CV] ........ n_components=1, score=-35.682692247528166, total=   0.0s
[CV] n_components=1 ..................................................
[CV] ......... n_components=1, score=-34.98405588269396, total=   0.0s
[CV] n_components=1 ..................................................
[CV] ......... n_components=1, score=-36.52779392790749, total=   0.0s
[CV] n_components=2 ..................................................
[CV] .......... n_components=2, score=-8.26304640386624, total=   0.0s
[CV] n_components=2 ..................................................
[CV] ......... n_components=2, score=-7.928744471857906, total=   0.0s
[CV] n_components=2 ..................................................
[CV] ......... n_components=2, score=-8.787424580373761, total=   0.0s
[CV] n_components=3 ..................................................
[CV] .......... n

[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.0s remaining:    0.0s


[CV] .......... n_components=8, score=23.28535872068322, total=   0.0s
[CV] n_components=8 ..................................................
[CV] ......... n_components=8, score=22.673176359623124, total=   0.0s
[CV] n_components=8 ..................................................
[CV] ......... n_components=8, score=23.307115332290437, total=   0.0s
Best score: 23.088463884495656
Best parameter set: {'n_components': 8}


[Parallel(n_jobs=1)]: Done  24 out of  24 | elapsed:    0.2s finished


In [105]:
n_components = [1,2,3,4,5,6,7,8,9,10]
for n in n_components:
    pca = PCA(n_components=n).fit(X_train)
    print("%d components captures %0.5f of the variance" % (n, sum(pca.explained_variance_ratio_)))

1 components captures 0.99869 of the variance
2 components captures 0.99995 of the variance
3 components captures 0.99999 of the variance
4 components captures 1.00000 of the variance
5 components captures 1.00000 of the variance
6 components captures 1.00000 of the variance
7 components captures 1.00000 of the variance
8 components captures 1.00000 of the variance
9 components captures 1.00000 of the variance
10 components captures 1.00000 of the variance


In [114]:
pca = PCA(n_components=3).fit(X_train)
X_pca = pca.transform(X)
X_train_pca = pca.transform(X_train)
X_test_pca = pca.transform(X_test)

## Logicstic Regression 

In [113]:
lm_model = LogisticRegression()
lm_scores = cross_val_score(lm_model, X_pca, y, cv=10)
print("Logistic Regression CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (lm_scores.mean()*100, lm_scores.std() * 2*100))

Logistic Regression CV Accuracy: 66.40% (+/- 18.98%)


## Support Vector Machine

In [115]:
svm_model = svm.SVC(kernel='linear')
svm_scores = cross_val_score(svm_model, X_pca, y, cv=10)
print("Support Vector Machine CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (svm_scores.mean()*100, svm_scores.std() * 2*100))

Support Vector Machine CV Accuracy: 66.49% (+/- 17.99%)


## CART

In [116]:
CART_model = DecisionTreeClassifier(random_state=0)
CART_scores = cross_val_score(CART_model, X_pca, y, cv=10)
print("CART CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (CART_scores.mean()*100, CART_scores.std() * 2*100))

CART CV Accuracy: 65.25% (+/- 12.69%)


## Random Forest

** Modify once we cover Random Forest **

In [117]:
param_grid = {'max_depth': [3,5,7],
              'n_estimators':[3,5,10,20,30,40],
              'criterion': ['gini', 'entropy']}
random_forest_model = GridSearchCV(RandomForestClassifier(),param_grid,refit=True,verbose=4)
random_forest_model = random_forest_model.fit(X_train_pca, y_train)
print("Best score: %s" % (random_forest_model.best_score_))
print("Best parameter set: %s" % (random_forest_model.best_params_))

Fitting 3 folds for each of 36 candidates, totalling 108 fits
[CV] criterion=gini, max_depth=3, n_estimators=3 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=3, score=0.6568047337278107, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=3 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=3, score=0.676923076923077, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=3 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=3, score=0.6883886255924171, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=5 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=5, score=0.663905325443787, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=5 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=5, score=0.6863905325443787, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=5 .....................
[CV]  criterion=gini, max_depth=3, n_estimators=5, score=0.

[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.0s remaining:    0.0s


[CV]  criterion=gini, max_depth=3, n_estimators=20, score=0.6733727810650888, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=20 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=20, score=0.6946745562130178, total=   0.0s
[CV] criterion=gini, max_depth=3, n_estimators=20 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=20, score=0.6682464454976303, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=30 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=30, score=0.6863905325443787, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=30 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=30, score=0.6816568047337278, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=30 ....................
[CV]  criterion=gini, max_depth=3, n_estimators=30, score=0.6753554502369669, total=   0.1s
[CV] criterion=gini, max_depth=3, n_estimators=40 ....................
[CV]  criterion=gini, 

[CV]  criterion=entropy, max_depth=3, n_estimators=10, score=0.6911242603550296, total=   0.0s
[CV] criterion=entropy, max_depth=3, n_estimators=10 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=10, score=0.6777251184834123, total=   0.0s
[CV] criterion=entropy, max_depth=3, n_estimators=20 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=20, score=0.6840236686390533, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=20 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=20, score=0.6804733727810651, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=20 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=20, score=0.6765402843601895, total=   0.0s
[CV] criterion=entropy, max_depth=3, n_estimators=30 .................
[CV]  criterion=entropy, max_depth=3, n_estimators=30, score=0.6840236686390533, total=   0.1s
[CV] criterion=entropy, max_depth=3, n_estimators=30 .................
[CV]

[Parallel(n_jobs=1)]: Done 108 out of 108 | elapsed:    5.5s finished


In [121]:
random_forest_model = RandomForestClassifier(max_depth=7, criterion='gini', n_estimators=40, random_state=0)
random_forest_scores = cross_val_score(random_forest_model, X_pca, y, cv=10)
print("Random Forest CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (random_forest_scores.mean()*100, random_forest_scores.std() * 2*100))

Random Forest CV Accuracy: 69.19% (+/- 16.13%)


## Nearest Neighbors

In [120]:
param_grid = {'n_neighbors': [3,5,7,9,11,13,15]}
nearest_neighbors_model = GridSearchCV(KNeighborsClassifier(),param_grid,refit=True,verbose=4)
nearest_neighbors_model = nearest_neighbors_model.fit(X_train_pca, y_train)
print("Best score: %s" % (nearest_neighbors_model.best_score_))
print("Best parameter set: %s" % (nearest_neighbors_model.best_params_))

Fitting 3 folds for each of 7 candidates, totalling 21 fits
[CV] n_neighbors=3 ...................................................
[CV] .......... n_neighbors=3, score=0.7124260355029586, total=   0.0s
[CV] n_neighbors=3 ...................................................
[CV] .......... n_neighbors=3, score=0.7159763313609467, total=   0.0s
[CV] n_neighbors=3 ...................................................
[CV] .......... n_neighbors=3, score=0.7002369668246445, total=   0.0s
[CV] n_neighbors=5 ...................................................
[CV] .......... n_neighbors=5, score=0.6946745562130178, total=   0.0s
[CV] n_neighbors=5 ...................................................
[CV] .......... n_neighbors=5, score=0.7112426035502959, total=   0.0s
[CV] n_neighbors=5 ...................................................
[CV] .......... n_neighbors=5, score=0.6990521327014217, total=   0.0s
[CV] n_neighbors=7 ...................................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.1s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.1s remaining:    0.0s


[CV] .......... n_neighbors=7, score=0.7029585798816568, total=   0.0s
[CV] n_neighbors=7 ...................................................
[CV] .......... n_neighbors=7, score=0.7041420118343196, total=   0.0s
[CV] n_neighbors=7 ...................................................
[CV] .......... n_neighbors=7, score=0.6883886255924171, total=   0.0s
[CV] n_neighbors=9 ...................................................
[CV] .......... n_neighbors=9, score=0.6994082840236686, total=   0.0s
[CV] n_neighbors=9 ...................................................
[CV] ........... n_neighbors=9, score=0.714792899408284, total=   0.0s
[CV] n_neighbors=9 ...................................................
[CV] .......... n_neighbors=9, score=0.6883886255924171, total=   0.0s
[CV] n_neighbors=11 ..................................................
[CV] ......... n_neighbors=11, score=0.7005917159763314, total=   0.0s
[CV] n_neighbors=11 ..................................................
[CV] .

[Parallel(n_jobs=1)]: Done  21 out of  21 | elapsed:    0.7s finished


In [124]:
nearest_neighbors_model = KNeighborsClassifier(n_neighbors=3)
nearest_neighbors_scores = cross_val_score(nearest_neighbors_model, X_pca, y, cv=10)
print("Nearest Neighbors CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (nearest_neighbors_scores.mean()*100, nearest_neighbors_scores.std() * 2*100))

Nearest Neighbors CV Accuracy: 64.15% (+/- 12.16%)


## Neural Network

In [125]:
param_grid = {'hidden_layer_sizes': [2, 4, 8, 16, 32, 64],
              'alpha': [0.0001, 0.001,0.01,0.1,1,10],
              'solver' : ['lbfgs', 'adam'],
              'activation': ['logistic']}

neural_network_model = GridSearchCV(MLPClassifier(random_state=0),param_grid,refit=True,verbose=4)
neural_network_model = neural_network_model.fit(X_train_pca, y_train)
print("Best score: %s" % (neural_network_model.best_score_))
print("Best parameter set: %s" % (neural_network_model.best_params_))

Fitting 3 folds for each of 72 candidates, totalling 216 fits
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs, score=0.693491124260355, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs 


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.1s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.2s remaining:    0.0s


[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs, score=0.7005917159763314, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=lbfgs, score=0.693127962085308, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam 


[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.3s remaining:    0.0s


[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam, score=0.6958579881656805, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam, score=0.6863905325443787, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=2, solver=adam, score=0.6753554502369669, total=   0.4s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs, score=0.6674556213017752, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs, score=0.6946745562130178, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=lbfgs, score=0.6860189573459715, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam, score=0.6887573964497041, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam, score=0.693491124260355, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=4, solver=adam, score=0.6872037914691943, total=   0.5s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs, score=0.6911242603550296, total=   0.1s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs, score=0.7005917159763314, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=lbfgs, score=0.6895734597156398, total=   0.2s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam, score=0.7029585798816568, total=   0.4s
[CV] activation=logistic, alpha=0.0001, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.0001



[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam, score=0.6958579881656805, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam, score=0.6863905325443787, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=2, solver=adam, score=0.6753554502369669, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs, score=0.6923076923076923, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs, score=0.6970414201183432, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=lbfgs, score=0.6966824644549763, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam, score=0.6887573964497041, total=   0.4s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam, score=0.693491124260355, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=4, solver=adam, score=0.6872037914691943, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs, score=0.693491124260355, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs, score=0.6982248520710059, total=   0.2s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=lbfgs, score=0.7002369668246445, total=   0.1s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam, score=0.7041420118343196, total=   0.5s
[CV] activation=logistic, alpha=0.001, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.001, hidden_lay



[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam, score=0.6958579881656805, total=   0.5s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam, score=0.6863905325443787, total=   0.6s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=2, solver=adam, score=0.6753554502369669, total=   0.5s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs, score=0.6958579881656805, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs, score=0.6958579881656805, total=   0.1s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=lbfgs, score=0.693127962085308, total=   0.1s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam, score=0.6887573964497041, total=   0.8s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam, score=0.6946745562130178, total=   0.7s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=4, solver=adam, score=0.6860189573459715, total=   0.5s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs, score=0.7076923076923077, total=   0.3s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs, score=0.6970414201183432, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=lbfgs, score=0.6966824644549763, total=   0.2s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam, score=0.7029585798816568, total=   0.7s
[CV] activation=logistic, alpha=0.01, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.01, hidden_layer_sizes=8



[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam, score=0.6958579881656805, total=   0.7s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam, score=0.6863905325443787, total=   0.8s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=2, solver=adam, score=0.6741706161137441, total=   0.8s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs, score=0.6899408284023668, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs, score=0.7029585798816568, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=lbfgs, score=0.6966824644549763, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam, score=0.6899408284023668, total=   0.8s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam, score=0.6923076923076923, total=   0.5s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam 




[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=4, solver=adam, score=0.6860189573459715, total=   0.6s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs, score=0.7112426035502959, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs, score=0.7005917159763314, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=lbfgs, score=0.6800947867298578, total=   0.2s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam, score=0.7065088757396449, total=   0.4s
[CV] activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=adam 
[CV]  activation=logistic, alpha=0.1, hidden_layer_sizes=8, solver=ad



[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam, score=0.6816568047337278, total=   0.4s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam, score=0.7076923076923077, total=   0.5s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam .




[CV]  activation=logistic, alpha=1, hidden_layer_sizes=4, solver=adam, score=0.6907582938388626, total=   0.4s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs, score=0.693491124260355, total=   0.1s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs, score=0.6982248520710059, total=   0.2s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs 
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=lbfgs, score=0.6954976303317536, total=   0.1s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam .
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam, score=0.6911242603550296, total=   0.3s
[CV] activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam .
[CV]  activation=logistic, alpha=1, hidden_layer_sizes=8, solver=adam, score=0.698224852

[CV]  activation=logistic, alpha=10, hidden_layer_sizes=16, solver=lbfgs, score=0.6800947867298578, total=   0.2s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=16, solver=adam 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=16, solver=adam, score=0.6295857988165681, total=   0.2s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=16, solver=adam 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=16, solver=adam, score=0.6319526627218935, total=   0.3s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=16, solver=adam 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=16, solver=adam, score=0.6279620853080569, total=   0.2s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=32, solver=lbfgs, score=0.7029585798816568, total=   0.3s
[CV] activation=logistic, alpha=10, hidden_layer_sizes=32, solver=lbfgs 
[CV]  activation=logistic, alpha=10, hidden_layer_sizes=32, solver=lbfg

[Parallel(n_jobs=1)]: Done 216 out of 216 | elapsed:  1.4min finished


Best score: 0.7154696132596685
Best parameter set: {'activation': 'logistic', 'alpha': 0.0001, 'hidden_layer_sizes': 16, 'solver': 'lbfgs'}


In [126]:
neural_network_model = MLPClassifier(activation='logistic', solver='lbfgs', alpha=0.0001, hidden_layer_sizes=16, random_state=0)
neural_network_scores = cross_val_score(neural_network_model, X_pca, y, cv=10)
print("Neural Network CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (neural_network_scores.mean()*100, neural_network_scores.std() * 2*100))

Neural Network CV Accuracy: 67.21% (+/- 15.96%)


## Boosted Trees

### AdaBoost Tree

In [127]:
param_grid = {'n_estimators': [10,50,100,150,200,250,300,350,400]}
adaboost_model = GridSearchCV(AdaBoostClassifier(),param_grid,refit=True,verbose=4)
adaboost_model = adaboost_model.fit(X_train_pca, y_train)
print("Best score: %s" % (adaboost_model.best_score_))
print("Best parameter set: %s" % (adaboost_model.best_params_))

Fitting 3 folds for each of 9 candidates, totalling 27 fits
[CV] n_estimators=10 .................................................
[CV] ........ n_estimators=10, score=0.6745562130177515, total=   0.0s
[CV] n_estimators=10 .................................................
[CV] ........ n_estimators=10, score=0.6828402366863905, total=   0.0s
[CV] n_estimators=10 .................................................
[CV] ........ n_estimators=10, score=0.6765402843601895, total=   0.0s
[CV] n_estimators=50 .................................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.1s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.1s remaining:    0.0s


[CV] ........ n_estimators=50, score=0.7053254437869823, total=   0.2s
[CV] n_estimators=50 .................................................
[CV] ........ n_estimators=50, score=0.6840236686390533, total=   0.2s
[CV] n_estimators=50 .................................................
[CV] ........ n_estimators=50, score=0.6824644549763034, total=   0.2s
[CV] n_estimators=100 ................................................
[CV] ....... n_estimators=100, score=0.7088757396449704, total=   0.3s
[CV] n_estimators=100 ................................................
[CV] ....... n_estimators=100, score=0.6923076923076923, total=   0.3s
[CV] n_estimators=100 ................................................
[CV] ....... n_estimators=100, score=0.6943127962085308, total=   0.3s
[CV] n_estimators=150 ................................................
[CV] ....... n_estimators=150, score=0.7053254437869823, total=   0.5s
[CV] n_estimators=150 ................................................
[CV] .

[Parallel(n_jobs=1)]: Done  27 out of  27 | elapsed:   19.7s finished


Best score: 0.7075769534333071
Best parameter set: {'n_estimators': 200}


In [128]:
adaboost_model = AdaBoostClassifier(n_estimators=200)
adaboost_model_scores = cross_val_score(adaboost_model, X_pca, y, cv=10)
print("AdaBoost Tree CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (adaboost_model_scores.mean()*100, adaboost_model_scores.std() * 2*100))

AdaBoost Tree CV Accuracy: 67.78% (+/- 16.51%)


### Gradient Boosted Tree

In [129]:
param_grid = {'n_estimators': [10,50,100,150,200,250,300,350,400],
             'learning_rate': [0.001, 0.01, 0.1, 1, 10],
             'max_depth': [1,2,3,4,5]}
gb_tree_model = GridSearchCV(GradientBoostingClassifier(random_state=0),param_grid,refit=True,verbose=4)
gb_tree_model = gb_tree_model.fit(X_train_pca, y_train)
print("Best score: %s" % (gb_tree_model.best_score_))
print("Best parameter set: %s" % (gb_tree_model.best_params_))

Fitting 3 folds for each of 225 candidates, totalling 675 fits
[CV] learning_rate=0.001, max_depth=1, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=10, score=0.5029585798816568, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=10, score=0.5029585798816568, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=10 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=10, score=0.5035545023696683, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=50, score=0.6544378698224852, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=50, score=0.6568047337278107, total=   0.0s
[CV] learning_rate=0.001, max_depth=1, n_estimators=50 ...............
[CV]  learning_rate=0.001,

[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.0s remaining:    0.0s


[CV]  learning_rate=0.001, max_depth=1, n_estimators=100, score=0.6544378698224852, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=100, score=0.6568047337278107, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=100, score=0.6492890995260664, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=150 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=150, score=0.6544378698224852, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=150 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=150, score=0.6568047337278107, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=150 ..............
[CV]  learning_rate=0.001, max_depth=1, n_estimators=150, score=0.6492890995260664, total=   0.1s
[CV] learning_rate=0.001, max_depth=1, n_estimators=200 .

[CV]  learning_rate=0.001, max_depth=3, n_estimators=50, score=0.6741706161137441, total=   0.1s
[CV] learning_rate=0.001, max_depth=3, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=100, score=0.6923076923076923, total=   0.1s
[CV] learning_rate=0.001, max_depth=3, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=100, score=0.7041420118343196, total=   0.1s
[CV] learning_rate=0.001, max_depth=3, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=100, score=0.6741706161137441, total=   0.1s
[CV] learning_rate=0.001, max_depth=3, n_estimators=150 ..............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=150, score=0.6923076923076923, total=   0.2s
[CV] learning_rate=0.001, max_depth=3, n_estimators=150 ..............
[CV]  learning_rate=0.001, max_depth=3, n_estimators=150, score=0.7041420118343196, total=   0.2s
[CV] learning_rate=0.001, max_depth=3, n_estimators=150 ..

[CV]  learning_rate=0.001, max_depth=5, n_estimators=50, score=0.6840236686390533, total=   0.1s
[CV] learning_rate=0.001, max_depth=5, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=5, n_estimators=50, score=0.6804733727810651, total=   0.1s
[CV] learning_rate=0.001, max_depth=5, n_estimators=50 ...............
[CV]  learning_rate=0.001, max_depth=5, n_estimators=50, score=0.6978672985781991, total=   0.1s
[CV] learning_rate=0.001, max_depth=5, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=5, n_estimators=100, score=0.7053254437869823, total=   0.3s
[CV] learning_rate=0.001, max_depth=5, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=5, n_estimators=100, score=0.7017751479289941, total=   0.2s
[CV] learning_rate=0.001, max_depth=5, n_estimators=100 ..............
[CV]  learning_rate=0.001, max_depth=5, n_estimators=100, score=0.6966824644549763, total=   0.2s
[CV] learning_rate=0.001, max_depth=5, n_estimators=150 ....

[CV]  learning_rate=0.01, max_depth=1, n_estimators=400, score=0.6863905325443787, total=   0.2s
[CV] learning_rate=0.01, max_depth=1, n_estimators=400 ...............
[CV]  learning_rate=0.01, max_depth=1, n_estimators=400, score=0.6706161137440758, total=   0.2s
[CV] learning_rate=0.01, max_depth=2, n_estimators=10 ................
[CV]  learning_rate=0.01, max_depth=2, n_estimators=10, score=0.6603550295857988, total=   0.0s
[CV] learning_rate=0.01, max_depth=2, n_estimators=10 ................
[CV]  learning_rate=0.01, max_depth=2, n_estimators=10, score=0.6650887573964497, total=   0.0s
[CV] learning_rate=0.01, max_depth=2, n_estimators=10 ................
[CV]  learning_rate=0.01, max_depth=2, n_estimators=10, score=0.6481042654028436, total=   0.0s
[CV] learning_rate=0.01, max_depth=2, n_estimators=50 ................
[CV]  learning_rate=0.01, max_depth=2, n_estimators=50, score=0.6674556213017752, total=   0.0s
[CV] learning_rate=0.01, max_depth=2, n_estimators=50 .............

[CV]  learning_rate=0.01, max_depth=3, n_estimators=300, score=0.7191943127962085, total=   0.3s
[CV] learning_rate=0.01, max_depth=3, n_estimators=350 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=350, score=0.7337278106508875, total=   0.4s
[CV] learning_rate=0.01, max_depth=3, n_estimators=350 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=350, score=0.7313609467455622, total=   0.4s
[CV] learning_rate=0.01, max_depth=3, n_estimators=350 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=350, score=0.7203791469194313, total=   0.3s
[CV] learning_rate=0.01, max_depth=3, n_estimators=400 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=400, score=0.7372781065088757, total=   0.4s
[CV] learning_rate=0.01, max_depth=3, n_estimators=400 ...............
[CV]  learning_rate=0.01, max_depth=3, n_estimators=400, score=0.7313609467455622, total=   0.4s
[CV] learning_rate=0.01, max_depth=3, n_estimators=400 ........

[CV]  learning_rate=0.01, max_depth=5, n_estimators=250, score=0.7325443786982249, total=   0.5s
[CV] learning_rate=0.01, max_depth=5, n_estimators=250 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=250, score=0.7372781065088757, total=   0.5s
[CV] learning_rate=0.01, max_depth=5, n_estimators=250 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=250, score=0.726303317535545, total=   0.5s
[CV] learning_rate=0.01, max_depth=5, n_estimators=300 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=300, score=0.7289940828402367, total=   0.6s
[CV] learning_rate=0.01, max_depth=5, n_estimators=300 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=300, score=0.7467455621301775, total=   0.6s
[CV] learning_rate=0.01, max_depth=5, n_estimators=300 ...............
[CV]  learning_rate=0.01, max_depth=5, n_estimators=300, score=0.731042654028436, total=   0.6s
[CV] learning_rate=0.01, max_depth=5, n_estimators=350 ..........

[CV]  learning_rate=0.1, max_depth=2, n_estimators=150, score=0.7002369668246445, total=   0.1s
[CV] learning_rate=0.1, max_depth=2, n_estimators=200 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=200, score=0.7183431952662722, total=   0.1s
[CV] learning_rate=0.1, max_depth=2, n_estimators=200 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=200, score=0.7396449704142012, total=   0.2s
[CV] learning_rate=0.1, max_depth=2, n_estimators=200 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=200, score=0.6978672985781991, total=   0.1s
[CV] learning_rate=0.1, max_depth=2, n_estimators=250 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=250, score=0.7171597633136094, total=   0.2s
[CV] learning_rate=0.1, max_depth=2, n_estimators=250 ................
[CV]  learning_rate=0.1, max_depth=2, n_estimators=250, score=0.7396449704142012, total=   0.2s
[CV] learning_rate=0.1, max_depth=2, n_estimators=250 ...............

[CV]  learning_rate=0.1, max_depth=4, n_estimators=100, score=0.7215639810426541, total=   0.1s
[CV] learning_rate=0.1, max_depth=4, n_estimators=150 ................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=150, score=0.7313609467455622, total=   0.2s
[CV] learning_rate=0.1, max_depth=4, n_estimators=150 ................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=150, score=0.736094674556213, total=   0.2s
[CV] learning_rate=0.1, max_depth=4, n_estimators=150 ................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=150, score=0.7120853080568721, total=   0.2s
[CV] learning_rate=0.1, max_depth=4, n_estimators=200 ................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=200, score=0.7183431952662722, total=   0.3s
[CV] learning_rate=0.1, max_depth=4, n_estimators=200 ................
[CV]  learning_rate=0.1, max_depth=4, n_estimators=200, score=0.7337278106508875, total=   0.3s
[CV] learning_rate=0.1, max_depth=4, n_estimators=200 ................

[CV]  learning_rate=1, max_depth=1, n_estimators=50, score=0.6919431279620853, total=   0.0s
[CV] learning_rate=1, max_depth=1, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=1, n_estimators=100, score=0.7076923076923077, total=   0.1s
[CV] learning_rate=1, max_depth=1, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=1, n_estimators=100, score=0.7159763313609467, total=   0.1s
[CV] learning_rate=1, max_depth=1, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=1, n_estimators=100, score=0.6990521327014217, total=   0.1s
[CV] learning_rate=1, max_depth=1, n_estimators=150 ..................
[CV]  learning_rate=1, max_depth=1, n_estimators=150, score=0.7088757396449704, total=   0.1s
[CV] learning_rate=1, max_depth=1, n_estimators=150 ..................
[CV]  learning_rate=1, max_depth=1, n_estimators=150, score=0.714792899408284, total=   0.1s
[CV] learning_rate=1, max_depth=1, n_estimators=150 ..................
[CV]  learni

[CV]  learning_rate=1, max_depth=3, n_estimators=50, score=0.6789099526066351, total=   0.1s
[CV] learning_rate=1, max_depth=3, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=3, n_estimators=100, score=0.6792899408284023, total=   0.1s
[CV] learning_rate=1, max_depth=3, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=3, n_estimators=100, score=0.6982248520710059, total=   0.1s
[CV] learning_rate=1, max_depth=3, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=3, n_estimators=100, score=0.6706161137440758, total=   0.1s
[CV] learning_rate=1, max_depth=3, n_estimators=150 ..................
[CV]  learning_rate=1, max_depth=3, n_estimators=150, score=0.6792899408284023, total=   0.2s
[CV] learning_rate=1, max_depth=3, n_estimators=150 ..................
[CV]  learning_rate=1, max_depth=3, n_estimators=150, score=0.6958579881656805, total=   0.1s
[CV] learning_rate=1, max_depth=3, n_estimators=150 ..................
[CV]  learn

[CV]  learning_rate=1, max_depth=5, n_estimators=50, score=0.6875739644970414, total=   0.1s
[CV] learning_rate=1, max_depth=5, n_estimators=50 ...................
[CV]  learning_rate=1, max_depth=5, n_estimators=50, score=0.6943127962085308, total=   0.1s
[CV] learning_rate=1, max_depth=5, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=5, n_estimators=100, score=0.6958579881656805, total=   0.2s
[CV] learning_rate=1, max_depth=5, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=5, n_estimators=100, score=0.6911242603550296, total=   0.2s
[CV] learning_rate=1, max_depth=5, n_estimators=100 ..................
[CV]  learning_rate=1, max_depth=5, n_estimators=100, score=0.6848341232227488, total=   0.2s
[CV] learning_rate=1, max_depth=5, n_estimators=150 ..................
[CV]  learning_rate=1, max_depth=5, n_estimators=150, score=0.6863905325443787, total=   0.3s
[CV] learning_rate=1, max_depth=5, n_estimators=150 ..................
[CV]  learni

[CV]  learning_rate=10, max_depth=2, n_estimators=100, score=0.4284023668639053, total=   0.1s
[CV] learning_rate=10, max_depth=2, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=2, n_estimators=100, score=0.34437869822485206, total=   0.1s
[CV] learning_rate=10, max_depth=2, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=2, n_estimators=100, score=0.3495260663507109, total=   0.1s
[CV] learning_rate=10, max_depth=2, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=2, n_estimators=150, score=0.4284023668639053, total=   0.1s
[CV] learning_rate=10, max_depth=2, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=2, n_estimators=150, score=0.34437869822485206, total=   0.1s
[CV] learning_rate=10, max_depth=2, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=2, n_estimators=150, score=0.3495260663507109, total=   0.1s
[CV] learning_rate=10, max_depth=2, n_estimators=200 .................
[C

[CV]  learning_rate=10, max_depth=4, n_estimators=50, score=0.49940828402366866, total=   0.1s
[CV] learning_rate=10, max_depth=4, n_estimators=50 ..................
[CV]  learning_rate=10, max_depth=4, n_estimators=50, score=0.580568720379147, total=   0.1s
[CV] learning_rate=10, max_depth=4, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=4, n_estimators=100, score=0.47928994082840237, total=   0.1s
[CV] learning_rate=10, max_depth=4, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=4, n_estimators=100, score=0.49940828402366866, total=   0.2s
[CV] learning_rate=10, max_depth=4, n_estimators=100 .................
[CV]  learning_rate=10, max_depth=4, n_estimators=100, score=0.580568720379147, total=   0.1s
[CV] learning_rate=10, max_depth=4, n_estimators=150 .................
[CV]  learning_rate=10, max_depth=4, n_estimators=150, score=0.47928994082840237, total=   0.2s
[CV] learning_rate=10, max_depth=4, n_estimators=150 .................
[CV]

[Parallel(n_jobs=1)]: Done 675 out of 675 | elapsed:  2.7min finished


Best score: 0.7403314917127072
Best parameter set: {'learning_rate': 0.01, 'max_depth': 4, 'n_estimators': 300}


In [130]:
gb_tree_model = GradientBoostingClassifier(n_estimators=300, learning_rate=0.01, max_depth=4, random_state=0)
gb_tree_scores = cross_val_score(gb_tree_model, X_pca, y, cv=10)
print("Gradient Boosted Tree CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (gb_tree_scores.mean()*100, gb_tree_scores.std() * 2*100))

Gradient Boosted Tree CV Accuracy: 69.32% (+/- 16.90%)


## Naive Bayes

In [131]:
naive_bayes_model = GaussianNB()
naive_bayes_scores = cross_val_score(naive_bayes_model, X_pca, y, cv=10)
print("Naive Bayes CV Accuracy: %0.2f%% (+/- %0.2f%%)" % (naive_bayes_scores.mean()*100, naive_bayes_scores.std() * 2*100))

Naive Bayes CV Accuracy: 62.75% (+/- 16.82%)
