In [46]:
import pandas as pd
import numpy as np
from sklearn.ensemble import RandomForestClassifier
from sklearn.ensemble import VotingClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.ensemble import GradientBoostingClassifier
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import MinMaxScaler, StandardScaler, LabelEncoder

In [47]:
df = pd.read_csv('Employee_Attrition.csv')

In [48]:
df.head()

Unnamed: 0,Age,Attrition,BusinessTravel,DailyRate,Department,DistanceFromHome,Education,EducationField,EmployeeCount,EmployeeNumber,...,RelationshipSatisfaction,StandardHours,StockOptionLevel,TotalWorkingYears,TrainingTimesLastYear,WorkLifeBalance,YearsAtCompany,YearsInCurrentRole,YearsSinceLastPromotion,YearsWithCurrManager
0,41,Yes,Travel_Rarely,1102,Sales,1,2,Life Sciences,1,1,...,1,80,0,8,0,1,6,4,0,5
1,49,No,Travel_Frequently,279,Research & Development,8,1,Life Sciences,1,2,...,4,80,1,10,3,3,10,7,1,7
2,37,Yes,Travel_Rarely,1373,Research & Development,2,2,Other,1,4,...,2,80,0,7,3,3,0,0,0,0
3,33,No,Travel_Frequently,1392,Research & Development,3,4,Life Sciences,1,5,...,3,80,0,8,3,3,8,7,3,0
4,27,No,Travel_Rarely,591,Research & Development,2,1,Medical,1,7,...,4,80,1,6,3,3,2,2,2,2


In [49]:
df.isnull().sum()

Age                         0
Attrition                   0
BusinessTravel              0
DailyRate                   0
Department                  0
DistanceFromHome            0
Education                   0
EducationField              0
EmployeeCount               0
EmployeeNumber              0
EnvironmentSatisfaction     0
Gender                      0
HourlyRate                  0
JobInvolvement              0
JobLevel                    0
JobRole                     0
JobSatisfaction             0
MaritalStatus               0
MonthlyIncome               0
MonthlyRate                 0
NumCompaniesWorked          0
Over18                      0
OverTime                    0
PercentSalaryHike           0
PerformanceRating           0
RelationshipSatisfaction    0
StandardHours               0
StockOptionLevel            0
TotalWorkingYears           0
TrainingTimesLastYear       0
WorkLifeBalance             0
YearsAtCompany              0
YearsInCurrentRole          0
YearsSince

In [50]:
X_df = df.drop('Attrition', axis=1)
y = df['Attrition']

X_df.shape,y.shape

((1470, 34), (1470,))

In [51]:
objList = X_df.select_dtypes(include = "object").columns #
print (objList)

Index(['BusinessTravel', 'Department', 'EducationField', 'Gender', 'JobRole',
       'MaritalStatus', 'Over18', 'OverTime'],
      dtype='object')


In [52]:
from sklearn.preprocessing import LabelEncoder #encoder package of sklearn
le = LabelEncoder() #le variable has been assigned a labelencoder function

for Shiv in objList:
    X_df[Shiv] = le.fit_transform(X_df[Shiv].astype(str))

print (X_df.info())

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1470 entries, 0 to 1469
Data columns (total 34 columns):
 #   Column                    Non-Null Count  Dtype
---  ------                    --------------  -----
 0   Age                       1470 non-null   int64
 1   BusinessTravel            1470 non-null   int32
 2   DailyRate                 1470 non-null   int64
 3   Department                1470 non-null   int32
 4   DistanceFromHome          1470 non-null   int64
 5   Education                 1470 non-null   int64
 6   EducationField            1470 non-null   int32
 7   EmployeeCount             1470 non-null   int64
 8   EmployeeNumber            1470 non-null   int64
 9   EnvironmentSatisfaction   1470 non-null   int64
 10  Gender                    1470 non-null   int32
 11  HourlyRate                1470 non-null   int64
 12  JobInvolvement            1470 non-null   int64
 13  JobLevel                  1470 non-null   int64
 14  JobRole                   1470 non-null 

In [53]:
# Split feature and label sets to train and data sets.

X_train, X_test, y_train, y_test = train_test_split(X_df, y, test_size = 0.2, random_state = 10)
X_train.shape, X_test.shape, y_train.shape, y_test.shape

((1176, 34), (294, 34), (1176,), (294,))

In [54]:
scaler = MinMaxScaler(feature_range = (0,1))
scaler.fit(X_train)
scaler.fit(X_test)
X_train = scaler.transform(X_train)
X_test = scaler.transform(X_test)

# Grid Search for all the algo's individually 

In [55]:
from sklearn.model_selection import GridSearchCV
param_grid = {'C':np.linspace(0.1, 10, 20), 'gamma':[1,0.1,0.01,0.001], 'kernel' : ['linear', 'poly', 'rbf']}

In [56]:
grid = GridSearchCV(SVC(), param_grid, refit = True, verbose=3, cv=5)
grid.fit(X_train, y_train)

Fitting 5 folds for each of 240 candidates, totalling 1200 fits
[CV 1/5] END .....C=0.1, gamma=1, kernel=linear;, score=0.843 total time=   0.0s
[CV 2/5] END .....C=0.1, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END .....C=0.1, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 4/5] END .....C=0.1, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END .....C=0.1, gamma=1, kernel=linear;, score=0.843 total time=   0.0s
[CV 1/5] END .......C=0.1, gamma=1, kernel=poly;, score=0.835 total time=   0.0s
[CV 2/5] END .......C=0.1, gamma=1, kernel=poly;, score=0.838 total time=   0.0s
[CV 3/5] END .......C=0.1, gamma=1, kernel=poly;, score=0.847 total time=   0.0s
[CV 4/5] END .......C=0.1, gamma=1, kernel=poly;, score=0.791 total time=   0.0s
[CV 5/5] END .......C=0.1, gamma=1, kernel=poly;, score=0.830 total time=   0.0s
[CV 1/5] END ........C=0.1, gamma=1, kernel=rbf;, score=0.843 total time=   0.0s
[CV 2/5] END ........C=0.1, gamma=1, kernel=r

[CV 1/5] END C=0.6210526315789474, gamma=0.001, kernel=linear;, score=0.843 total time=   0.0s
[CV 2/5] END C=0.6210526315789474, gamma=0.001, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=0.6210526315789474, gamma=0.001, kernel=linear;, score=0.855 total time=   0.0s
[CV 4/5] END C=0.6210526315789474, gamma=0.001, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=0.6210526315789474, gamma=0.001, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=0.6210526315789474, gamma=0.001, kernel=poly;, score=0.843 total time=   0.0s
[CV 2/5] END C=0.6210526315789474, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 3/5] END C=0.6210526315789474, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 4/5] END C=0.6210526315789474, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 5/5] END C=0.6210526315789474, gamma=0.001, kernel=poly;, score=0.843 total time=   0.0s
[CV 1/5] END C=0.6210526315789474, gamma=0.001, kernel=rbf;,

[CV 2/5] END C=1.6631578947368424, gamma=0.1, kernel=rbf;, score=0.847 total time=   0.0s
[CV 3/5] END C=1.6631578947368424, gamma=0.1, kernel=rbf;, score=0.860 total time=   0.0s
[CV 4/5] END C=1.6631578947368424, gamma=0.1, kernel=rbf;, score=0.855 total time=   0.0s
[CV 5/5] END C=1.6631578947368424, gamma=0.1, kernel=rbf;, score=0.847 total time=   0.0s
[CV 1/5] END C=1.6631578947368424, gamma=0.01, kernel=linear;, score=0.843 total time=   0.0s
[CV 2/5] END C=1.6631578947368424, gamma=0.01, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=1.6631578947368424, gamma=0.01, kernel=linear;, score=0.864 total time=   0.0s
[CV 4/5] END C=1.6631578947368424, gamma=0.01, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=1.6631578947368424, gamma=0.01, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=1.6631578947368424, gamma=0.01, kernel=poly;, score=0.843 total time=   0.0s
[CV 2/5] END C=1.6631578947368424, gamma=0.01, kernel=poly;, score=0.847 total

[CV 3/5] END C=2.18421052631579, gamma=0.001, kernel=rbf;, score=0.847 total time=   0.0s
[CV 4/5] END C=2.18421052631579, gamma=0.001, kernel=rbf;, score=0.847 total time=   0.0s
[CV 5/5] END C=2.18421052631579, gamma=0.001, kernel=rbf;, score=0.843 total time=   0.0s
[CV 1/5] END C=2.7052631578947373, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 2/5] END C=2.7052631578947373, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=2.7052631578947373, gamma=1, kernel=linear;, score=0.868 total time=   0.0s
[CV 4/5] END C=2.7052631578947373, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=2.7052631578947373, gamma=1, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=2.7052631578947373, gamma=1, kernel=poly;, score=0.792 total time=   0.0s
[CV 2/5] END C=2.7052631578947373, gamma=1, kernel=poly;, score=0.826 total time=   0.0s
[CV 3/5] END C=2.7052631578947373, gamma=1, kernel=poly;, score=0.830 total time=   0.0s
[CV 4/5]

[CV 5/5] END C=3.2263157894736847, gamma=0.01, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=3.2263157894736847, gamma=0.01, kernel=poly;, score=0.843 total time=   0.0s
[CV 2/5] END C=3.2263157894736847, gamma=0.01, kernel=poly;, score=0.847 total time=   0.0s
[CV 3/5] END C=3.2263157894736847, gamma=0.01, kernel=poly;, score=0.847 total time=   0.0s
[CV 4/5] END C=3.2263157894736847, gamma=0.01, kernel=poly;, score=0.847 total time=   0.0s
[CV 5/5] END C=3.2263157894736847, gamma=0.01, kernel=poly;, score=0.843 total time=   0.0s
[CV 1/5] END C=3.2263157894736847, gamma=0.01, kernel=rbf;, score=0.843 total time=   0.0s
[CV 2/5] END C=3.2263157894736847, gamma=0.01, kernel=rbf;, score=0.847 total time=   0.0s
[CV 3/5] END C=3.2263157894736847, gamma=0.01, kernel=rbf;, score=0.847 total time=   0.0s
[CV 4/5] END C=3.2263157894736847, gamma=0.01, kernel=rbf;, score=0.847 total time=   0.0s
[CV 5/5] END C=3.2263157894736847, gamma=0.01, kernel=rbf;, score=0.843 total time

[CV 4/5] END C=4.268421052631579, gamma=1, kernel=poly;, score=0.787 total time=   0.0s
[CV 5/5] END C=4.268421052631579, gamma=1, kernel=poly;, score=0.791 total time=   0.0s
[CV 1/5] END C=4.268421052631579, gamma=1, kernel=rbf;, score=0.847 total time=   0.0s
[CV 2/5] END C=4.268421052631579, gamma=1, kernel=rbf;, score=0.834 total time=   0.0s
[CV 3/5] END C=4.268421052631579, gamma=1, kernel=rbf;, score=0.872 total time=   0.0s
[CV 4/5] END C=4.268421052631579, gamma=1, kernel=rbf;, score=0.860 total time=   0.0s
[CV 5/5] END C=4.268421052631579, gamma=1, kernel=rbf;, score=0.855 total time=   0.0s
[CV 1/5] END C=4.268421052631579, gamma=0.1, kernel=linear;, score=0.852 total time=   0.0s
[CV 2/5] END C=4.268421052631579, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=4.268421052631579, gamma=0.1, kernel=linear;, score=0.864 total time=   0.0s
[CV 4/5] END C=4.268421052631579, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=4.2684

[CV 3/5] END C=4.7894736842105265, gamma=0.01, kernel=rbf;, score=0.847 total time=   0.0s
[CV 4/5] END C=4.7894736842105265, gamma=0.01, kernel=rbf;, score=0.847 total time=   0.0s
[CV 5/5] END C=4.7894736842105265, gamma=0.01, kernel=rbf;, score=0.843 total time=   0.0s
[CV 1/5] END C=4.7894736842105265, gamma=0.001, kernel=linear;, score=0.852 total time=   0.0s
[CV 2/5] END C=4.7894736842105265, gamma=0.001, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=4.7894736842105265, gamma=0.001, kernel=linear;, score=0.864 total time=   0.0s
[CV 4/5] END C=4.7894736842105265, gamma=0.001, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=4.7894736842105265, gamma=0.001, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=4.7894736842105265, gamma=0.001, kernel=poly;, score=0.843 total time=   0.0s
[CV 2/5] END C=4.7894736842105265, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 3/5] END C=4.7894736842105265, gamma=0.001, kernel=poly;, scor

[CV 1/5] END C=5.831578947368421, gamma=0.1, kernel=linear;, score=0.856 total time=   0.0s
[CV 2/5] END C=5.831578947368421, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=5.831578947368421, gamma=0.1, kernel=linear;, score=0.864 total time=   0.0s
[CV 4/5] END C=5.831578947368421, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=5.831578947368421, gamma=0.1, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=5.831578947368421, gamma=0.1, kernel=poly;, score=0.860 total time=   0.0s
[CV 2/5] END C=5.831578947368421, gamma=0.1, kernel=poly;, score=0.885 total time=   0.0s
[CV 3/5] END C=5.831578947368421, gamma=0.1, kernel=poly;, score=0.868 total time=   0.0s
[CV 4/5] END C=5.831578947368421, gamma=0.1, kernel=poly;, score=0.881 total time=   0.0s
[CV 5/5] END C=5.831578947368421, gamma=0.1, kernel=poly;, score=0.843 total time=   0.0s
[CV 1/5] END C=5.831578947368421, gamma=0.1, kernel=rbf;, score=0.856 total time=   0.0s
[

[CV 5/5] END C=6.352631578947369, gamma=0.001, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=6.352631578947369, gamma=0.001, kernel=poly;, score=0.843 total time=   0.0s
[CV 2/5] END C=6.352631578947369, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 3/5] END C=6.352631578947369, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 4/5] END C=6.352631578947369, gamma=0.001, kernel=poly;, score=0.847 total time=   0.0s
[CV 5/5] END C=6.352631578947369, gamma=0.001, kernel=poly;, score=0.843 total time=   0.0s
[CV 1/5] END C=6.352631578947369, gamma=0.001, kernel=rbf;, score=0.843 total time=   0.0s
[CV 2/5] END C=6.352631578947369, gamma=0.001, kernel=rbf;, score=0.847 total time=   0.0s
[CV 3/5] END C=6.352631578947369, gamma=0.001, kernel=rbf;, score=0.847 total time=   0.0s
[CV 4/5] END C=6.352631578947369, gamma=0.001, kernel=rbf;, score=0.847 total time=   0.0s
[CV 5/5] END C=6.352631578947369, gamma=0.001, kernel=rbf;, score=0.843 total time

[CV 4/5] END C=7.394736842105264, gamma=0.1, kernel=poly;, score=0.877 total time=   0.0s
[CV 5/5] END C=7.394736842105264, gamma=0.1, kernel=poly;, score=0.834 total time=   0.0s
[CV 1/5] END C=7.394736842105264, gamma=0.1, kernel=rbf;, score=0.852 total time=   0.0s
[CV 2/5] END C=7.394736842105264, gamma=0.1, kernel=rbf;, score=0.885 total time=   0.0s
[CV 3/5] END C=7.394736842105264, gamma=0.1, kernel=rbf;, score=0.864 total time=   0.0s
[CV 4/5] END C=7.394736842105264, gamma=0.1, kernel=rbf;, score=0.872 total time=   0.0s
[CV 5/5] END C=7.394736842105264, gamma=0.1, kernel=rbf;, score=0.847 total time=   0.0s
[CV 1/5] END C=7.394736842105264, gamma=0.01, kernel=linear;, score=0.856 total time=   0.0s
[CV 2/5] END C=7.394736842105264, gamma=0.01, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=7.394736842105264, gamma=0.01, kernel=linear;, score=0.868 total time=   0.0s
[CV 4/5] END C=7.394736842105264, gamma=0.01, kernel=linear;, score=0.847 total time=   0.0s
[CV

[CV 1/5] END C=8.436842105263159, gamma=1, kernel=linear;, score=0.852 total time=   0.0s
[CV 2/5] END C=8.436842105263159, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END C=8.436842105263159, gamma=1, kernel=linear;, score=0.864 total time=   0.0s
[CV 4/5] END C=8.436842105263159, gamma=1, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=8.436842105263159, gamma=1, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=8.436842105263159, gamma=1, kernel=poly;, score=0.792 total time=   0.0s
[CV 2/5] END C=8.436842105263159, gamma=1, kernel=poly;, score=0.826 total time=   0.0s
[CV 3/5] END C=8.436842105263159, gamma=1, kernel=poly;, score=0.830 total time=   0.0s
[CV 4/5] END C=8.436842105263159, gamma=1, kernel=poly;, score=0.787 total time=   0.0s
[CV 5/5] END C=8.436842105263159, gamma=1, kernel=poly;, score=0.791 total time=   0.0s
[CV 1/5] END C=8.436842105263159, gamma=1, kernel=rbf;, score=0.847 total time=   0.0s
[CV 2/5] END C=8.436842

[CV 3/5] END C=8.957894736842105, gamma=0.01, kernel=linear;, score=0.860 total time=   0.0s
[CV 4/5] END C=8.957894736842105, gamma=0.01, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END C=8.957894736842105, gamma=0.01, kernel=linear;, score=0.855 total time=   0.0s
[CV 1/5] END C=8.957894736842105, gamma=0.01, kernel=poly;, score=0.843 total time=   0.0s
[CV 2/5] END C=8.957894736842105, gamma=0.01, kernel=poly;, score=0.847 total time=   0.0s
[CV 3/5] END C=8.957894736842105, gamma=0.01, kernel=poly;, score=0.847 total time=   0.0s
[CV 4/5] END C=8.957894736842105, gamma=0.01, kernel=poly;, score=0.847 total time=   0.0s
[CV 5/5] END C=8.957894736842105, gamma=0.01, kernel=poly;, score=0.843 total time=   0.0s
[CV 1/5] END C=8.957894736842105, gamma=0.01, kernel=rbf;, score=0.843 total time=   0.0s
[CV 2/5] END C=8.957894736842105, gamma=0.01, kernel=rbf;, score=0.847 total time=   0.0s
[CV 3/5] END C=8.957894736842105, gamma=0.01, kernel=rbf;, score=0.847 total time=   0

[CV 3/5] END ......C=10.0, gamma=1, kernel=poly;, score=0.830 total time=   0.0s
[CV 4/5] END ......C=10.0, gamma=1, kernel=poly;, score=0.787 total time=   0.0s
[CV 5/5] END ......C=10.0, gamma=1, kernel=poly;, score=0.791 total time=   0.0s
[CV 1/5] END .......C=10.0, gamma=1, kernel=rbf;, score=0.847 total time=   0.0s
[CV 2/5] END .......C=10.0, gamma=1, kernel=rbf;, score=0.834 total time=   0.0s
[CV 3/5] END .......C=10.0, gamma=1, kernel=rbf;, score=0.872 total time=   0.0s
[CV 4/5] END .......C=10.0, gamma=1, kernel=rbf;, score=0.860 total time=   0.0s
[CV 5/5] END .......C=10.0, gamma=1, kernel=rbf;, score=0.855 total time=   0.0s
[CV 1/5] END ..C=10.0, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 2/5] END ..C=10.0, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 3/5] END ..C=10.0, gamma=0.1, kernel=linear;, score=0.860 total time=   0.0s
[CV 4/5] END ..C=10.0, gamma=0.1, kernel=linear;, score=0.847 total time=   0.0s
[CV 5/5] END ..C=10.0, gamma

GridSearchCV(cv=5, estimator=SVC(),
             param_grid={'C': array([ 0.1       ,  0.62105263,  1.14210526,  1.66315789,  2.18421053,
        2.70526316,  3.22631579,  3.74736842,  4.26842105,  4.78947368,
        5.31052632,  5.83157895,  6.35263158,  6.87368421,  7.39473684,
        7.91578947,  8.43684211,  8.95789474,  9.47894737, 10.        ]),
                         'gamma': [1, 0.1, 0.01, 0.001],
                         'kernel': ['linear', 'poly', 'rbf']},
             verbose=3)

In [57]:
print(grid.best_params_)

{'C': 8.957894736842105, 'gamma': 0.1, 'kernel': 'rbf'}


In [58]:
from sklearn.model_selection import GridSearchCV
param_grid = {'n_estimators':list(range(10,101,10)), 'max_depth' : list(range(5,20,5))}

In [59]:
grid = GridSearchCV(RandomForestClassifier(), param_grid, refit = True, verbose=3, cv=5)
grid.fit(X_train, y_train)

Fitting 5 folds for each of 30 candidates, totalling 150 fits
[CV 1/5] END ......max_depth=5, n_estimators=10;, score=0.843 total time=   0.0s
[CV 2/5] END ......max_depth=5, n_estimators=10;, score=0.847 total time=   0.0s
[CV 3/5] END ......max_depth=5, n_estimators=10;, score=0.855 total time=   0.0s
[CV 4/5] END ......max_depth=5, n_estimators=10;, score=0.847 total time=   0.0s
[CV 5/5] END ......max_depth=5, n_estimators=10;, score=0.834 total time=   0.0s
[CV 1/5] END ......max_depth=5, n_estimators=20;, score=0.860 total time=   0.0s
[CV 2/5] END ......max_depth=5, n_estimators=20;, score=0.855 total time=   0.0s
[CV 3/5] END ......max_depth=5, n_estimators=20;, score=0.855 total time=   0.0s
[CV 4/5] END ......max_depth=5, n_estimators=20;, score=0.847 total time=   0.0s
[CV 5/5] END ......max_depth=5, n_estimators=20;, score=0.843 total time=   0.0s
[CV 1/5] END ......max_depth=5, n_estimators=30;, score=0.852 total time=   0.0s
[CV 2/5] END ......max_depth=5, n_estimators=30

[CV 3/5] END .....max_depth=15, n_estimators=10;, score=0.855 total time=   0.0s
[CV 4/5] END .....max_depth=15, n_estimators=10;, score=0.855 total time=   0.0s
[CV 5/5] END .....max_depth=15, n_estimators=10;, score=0.843 total time=   0.0s
[CV 1/5] END .....max_depth=15, n_estimators=20;, score=0.852 total time=   0.0s
[CV 2/5] END .....max_depth=15, n_estimators=20;, score=0.855 total time=   0.0s
[CV 3/5] END .....max_depth=15, n_estimators=20;, score=0.864 total time=   0.0s
[CV 4/5] END .....max_depth=15, n_estimators=20;, score=0.847 total time=   0.0s
[CV 5/5] END .....max_depth=15, n_estimators=20;, score=0.860 total time=   0.0s
[CV 1/5] END .....max_depth=15, n_estimators=30;, score=0.860 total time=   0.0s
[CV 2/5] END .....max_depth=15, n_estimators=30;, score=0.855 total time=   0.0s
[CV 3/5] END .....max_depth=15, n_estimators=30;, score=0.868 total time=   0.0s
[CV 4/5] END .....max_depth=15, n_estimators=30;, score=0.860 total time=   0.0s
[CV 5/5] END .....max_depth=

GridSearchCV(cv=5, estimator=RandomForestClassifier(),
             param_grid={'max_depth': [5, 10, 15],
                         'n_estimators': [10, 20, 30, 40, 50, 60, 70, 80, 90,
                                          100]},
             verbose=3)

In [60]:
print(grid.best_params_)

{'max_depth': 10, 'n_estimators': 60}


In [61]:
from sklearn.model_selection import GridSearchCV
param_grid = {'C' : np.linspace(1, 10, 20), 'solver' : ['liblinear'], 'penalty' : ['l1', 'l2']}

In [62]:
grid = GridSearchCV(LogisticRegression(), param_grid, refit = True, verbose=3, cv=5)
grid.fit(X_train, y_train)

Fitting 5 folds for each of 40 candidates, totalling 200 fits
[CV 1/5] END C=1.0, penalty=l1, solver=liblinear;, score=0.860 total time=   0.0s
[CV 2/5] END C=1.0, penalty=l1, solver=liblinear;, score=0.864 total time=   0.0s
[CV 3/5] END C=1.0, penalty=l1, solver=liblinear;, score=0.877 total time=   0.0s
[CV 4/5] END C=1.0, penalty=l1, solver=liblinear;, score=0.872 total time=   0.0s
[CV 5/5] END C=1.0, penalty=l1, solver=liblinear;, score=0.860 total time=   0.0s
[CV 1/5] END C=1.0, penalty=l2, solver=liblinear;, score=0.856 total time=   0.0s
[CV 2/5] END C=1.0, penalty=l2, solver=liblinear;, score=0.872 total time=   0.0s
[CV 3/5] END C=1.0, penalty=l2, solver=liblinear;, score=0.877 total time=   0.0s
[CV 4/5] END C=1.0, penalty=l2, solver=liblinear;, score=0.881 total time=   0.0s
[CV 5/5] END C=1.0, penalty=l2, solver=liblinear;, score=0.860 total time=   0.0s
[CV 1/5] END C=1.4736842105263157, penalty=l1, solver=liblinear;, score=0.856 total time=   0.0s
[CV 2/5] END C=1.4736

[CV 2/5] END C=4.789473684210526, penalty=l2, solver=liblinear;, score=0.877 total time=   0.0s
[CV 3/5] END C=4.789473684210526, penalty=l2, solver=liblinear;, score=0.860 total time=   0.0s
[CV 4/5] END C=4.789473684210526, penalty=l2, solver=liblinear;, score=0.889 total time=   0.0s
[CV 5/5] END C=4.789473684210526, penalty=l2, solver=liblinear;, score=0.864 total time=   0.0s
[CV 1/5] END C=5.263157894736842, penalty=l1, solver=liblinear;, score=0.852 total time=   0.0s
[CV 2/5] END C=5.263157894736842, penalty=l1, solver=liblinear;, score=0.877 total time=   0.0s
[CV 3/5] END C=5.263157894736842, penalty=l1, solver=liblinear;, score=0.864 total time=   0.0s
[CV 4/5] END C=5.263157894736842, penalty=l1, solver=liblinear;, score=0.889 total time=   0.0s
[CV 5/5] END C=5.263157894736842, penalty=l1, solver=liblinear;, score=0.864 total time=   0.0s
[CV 1/5] END C=5.263157894736842, penalty=l2, solver=liblinear;, score=0.852 total time=   0.0s
[CV 2/5] END C=5.263157894736842, penalt

[CV 3/5] END C=10.0, penalty=l1, solver=liblinear;, score=0.860 total time=   0.0s
[CV 4/5] END C=10.0, penalty=l1, solver=liblinear;, score=0.894 total time=   0.0s
[CV 5/5] END C=10.0, penalty=l1, solver=liblinear;, score=0.864 total time=   0.0s
[CV 1/5] END C=10.0, penalty=l2, solver=liblinear;, score=0.843 total time=   0.0s
[CV 2/5] END C=10.0, penalty=l2, solver=liblinear;, score=0.881 total time=   0.0s
[CV 3/5] END C=10.0, penalty=l2, solver=liblinear;, score=0.864 total time=   0.0s
[CV 4/5] END C=10.0, penalty=l2, solver=liblinear;, score=0.894 total time=   0.0s
[CV 5/5] END C=10.0, penalty=l2, solver=liblinear;, score=0.860 total time=   0.0s


GridSearchCV(cv=5, estimator=LogisticRegression(),
             param_grid={'C': array([ 1.        ,  1.47368421,  1.94736842,  2.42105263,  2.89473684,
        3.36842105,  3.84210526,  4.31578947,  4.78947368,  5.26315789,
        5.73684211,  6.21052632,  6.68421053,  7.15789474,  7.63157895,
        8.10526316,  8.57894737,  9.05263158,  9.52631579, 10.        ]),
                         'penalty': ['l1', 'l2'], 'solver': ['liblinear']},
             verbose=3)

In [63]:
print(grid.best_params_)

{'C': 7.63157894736842, 'penalty': 'l1', 'solver': 'liblinear'}


In [64]:
from sklearn.model_selection import GridSearchCV
param_grid = {'n_estimators' : list(range(10,101,10)), 'learning_rate' : np.linspace(0.1, 10, 50)}

In [65]:
grid = GridSearchCV(GradientBoostingClassifier(), param_grid, refit = True, verbose=3, cv=5)
grid.fit(X_train, y_train)

Fitting 5 folds for each of 500 candidates, totalling 2500 fits
[CV 1/5] END learning_rate=0.1, n_estimators=10;, score=0.843 total time=   0.0s
[CV 2/5] END learning_rate=0.1, n_estimators=10;, score=0.851 total time=   0.0s
[CV 3/5] END learning_rate=0.1, n_estimators=10;, score=0.851 total time=   0.0s
[CV 4/5] END learning_rate=0.1, n_estimators=10;, score=0.851 total time=   0.0s
[CV 5/5] END learning_rate=0.1, n_estimators=10;, score=0.847 total time=   0.0s
[CV 1/5] END learning_rate=0.1, n_estimators=20;, score=0.860 total time=   0.0s
[CV 2/5] END learning_rate=0.1, n_estimators=20;, score=0.860 total time=   0.0s
[CV 3/5] END learning_rate=0.1, n_estimators=20;, score=0.860 total time=   0.0s
[CV 4/5] END learning_rate=0.1, n_estimators=20;, score=0.864 total time=   0.0s
[CV 5/5] END learning_rate=0.1, n_estimators=20;, score=0.843 total time=   0.0s
[CV 1/5] END learning_rate=0.1, n_estimators=30;, score=0.860 total time=   0.0s
[CV 2/5] END learning_rate=0.1, n_estimators=

[CV 4/5] END learning_rate=0.3020408163265306, n_estimators=90;, score=0.877 total time=   0.1s
[CV 5/5] END learning_rate=0.3020408163265306, n_estimators=90;, score=0.830 total time=   0.1s
[CV 1/5] END learning_rate=0.3020408163265306, n_estimators=100;, score=0.847 total time=   0.2s
[CV 2/5] END learning_rate=0.3020408163265306, n_estimators=100;, score=0.864 total time=   0.2s
[CV 3/5] END learning_rate=0.3020408163265306, n_estimators=100;, score=0.868 total time=   0.2s
[CV 4/5] END learning_rate=0.3020408163265306, n_estimators=100;, score=0.872 total time=   0.2s
[CV 5/5] END learning_rate=0.3020408163265306, n_estimators=100;, score=0.838 total time=   0.1s
[CV 1/5] END learning_rate=0.5040816326530613, n_estimators=10;, score=0.860 total time=   0.0s
[CV 2/5] END learning_rate=0.5040816326530613, n_estimators=10;, score=0.851 total time=   0.0s
[CV 3/5] END learning_rate=0.5040816326530613, n_estimators=10;, score=0.851 total time=   0.0s
[CV 4/5] END learning_rate=0.504081

[CV 1/5] END learning_rate=0.7061224489795919, n_estimators=70;, score=0.860 total time=   0.1s
[CV 2/5] END learning_rate=0.7061224489795919, n_estimators=70;, score=0.868 total time=   0.1s
[CV 3/5] END learning_rate=0.7061224489795919, n_estimators=70;, score=0.851 total time=   0.1s
[CV 4/5] END learning_rate=0.7061224489795919, n_estimators=70;, score=0.864 total time=   0.1s
[CV 5/5] END learning_rate=0.7061224489795919, n_estimators=70;, score=0.830 total time=   0.1s
[CV 1/5] END learning_rate=0.7061224489795919, n_estimators=80;, score=0.881 total time=   0.1s
[CV 2/5] END learning_rate=0.7061224489795919, n_estimators=80;, score=0.877 total time=   0.1s
[CV 3/5] END learning_rate=0.7061224489795919, n_estimators=80;, score=0.847 total time=   0.1s
[CV 4/5] END learning_rate=0.7061224489795919, n_estimators=80;, score=0.855 total time=   0.1s
[CV 5/5] END learning_rate=0.7061224489795919, n_estimators=80;, score=0.834 total time=   0.1s
[CV 1/5] END learning_rate=0.70612244897

[CV 2/5] END learning_rate=1.1102040816326533, n_estimators=40;, score=0.809 total time=   0.0s
[CV 3/5] END learning_rate=1.1102040816326533, n_estimators=40;, score=0.864 total time=   0.0s
[CV 4/5] END learning_rate=1.1102040816326533, n_estimators=40;, score=0.838 total time=   0.0s
[CV 5/5] END learning_rate=1.1102040816326533, n_estimators=40;, score=0.838 total time=   0.0s
[CV 1/5] END learning_rate=1.1102040816326533, n_estimators=50;, score=0.826 total time=   0.0s
[CV 2/5] END learning_rate=1.1102040816326533, n_estimators=50;, score=0.834 total time=   0.0s
[CV 3/5] END learning_rate=1.1102040816326533, n_estimators=50;, score=0.855 total time=   0.0s
[CV 4/5] END learning_rate=1.1102040816326533, n_estimators=50;, score=0.830 total time=   0.0s
[CV 5/5] END learning_rate=1.1102040816326533, n_estimators=50;, score=0.838 total time=   0.0s
[CV 1/5] END learning_rate=1.1102040816326533, n_estimators=60;, score=0.822 total time=   0.0s
[CV 2/5] END learning_rate=1.11020408163

[CV 2/5] END learning_rate=1.5142857142857145, n_estimators=20;, score=0.826 total time=   0.0s
[CV 3/5] END learning_rate=1.5142857142857145, n_estimators=20;, score=0.826 total time=   0.0s
[CV 4/5] END learning_rate=1.5142857142857145, n_estimators=20;, score=0.804 total time=   0.0s
[CV 5/5] END learning_rate=1.5142857142857145, n_estimators=20;, score=0.787 total time=   0.0s
[CV 1/5] END learning_rate=1.5142857142857145, n_estimators=30;, score=0.835 total time=   0.0s
[CV 2/5] END learning_rate=1.5142857142857145, n_estimators=30;, score=0.809 total time=   0.0s
[CV 3/5] END learning_rate=1.5142857142857145, n_estimators=30;, score=0.830 total time=   0.0s
[CV 4/5] END learning_rate=1.5142857142857145, n_estimators=30;, score=0.817 total time=   0.0s
[CV 5/5] END learning_rate=1.5142857142857145, n_estimators=30;, score=0.800 total time=   0.0s
[CV 1/5] END learning_rate=1.5142857142857145, n_estimators=40;, score=0.839 total time=   0.0s
[CV 2/5] END learning_rate=1.51428571428

[CV 3/5] END learning_rate=1.716326530612245, n_estimators=90;, score=0.689 total time=   0.1s
[CV 4/5] END learning_rate=1.716326530612245, n_estimators=90;, score=0.664 total time=   0.1s
[CV 5/5] END learning_rate=1.716326530612245, n_estimators=90;, score=0.779 total time=   0.1s
[CV 1/5] END learning_rate=1.716326530612245, n_estimators=100;, score=0.754 total time=   0.2s
[CV 2/5] END learning_rate=1.716326530612245, n_estimators=100;, score=0.613 total time=   0.2s
[CV 3/5] END learning_rate=1.716326530612245, n_estimators=100;, score=0.689 total time=   0.2s
[CV 4/5] END learning_rate=1.716326530612245, n_estimators=100;, score=0.660 total time=   0.2s
[CV 5/5] END learning_rate=1.716326530612245, n_estimators=100;, score=0.779 total time=   0.2s
[CV 1/5] END learning_rate=1.9183673469387756, n_estimators=10;, score=0.572 total time=   0.0s
[CV 2/5] END learning_rate=1.9183673469387756, n_estimators=10;, score=0.843 total time=   0.0s
[CV 3/5] END learning_rate=1.91836734693877

[CV 5/5] END learning_rate=2.1204081632653065, n_estimators=60;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=2.1204081632653065, n_estimators=70;, score=0.572 total time=   0.1s
[CV 2/5] END learning_rate=2.1204081632653065, n_estimators=70;, score=0.294 total time=   0.1s
[CV 3/5] END learning_rate=2.1204081632653065, n_estimators=70;, score=0.694 total time=   0.1s
[CV 4/5] END learning_rate=2.1204081632653065, n_estimators=70;, score=0.549 total time=   0.1s
[CV 5/5] END learning_rate=2.1204081632653065, n_estimators=70;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=2.1204081632653065, n_estimators=80;, score=0.572 total time=   0.1s
[CV 2/5] END learning_rate=2.1204081632653065, n_estimators=80;, score=0.294 total time=   0.1s
[CV 3/5] END learning_rate=2.1204081632653065, n_estimators=80;, score=0.694 total time=   0.1s
[CV 4/5] END learning_rate=2.1204081632653065, n_estimators=80;, score=0.549 total time=   0.1s
[CV 5/5] END learning_rate=2.12040816326

[CV 2/5] END learning_rate=2.5244897959183676, n_estimators=40;, score=0.187 total time=   0.0s
[CV 3/5] END learning_rate=2.5244897959183676, n_estimators=40;, score=0.404 total time=   0.0s
[CV 4/5] END learning_rate=2.5244897959183676, n_estimators=40;, score=0.357 total time=   0.0s
[CV 5/5] END learning_rate=2.5244897959183676, n_estimators=40;, score=0.498 total time=   0.0s
[CV 1/5] END learning_rate=2.5244897959183676, n_estimators=50;, score=0.720 total time=   0.0s
[CV 2/5] END learning_rate=2.5244897959183676, n_estimators=50;, score=0.187 total time=   0.0s
[CV 3/5] END learning_rate=2.5244897959183676, n_estimators=50;, score=0.404 total time=   0.0s
[CV 4/5] END learning_rate=2.5244897959183676, n_estimators=50;, score=0.357 total time=   0.0s
[CV 5/5] END learning_rate=2.5244897959183676, n_estimators=50;, score=0.498 total time=   0.0s
[CV 1/5] END learning_rate=2.5244897959183676, n_estimators=60;, score=0.720 total time=   0.1s
[CV 2/5] END learning_rate=2.52448979591

[CV 2/5] END learning_rate=2.928571428571429, n_estimators=20;, score=0.804 total time=   0.0s
[CV 3/5] END learning_rate=2.928571428571429, n_estimators=20;, score=0.238 total time=   0.0s
[CV 4/5] END learning_rate=2.928571428571429, n_estimators=20;, score=0.191 total time=   0.0s
[CV 5/5] END learning_rate=2.928571428571429, n_estimators=20;, score=0.243 total time=   0.0s
[CV 1/5] END learning_rate=2.928571428571429, n_estimators=30;, score=0.292 total time=   0.0s
[CV 2/5] END learning_rate=2.928571428571429, n_estimators=30;, score=0.804 total time=   0.0s
[CV 3/5] END learning_rate=2.928571428571429, n_estimators=30;, score=0.238 total time=   0.0s
[CV 4/5] END learning_rate=2.928571428571429, n_estimators=30;, score=0.191 total time=   0.0s
[CV 5/5] END learning_rate=2.928571428571429, n_estimators=30;, score=0.243 total time=   0.0s
[CV 1/5] END learning_rate=2.928571428571429, n_estimators=40;, score=0.292 total time=   0.0s
[CV 2/5] END learning_rate=2.928571428571429, n_es

[CV 3/5] END learning_rate=3.1306122448979594, n_estimators=90;, score=0.400 total time=   0.1s
[CV 4/5] END learning_rate=3.1306122448979594, n_estimators=90;, score=0.281 total time=   0.1s
[CV 5/5] END learning_rate=3.1306122448979594, n_estimators=90;, score=0.455 total time=   0.1s
[CV 1/5] END learning_rate=3.1306122448979594, n_estimators=100;, score=0.784 total time=   0.2s
[CV 2/5] END learning_rate=3.1306122448979594, n_estimators=100;, score=0.719 total time=   0.2s
[CV 3/5] END learning_rate=3.1306122448979594, n_estimators=100;, score=0.400 total time=   0.2s
[CV 4/5] END learning_rate=3.1306122448979594, n_estimators=100;, score=0.281 total time=   0.1s
[CV 5/5] END learning_rate=3.1306122448979594, n_estimators=100;, score=0.455 total time=   0.2s
[CV 1/5] END learning_rate=3.33265306122449, n_estimators=10;, score=0.322 total time=   0.0s
[CV 2/5] END learning_rate=3.33265306122449, n_estimators=10;, score=0.191 total time=   0.0s
[CV 3/5] END learning_rate=3.3326530612

[CV 5/5] END learning_rate=3.5346938775510206, n_estimators=60;, score=0.753 total time=   0.1s
[CV 1/5] END learning_rate=3.5346938775510206, n_estimators=70;, score=0.157 total time=   0.1s
[CV 2/5] END learning_rate=3.5346938775510206, n_estimators=70;, score=0.677 total time=   0.1s
[CV 3/5] END learning_rate=3.5346938775510206, n_estimators=70;, score=0.660 total time=   0.1s
[CV 4/5] END learning_rate=3.5346938775510206, n_estimators=70;, score=0.187 total time=   0.1s
[CV 5/5] END learning_rate=3.5346938775510206, n_estimators=70;, score=0.753 total time=   0.1s
[CV 1/5] END learning_rate=3.5346938775510206, n_estimators=80;, score=0.157 total time=   0.1s
[CV 2/5] END learning_rate=3.5346938775510206, n_estimators=80;, score=0.677 total time=   0.1s
[CV 3/5] END learning_rate=3.5346938775510206, n_estimators=80;, score=0.660 total time=   0.1s
[CV 4/5] END learning_rate=3.5346938775510206, n_estimators=80;, score=0.187 total time=   0.1s
[CV 5/5] END learning_rate=3.53469387755

[CV 2/5] END learning_rate=3.938775510204082, n_estimators=40;, score=0.766 total time=   0.0s
[CV 3/5] END learning_rate=3.938775510204082, n_estimators=40;, score=0.157 total time=   0.0s
[CV 4/5] END learning_rate=3.938775510204082, n_estimators=40;, score=0.838 total time=   0.0s
[CV 5/5] END learning_rate=3.938775510204082, n_estimators=40;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=3.938775510204082, n_estimators=50;, score=0.288 total time=   0.0s
[CV 2/5] END learning_rate=3.938775510204082, n_estimators=50;, score=0.766 total time=   0.0s
[CV 3/5] END learning_rate=3.938775510204082, n_estimators=50;, score=0.157 total time=   0.0s
[CV 4/5] END learning_rate=3.938775510204082, n_estimators=50;, score=0.838 total time=   0.0s
[CV 5/5] END learning_rate=3.938775510204082, n_estimators=50;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=3.938775510204082, n_estimators=60;, score=0.288 total time=   0.1s
[CV 2/5] END learning_rate=3.938775510204082, n_es

[CV 2/5] END learning_rate=4.3428571428571425, n_estimators=20;, score=0.821 total time=   0.0s
[CV 3/5] END learning_rate=4.3428571428571425, n_estimators=20;, score=0.153 total time=   0.0s
[CV 4/5] END learning_rate=4.3428571428571425, n_estimators=20;, score=0.336 total time=   0.0s
[CV 5/5] END learning_rate=4.3428571428571425, n_estimators=20;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=4.3428571428571425, n_estimators=30;, score=0.818 total time=   0.0s
[CV 2/5] END learning_rate=4.3428571428571425, n_estimators=30;, score=0.821 total time=   0.0s
[CV 3/5] END learning_rate=4.3428571428571425, n_estimators=30;, score=0.153 total time=   0.0s
[CV 4/5] END learning_rate=4.3428571428571425, n_estimators=30;, score=0.336 total time=   0.0s
[CV 5/5] END learning_rate=4.3428571428571425, n_estimators=30;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=4.3428571428571425, n_estimators=40;, score=0.818 total time=   0.0s
[CV 2/5] END learning_rate=4.34285714285

[CV 3/5] END learning_rate=4.544897959183674, n_estimators=90;, score=0.749 total time=   0.1s
[CV 4/5] END learning_rate=4.544897959183674, n_estimators=90;, score=0.609 total time=   0.1s
[CV 5/5] END learning_rate=4.544897959183674, n_estimators=90;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=4.544897959183674, n_estimators=100;, score=0.818 total time=   0.2s
[CV 2/5] END learning_rate=4.544897959183674, n_estimators=100;, score=0.821 total time=   0.2s
[CV 3/5] END learning_rate=4.544897959183674, n_estimators=100;, score=0.749 total time=   0.2s
[CV 4/5] END learning_rate=4.544897959183674, n_estimators=100;, score=0.609 total time=   0.2s
[CV 5/5] END learning_rate=4.544897959183674, n_estimators=100;, score=0.728 total time=   0.2s
[CV 1/5] END learning_rate=4.746938775510204, n_estimators=10;, score=0.818 total time=   0.0s
[CV 2/5] END learning_rate=4.746938775510204, n_estimators=10;, score=0.821 total time=   0.0s
[CV 3/5] END learning_rate=4.746938775510204,

[CV 5/5] END learning_rate=4.948979591836735, n_estimators=60;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=4.948979591836735, n_estimators=70;, score=0.818 total time=   0.1s
[CV 2/5] END learning_rate=4.948979591836735, n_estimators=70;, score=0.834 total time=   0.1s
[CV 3/5] END learning_rate=4.948979591836735, n_estimators=70;, score=0.170 total time=   0.1s
[CV 4/5] END learning_rate=4.948979591836735, n_estimators=70;, score=0.230 total time=   0.1s
[CV 5/5] END learning_rate=4.948979591836735, n_estimators=70;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=4.948979591836735, n_estimators=80;, score=0.818 total time=   0.1s
[CV 2/5] END learning_rate=4.948979591836735, n_estimators=80;, score=0.834 total time=   0.1s
[CV 3/5] END learning_rate=4.948979591836735, n_estimators=80;, score=0.170 total time=   0.1s
[CV 4/5] END learning_rate=4.948979591836735, n_estimators=80;, score=0.230 total time=   0.1s
[CV 5/5] END learning_rate=4.948979591836735, n_es

[CV 2/5] END learning_rate=5.353061224489796, n_estimators=40;, score=0.847 total time=   0.0s
[CV 3/5] END learning_rate=5.353061224489796, n_estimators=40;, score=0.251 total time=   0.0s
[CV 4/5] END learning_rate=5.353061224489796, n_estimators=40;, score=0.804 total time=   0.0s
[CV 5/5] END learning_rate=5.353061224489796, n_estimators=40;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=5.353061224489796, n_estimators=50;, score=0.818 total time=   0.0s
[CV 2/5] END learning_rate=5.353061224489796, n_estimators=50;, score=0.847 total time=   0.0s
[CV 3/5] END learning_rate=5.353061224489796, n_estimators=50;, score=0.251 total time=   0.0s
[CV 4/5] END learning_rate=5.353061224489796, n_estimators=50;, score=0.804 total time=   0.0s
[CV 5/5] END learning_rate=5.353061224489796, n_estimators=50;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=5.353061224489796, n_estimators=60;, score=0.818 total time=   0.1s
[CV 2/5] END learning_rate=5.353061224489796, n_es

[CV 2/5] END learning_rate=5.757142857142857, n_estimators=20;, score=0.851 total time=   0.0s
[CV 3/5] END learning_rate=5.757142857142857, n_estimators=20;, score=0.157 total time=   0.0s
[CV 4/5] END learning_rate=5.757142857142857, n_estimators=20;, score=0.285 total time=   0.0s
[CV 5/5] END learning_rate=5.757142857142857, n_estimators=20;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=5.757142857142857, n_estimators=30;, score=0.708 total time=   0.0s
[CV 2/5] END learning_rate=5.757142857142857, n_estimators=30;, score=0.851 total time=   0.0s
[CV 3/5] END learning_rate=5.757142857142857, n_estimators=30;, score=0.157 total time=   0.0s
[CV 4/5] END learning_rate=5.757142857142857, n_estimators=30;, score=0.285 total time=   0.0s
[CV 5/5] END learning_rate=5.757142857142857, n_estimators=30;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=5.757142857142857, n_estimators=40;, score=0.708 total time=   0.0s
[CV 2/5] END learning_rate=5.757142857142857, n_es

[CV 4/5] END learning_rate=5.959183673469387, n_estimators=90;, score=0.285 total time=   0.1s
[CV 5/5] END learning_rate=5.959183673469387, n_estimators=90;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=5.959183673469387, n_estimators=100;, score=0.157 total time=   0.1s
[CV 2/5] END learning_rate=5.959183673469387, n_estimators=100;, score=0.851 total time=   0.2s
[CV 3/5] END learning_rate=5.959183673469387, n_estimators=100;, score=0.174 total time=   0.1s
[CV 4/5] END learning_rate=5.959183673469387, n_estimators=100;, score=0.285 total time=   0.2s
[CV 5/5] END learning_rate=5.959183673469387, n_estimators=100;, score=0.728 total time=   0.2s
[CV 1/5] END learning_rate=6.161224489795918, n_estimators=10;, score=0.157 total time=   0.0s
[CV 2/5] END learning_rate=6.161224489795918, n_estimators=10;, score=0.770 total time=   0.0s
[CV 3/5] END learning_rate=6.161224489795918, n_estimators=10;, score=0.174 total time=   0.0s
[CV 4/5] END learning_rate=6.161224489795918,

[CV 1/5] END learning_rate=6.3632653061224485, n_estimators=70;, score=0.157 total time=   0.1s
[CV 2/5] END learning_rate=6.3632653061224485, n_estimators=70;, score=0.770 total time=   0.1s
[CV 3/5] END learning_rate=6.3632653061224485, n_estimators=70;, score=0.174 total time=   0.1s
[CV 4/5] END learning_rate=6.3632653061224485, n_estimators=70;, score=0.285 total time=   0.1s
[CV 5/5] END learning_rate=6.3632653061224485, n_estimators=70;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=6.3632653061224485, n_estimators=80;, score=0.157 total time=   0.1s
[CV 2/5] END learning_rate=6.3632653061224485, n_estimators=80;, score=0.770 total time=   0.1s
[CV 3/5] END learning_rate=6.3632653061224485, n_estimators=80;, score=0.174 total time=   0.1s
[CV 4/5] END learning_rate=6.3632653061224485, n_estimators=80;, score=0.285 total time=   0.1s
[CV 5/5] END learning_rate=6.3632653061224485, n_estimators=80;, score=0.728 total time=   0.1s
[CV 1/5] END learning_rate=6.36326530612

[CV 2/5] END learning_rate=6.7673469387755105, n_estimators=40;, score=0.745 total time=   0.0s
[CV 3/5] END learning_rate=6.7673469387755105, n_estimators=40;, score=0.264 total time=   0.0s
[CV 4/5] END learning_rate=6.7673469387755105, n_estimators=40;, score=0.281 total time=   0.0s
[CV 5/5] END learning_rate=6.7673469387755105, n_estimators=40;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=6.7673469387755105, n_estimators=50;, score=0.157 total time=   0.0s
[CV 2/5] END learning_rate=6.7673469387755105, n_estimators=50;, score=0.745 total time=   0.0s
[CV 3/5] END learning_rate=6.7673469387755105, n_estimators=50;, score=0.264 total time=   0.0s
[CV 4/5] END learning_rate=6.7673469387755105, n_estimators=50;, score=0.281 total time=   0.0s
[CV 5/5] END learning_rate=6.7673469387755105, n_estimators=50;, score=0.728 total time=   0.0s
[CV 1/5] END learning_rate=6.7673469387755105, n_estimators=60;, score=0.157 total time=   0.1s
[CV 2/5] END learning_rate=6.76734693877

[CV 2/5] END learning_rate=7.171428571428572, n_estimators=20;, score=0.745 total time=   0.0s
[CV 3/5] END learning_rate=7.171428571428572, n_estimators=20;, score=0.149 total time=   0.0s
[CV 4/5] END learning_rate=7.171428571428572, n_estimators=20;, score=0.157 total time=   0.0s
[CV 5/5] END learning_rate=7.171428571428572, n_estimators=20;, score=0.285 total time=   0.0s
[CV 1/5] END learning_rate=7.171428571428572, n_estimators=30;, score=0.157 total time=   0.0s
[CV 2/5] END learning_rate=7.171428571428572, n_estimators=30;, score=0.745 total time=   0.0s
[CV 3/5] END learning_rate=7.171428571428572, n_estimators=30;, score=0.149 total time=   0.0s
[CV 4/5] END learning_rate=7.171428571428572, n_estimators=30;, score=0.157 total time=   0.0s
[CV 5/5] END learning_rate=7.171428571428572, n_estimators=30;, score=0.285 total time=   0.0s
[CV 1/5] END learning_rate=7.171428571428572, n_estimators=40;, score=0.157 total time=   0.0s
[CV 2/5] END learning_rate=7.171428571428572, n_es

[CV 4/5] END learning_rate=7.373469387755102, n_estimators=90;, score=0.166 total time=   0.1s
[CV 5/5] END learning_rate=7.373469387755102, n_estimators=90;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=7.373469387755102, n_estimators=100;, score=0.165 total time=   0.2s
[CV 2/5] END learning_rate=7.373469387755102, n_estimators=100;, score=0.745 total time=   0.2s
[CV 3/5] END learning_rate=7.373469387755102, n_estimators=100;, score=0.149 total time=   0.1s
[CV 4/5] END learning_rate=7.373469387755102, n_estimators=100;, score=0.166 total time=   0.2s
[CV 5/5] END learning_rate=7.373469387755102, n_estimators=100;, score=0.289 total time=   0.2s
[CV 1/5] END learning_rate=7.575510204081633, n_estimators=10;, score=0.165 total time=   0.0s
[CV 2/5] END learning_rate=7.575510204081633, n_estimators=10;, score=0.745 total time=   0.0s
[CV 3/5] END learning_rate=7.575510204081633, n_estimators=10;, score=0.153 total time=   0.0s
[CV 4/5] END learning_rate=7.575510204081633,

[CV 2/5] END learning_rate=7.777551020408163, n_estimators=70;, score=0.745 total time=   0.1s
[CV 3/5] END learning_rate=7.777551020408163, n_estimators=70;, score=0.149 total time=   0.1s
[CV 4/5] END learning_rate=7.777551020408163, n_estimators=70;, score=0.170 total time=   0.1s
[CV 5/5] END learning_rate=7.777551020408163, n_estimators=70;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=7.777551020408163, n_estimators=80;, score=0.165 total time=   0.1s
[CV 2/5] END learning_rate=7.777551020408163, n_estimators=80;, score=0.745 total time=   0.1s
[CV 3/5] END learning_rate=7.777551020408163, n_estimators=80;, score=0.149 total time=   0.1s
[CV 4/5] END learning_rate=7.777551020408163, n_estimators=80;, score=0.170 total time=   0.1s
[CV 5/5] END learning_rate=7.777551020408163, n_estimators=80;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=7.777551020408163, n_estimators=90;, score=0.165 total time=   0.1s
[CV 2/5] END learning_rate=7.777551020408163, n_es

[CV 5/5] END learning_rate=8.181632653061225, n_estimators=40;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=8.181632653061225, n_estimators=50;, score=0.169 total time=   0.0s
[CV 2/5] END learning_rate=8.181632653061225, n_estimators=50;, score=0.745 total time=   0.0s
[CV 3/5] END learning_rate=8.181632653061225, n_estimators=50;, score=0.149 total time=   0.0s
[CV 4/5] END learning_rate=8.181632653061225, n_estimators=50;, score=0.170 total time=   0.0s
[CV 5/5] END learning_rate=8.181632653061225, n_estimators=50;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=8.181632653061225, n_estimators=60;, score=0.169 total time=   0.1s
[CV 2/5] END learning_rate=8.181632653061225, n_estimators=60;, score=0.745 total time=   0.1s
[CV 3/5] END learning_rate=8.181632653061225, n_estimators=60;, score=0.149 total time=   0.1s
[CV 4/5] END learning_rate=8.181632653061225, n_estimators=60;, score=0.170 total time=   0.1s
[CV 5/5] END learning_rate=8.181632653061225, n_es

[CV 1/5] END learning_rate=8.585714285714285, n_estimators=30;, score=0.169 total time=   0.0s
[CV 2/5] END learning_rate=8.585714285714285, n_estimators=30;, score=0.783 total time=   0.0s
[CV 3/5] END learning_rate=8.585714285714285, n_estimators=30;, score=0.268 total time=   0.0s
[CV 4/5] END learning_rate=8.585714285714285, n_estimators=30;, score=0.166 total time=   0.0s
[CV 5/5] END learning_rate=8.585714285714285, n_estimators=30;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=8.585714285714285, n_estimators=40;, score=0.169 total time=   0.0s
[CV 2/5] END learning_rate=8.585714285714285, n_estimators=40;, score=0.783 total time=   0.0s
[CV 3/5] END learning_rate=8.585714285714285, n_estimators=40;, score=0.268 total time=   0.0s
[CV 4/5] END learning_rate=8.585714285714285, n_estimators=40;, score=0.166 total time=   0.0s
[CV 5/5] END learning_rate=8.585714285714285, n_estimators=40;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=8.585714285714285, n_es

[CV 3/5] END learning_rate=8.787755102040816, n_estimators=100;, score=0.268 total time=   0.2s
[CV 4/5] END learning_rate=8.787755102040816, n_estimators=100;, score=0.379 total time=   0.2s
[CV 5/5] END learning_rate=8.787755102040816, n_estimators=100;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=8.989795918367347, n_estimators=10;, score=0.169 total time=   0.0s
[CV 2/5] END learning_rate=8.989795918367347, n_estimators=10;, score=0.783 total time=   0.0s
[CV 3/5] END learning_rate=8.989795918367347, n_estimators=10;, score=0.268 total time=   0.0s
[CV 4/5] END learning_rate=8.989795918367347, n_estimators=10;, score=0.379 total time=   0.0s
[CV 5/5] END learning_rate=8.989795918367347, n_estimators=10;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=8.989795918367347, n_estimators=20;, score=0.169 total time=   0.0s
[CV 2/5] END learning_rate=8.989795918367347, n_estimators=20;, score=0.783 total time=   0.0s
[CV 3/5] END learning_rate=8.989795918367347, n

[CV 1/5] END learning_rate=9.191836734693878, n_estimators=80;, score=0.305 total time=   0.1s
[CV 2/5] END learning_rate=9.191836734693878, n_estimators=80;, score=0.783 total time=   0.1s
[CV 3/5] END learning_rate=9.191836734693878, n_estimators=80;, score=0.268 total time=   0.1s
[CV 4/5] END learning_rate=9.191836734693878, n_estimators=80;, score=0.426 total time=   0.1s
[CV 5/5] END learning_rate=9.191836734693878, n_estimators=80;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=9.191836734693878, n_estimators=90;, score=0.305 total time=   0.1s
[CV 2/5] END learning_rate=9.191836734693878, n_estimators=90;, score=0.783 total time=   0.1s
[CV 3/5] END learning_rate=9.191836734693878, n_estimators=90;, score=0.268 total time=   0.1s
[CV 4/5] END learning_rate=9.191836734693878, n_estimators=90;, score=0.426 total time=   0.1s
[CV 5/5] END learning_rate=9.191836734693878, n_estimators=90;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=9.191836734693878, n_es

[CV 4/5] END learning_rate=9.595918367346938, n_estimators=50;, score=0.391 total time=   0.0s
[CV 5/5] END learning_rate=9.595918367346938, n_estimators=50;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=9.595918367346938, n_estimators=60;, score=0.288 total time=   0.1s
[CV 2/5] END learning_rate=9.595918367346938, n_estimators=60;, score=0.783 total time=   0.1s
[CV 3/5] END learning_rate=9.595918367346938, n_estimators=60;, score=0.268 total time=   0.1s
[CV 4/5] END learning_rate=9.595918367346938, n_estimators=60;, score=0.391 total time=   0.1s
[CV 5/5] END learning_rate=9.595918367346938, n_estimators=60;, score=0.289 total time=   0.1s
[CV 1/5] END learning_rate=9.595918367346938, n_estimators=70;, score=0.288 total time=   0.1s
[CV 2/5] END learning_rate=9.595918367346938, n_estimators=70;, score=0.783 total time=   0.1s
[CV 3/5] END learning_rate=9.595918367346938, n_estimators=70;, score=0.268 total time=   0.1s
[CV 4/5] END learning_rate=9.595918367346938, n_es

[CV 4/5] END learning_rate=10.0, n_estimators=30;, score=0.170 total time=   0.0s
[CV 5/5] END learning_rate=10.0, n_estimators=30;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=10.0, n_estimators=40;, score=0.288 total time=   0.0s
[CV 2/5] END learning_rate=10.0, n_estimators=40;, score=0.783 total time=   0.0s
[CV 3/5] END learning_rate=10.0, n_estimators=40;, score=0.268 total time=   0.0s
[CV 4/5] END learning_rate=10.0, n_estimators=40;, score=0.170 total time=   0.0s
[CV 5/5] END learning_rate=10.0, n_estimators=40;, score=0.289 total time=   0.0s
[CV 1/5] END learning_rate=10.0, n_estimators=50;, score=0.288 total time=   0.0s
[CV 2/5] END learning_rate=10.0, n_estimators=50;, score=0.783 total time=   0.0s
[CV 3/5] END learning_rate=10.0, n_estimators=50;, score=0.268 total time=   0.0s
[CV 4/5] END learning_rate=10.0, n_estimators=50;, score=0.170 total time=   0.0s
[CV 5/5] END learning_rate=10.0, n_estimators=50;, score=0.289 total time=   0.0s
[CV 1/5] END lea

GridSearchCV(cv=5, estimator=GradientBoostingClassifier(),
             param_grid={'learning_rate': array([ 0.1       ,  0.30204082,  0.50408163,  0.70612245,  0.90816327,
        1.11020408,  1.3122449 ,  1.51428571,  1.71632653,  1.91836735,
        2.12040816,  2.32244898,  2.5244898 ,  2.72653061,  2.92857143,
        3.13061224,  3.33265306,  3.53469388,  3.73673469,  3.93877551,
        4.14081633,  4.34285714,  4.54489796,  4.74693878,  4.94897959,
        5.15102041,  5.35306122,  5.55510204,  5.75714286,  5.95918367,
        6.16122449,  6.36326531,  6.56530612,  6.76734694,  6.96938776,
        7.17142857,  7.37346939,  7.5755102 ,  7.77755102,  7.97959184,
        8.18163265,  8.38367347,  8.58571429,  8.7877551 ,  8.98979592,
        9.19183673,  9.39387755,  9.59591837,  9.79795918, 10.        ]),
                         'n_estimators': [10, 20, 30, 40, 50, 60, 70, 80, 90,
                                          100]},
             verbose=3)

In [66]:
print(grid.best_params_)

{'learning_rate': 0.1, 'n_estimators': 100}


# With new parameters

In [67]:
log_clf = LogisticRegression(C= 7.63157894736842, penalty = 'l1', solver='liblinear')
rnd_clf = RandomForestClassifier(max_depth= 15, n_estimators= 50)
svm_clf = SVC(C= 8.957894736842105, gamma= 0.1, kernel= 'rbf', probability = True)
gb_clf = GradientBoostingClassifier(learning_rate= 0.1, n_estimators= 100)
voting_clf = VotingClassifier(estimators=[('lr', log_clf), ('rf', rnd_clf), ('svc', svm_clf),('gb',gb_clf)],voting='soft')
voting_clf.fit(X_train, y_train)

VotingClassifier(estimators=[('lr',
                              LogisticRegression(C=7.63157894736842,
                                                 penalty='l1',
                                                 solver='liblinear')),
                             ('rf',
                              RandomForestClassifier(max_depth=15,
                                                     n_estimators=50)),
                             ('svc',
                              SVC(C=8.957894736842105, gamma=0.1,
                                  probability=True)),
                             ('gb', GradientBoostingClassifier())],
                 voting='soft')

In [69]:
for clf in (log_clf, rnd_clf, svm_clf, gb_clf, voting_clf):
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    print(clf.__class__.__name__, accuracy_score(y_test, y_pred))

LogisticRegression 0.8605442176870748
RandomForestClassifier 0.8333333333333334
SVC 0.8605442176870748
GradientBoostingClassifier 0.8741496598639455
VotingClassifier 0.8639455782312925


# Bagging

In [12]:
from sklearn.ensemble import BaggingClassifier
from sklearn.tree import DecisionTreeClassifier

In [13]:
bag_clf = BaggingClassifier(DecisionTreeClassifier(), n_estimators=500,max_samples=500, bootstrap=True, n_jobs=-1)
bag_clf.fit(X_train, y_train)
y_pred = bag_clf.predict(X_test)
accuracy_score(y_test, y_pred)

0.8367346938775511

In [14]:
bag_clf = BaggingClassifier(DecisionTreeClassifier(), n_estimators=500,max_samples=500,bootstrap=True, oob_score=True, n_jobs=-1)

bag_clf.fit(X_train, y_train)

y_pred = bag_clf.predict(X_test)

accuracy_score(y_test, y_pred)

0.8401360544217688

In [15]:
bag_clf.oob_score_

0.8605442176870748

In [16]:
bag_clf = BaggingClassifier(DecisionTreeClassifier(), n_estimators=500,max_samples=500,bootstrap=False, n_jobs=-1)

bag_clf.fit(X_train, y_train)

y_pred = bag_clf.predict(X_test)

accuracy_score(y_test, y_pred)

0.8469387755102041

# Boosting

In [17]:
from sklearn.ensemble import AdaBoostClassifier
ada_clf = AdaBoostClassifier(DecisionTreeClassifier(max_depth=1), n_estimators=200, learning_rate=0.5)
ada_clf.fit(X_train, y_train)
y_pred = ada_clf.predict(X_test)
accuracy_score(y_test, y_pred)

0.8775510204081632