In [None]:
# Make Google Drive visible to this Colab runtime; the data paths used further
# down point inside this mount.
from google.colab import drive

DRIVE_MOUNT_POINT = '/content/drive'
drive.mount(DRIVE_MOUNT_POINT)

Mounted at /content/drive


In [None]:
import pandas as pd
import numpy as np
from scipy import sparse

from sklearn.pipeline import Pipeline
from sklearn.preprocessing import MinMaxScaler
from sklearn.metrics import classification_report
from sklearn.model_selection import GridSearchCV
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier
from sklearn.linear_model import LogisticRegression, SGDClassifier
from sklearn.svm import LinearSVC

In [None]:
def get_data(path,sc=None,rem_extra=0,sparse=True,train=1):
    """Read an encoded-question CSV and split it into features and integer labels.

    Parameters
    ----------
    path : str or path-like
        CSV file passed to ``pd.read_csv``. It must contain a ``Y`` column and,
        unless ``rem_extra == 1`` drops them anyway, the five extra columns
        listed in ``extra_cols`` below.
    sc : scaler or None
        Already-fitted scaler, used only when ``rem_extra != 1`` and
        ``train != 1``. When ``train == 1`` it is replaced by a new scaler.
    rem_extra : int
        ``1`` removes the extra columns; any other value keeps and scales them.
    sparse : bool
        Unused. Kept so existing calls keep working. Note that inside this
        function the name hides the ``scipy.sparse`` module imported at the
        top of the notebook.
    train : int
        ``1`` fits a fresh ``MinMaxScaler`` on the extra columns; any other
        value transforms them with ``sc``.

    Returns
    -------
    tuple
        ``(features, labels, scaler)``: the DataFrame without ``Y``, the ``Y``
        Series with the known class names replaced by integers, and the scaler
        that was fitted or passed in (``None`` if none was involved).

    Raises
    ------
    AssertionError
        If the extra columns must be transformed (``rem_extra != 1`` and
        ``train != 1``) but no scaler was supplied.
    """
    extra_cols = ['Code_blocks','Body_size','Extra_tags','Code_Lines','Num_Tags']
    label_codes = {'HQ':2, 'LQ_EDIT':1, 'LQ_CLOSE':0}

    d = pd.read_csv(path)
    # 'Unnamed: 0' is the index column left behind by DataFrame.to_csv(); tolerate
    # files written without it instead of failing with a KeyError.
    d = d.drop(columns='Unnamed: 0', errors='ignore')

    if rem_extra == 1:
        d = d.drop(columns=extra_cols)
    elif train == 1:
        # Fit the scaler on this (training) file only.
        sc = MinMaxScaler()
        d[extra_cols] = sc.fit_transform(d[extra_cols])
    else:
        # Identity check: `!= None` would dispatch to the object's own comparison.
        assert sc is not None, "a fitted scaler must be passed via `sc` when train != 1"
        d[extra_cols] = sc.transform(d[extra_cols])

    # Values that are not keys of label_codes are left unchanged by replace().
    y = d['Y'].replace(label_codes)
    d = d.drop(columns='Y')
    return d,y,sc

# Loading data

Data without the extra columns (body size, number of tags, etc.).

In [None]:
# CSV files on the mounted Drive holding the encoded train and test sets.
path_train = '/content/drive/MyDrive/EE769Project/glove_sent_encoding_Traindata_10Sent.csv'
path_test = '/content/drive/MyDrive/EE769Project/glove_sent_encoding_Testdata_10Sent.csv'

# rem_extra=1 removes the extra columns, so get_data fits no scaler here and
# sc_train is simply handed through both calls.
d_train, y_train, sc_train = get_data(path_train, rem_extra=1)
d_test, y_test, sc_train = get_data(path_test, sc=sc_train, rem_extra=1, train=0)

# Shapes of the feature tables first, then of the label vectors.
for split in (d_train, d_test, y_train, y_test):
    print(split.shape)

(45000, 3300)
(15000, 3300)
(45000,)
(15000,)


# Model building and testing

In [None]:
# Fixed seed so that the estimators that use randomness give the same result
# on every Restart & Run All.
RANDOM_STATE = 42

# Unfitted candidate classifiers, looked up by name when a grid search is run.
clf_dict = {
    'LogisticRegression': LogisticRegression(random_state=RANDOM_STATE),
    'SGDClassifier': SGDClassifier(random_state=RANDOM_STATE),
    'LinearSVC': LinearSVC(random_state=RANDOM_STATE),
    'RandomForestClassifier': RandomForestClassifier(random_state=RANDOM_STATE),
    'GradientBoostingClassifier': GradientBoostingClassifier(random_state=RANDOM_STATE),
}

def do_gridSearch(clf,d_train,y_train,d_test,y_test,hyperparams,
                  scoring='f1_weighted',cv=5,n_jobs=None,verbose=3):
    """Tune `clf` with a cross-validated grid search and print train/test reports.

    Parameters
    ----------
    clf : estimator
        Unfitted estimator handed to ``GridSearchCV``.
    d_train, y_train : array-like
        Training features and labels; labels are passed through ``np.squeeze``.
    d_test, y_test : array-like
        Held-out features and labels, used only for the final report.
    hyperparams : dict or list of dict
        ``param_grid`` for ``GridSearchCV``.
    scoring : str, default 'f1_weighted'
        Metric used for model selection and named in the printed summary.
    cv : int, default 5
        Cross-validation setting forwarded to ``GridSearchCV``.
    n_jobs : int or None, default None
        Parallelism forwarded to ``GridSearchCV``.
    verbose : int, default 3
        Log level forwarded to ``GridSearchCV``.

    Returns
    -------
    GridSearchCV
        The fitted search object.
    """
    # verbose must be an integer: the previous value 2.1 relied on a float being
    # accepted, which releases of scikit-learn that validate constructor
    # parameters reject. 3 keeps the per-fold score in the log.
    opt = GridSearchCV(clf, param_grid=hyperparams, cv=cv, scoring=scoring,
                       n_jobs=n_jobs, verbose=verbose)

    y_train_1d = np.squeeze(y_train)
    y_test_1d = np.squeeze(y_test)

    opt.fit(d_train, y_train_1d)
    print('Best parameters:')
    print(opt.best_params_)
    print('Best ' + scoring + ': ' + str(opt.best_score_))

    # opt.predict uses the estimator refitted with the best parameters.
    print('Train classification report:')
    print(classification_report(y_train_1d, opt.predict(d_train)))
    print('Test classification report:')
    print(classification_report(y_test_1d, opt.predict(d_test)))
    return opt

In [None]:
# Re-store both feature tables as SciPy CSR matrices under the same names.
d_train, d_test = (sparse.csr_matrix(features) for features in (d_train, d_test))

## Logistic Regression

In [None]:
# Fitted grid searches for this feature set, keyed by classifier name.
result_10_rem = {}
m = 'LogisticRegression'
# 'multi_class' is no longer part of the grid: 'auto' is already the default and
# the parameter is deprecated since scikit-learn 1.5, so listing it only adds a
# FutureWarning to every fit.
# NOTE(review): max_iter is tuned like a hyperparameter; the recorded run log
# shows the solver hitting the iteration limit for many of these candidates.
# Consider scaling the features or fixing one sufficiently large max_iter.
param_grid = {'C':[0.01,0.1,1.0,10.0,100.0],'max_iter':[50,150,300,600]}
p = clf_dict[m]
result_10_rem[m] = do_gridSearch(p,d_train,y_train,d_test,y_test,param_grid)

Fitting 5 folds for each of 20 candidates, totalling 100 fits
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:   31.8s remaining:    0.0s


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.629, total=  31.8s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:  1.0min remaining:    0.0s


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.646, total=  30.7s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.635, total=  31.2s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.643, total=  32.2s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.629, total=  30.0s
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.629, total= 1.1min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.646, total= 1.3min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.636, total= 1.4min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.643, total= 1.2min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.631, total= 1.3min
[CV] C=0.01, max_iter=300, multi_class=auto ..........................
[CV]  C=0.01, max_iter=300, multi_class=auto, score=0.629, total= 1.1min
[CV] C=0.01, max_iter=300, multi_class=auto ....................

STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.623, total=  31.1s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.645, total=  30.6s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.638, total=  31.2s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.636, total=  31.1s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.630, total=  31.1s
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.628, total= 1.5min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.647, total= 1.5min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.637, total= 1.5min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.638, total= 1.5min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.634, total= 1.5min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.627, total= 3.0min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.646, total= 3.1min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.637, total= 3.1min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.639, total= 3.0min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.633, total= 3.0min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.627, total= 3.4min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.646, total= 3.4min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.637, total= 3.2min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.639, total= 3.2min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.633, total= 3.2min
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.622, total=  31.6s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.643, total=  31.1s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.634, total=  31.7s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.634, total=  29.4s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.624, total=  29.9s
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.625, total= 1.5min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.641, total= 1.5min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.631, total= 1.5min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.635, total= 1.5min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.630, total= 1.5min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.624, total= 3.0min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.639, total= 2.9min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.633, total= 3.0min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.636, total= 3.0min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.631, total= 3.0min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.625, total= 5.9min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.641, total= 6.0min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.632, total= 6.0min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.635, total= 6.0min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.631, total= 6.0min
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.623, total=  31.6s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.642, total=  31.1s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.631, total=  31.1s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.629, total=  29.4s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.624, total=  30.4s
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.621, total= 1.5min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.637, total= 1.5min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.628, total= 1.5min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.633, total= 1.5min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.629, total= 1.5min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.621, total= 3.0min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.635, total= 3.0min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.629, total= 3.0min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.630, total= 3.0min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.626, total= 3.0min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.615, total= 5.9min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.633, total= 5.9min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.623, total= 6.0min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.626, total= 6.0min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.622, total= 5.9min
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.619, total=  32.1s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.642, total=  31.0s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.633, total=  30.0s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.634, total=  29.4s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.623, total=  29.9s
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.623, total= 1.5min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.635, total= 1.5min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.628, total= 1.5min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.632, total= 1.5min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.629, total= 1.5min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.620, total= 3.0min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.630, total= 3.0min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.630, total= 3.0min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.629, total= 3.0min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.625, total= 3.0min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.614, total= 6.0min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.633, total= 6.0min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.621, total= 6.0min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.624, total= 6.0min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
[Parallel(n_jobs=1)]: Done 100 out of 100 | elapsed: 227.9min finished


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.620, total= 6.0min
Best parameters:
{'C': 0.01, 'max_iter': 150, 'multi_class': 'auto'}
Bestf1_weighted:0.6368528123927485
Train classification report:
              precision    recall  f1-score   support

           0       0.61      0.61      0.61     15000
           1       0.69      0.64      0.66     15000
           2       0.71      0.76      0.74     15000

    accuracy                           0.67     45000
   macro avg       0.67      0.67      0.67     45000
weighted avg       0.67      0.67      0.67     45000

Test classification report:
              precision    recall  f1-score   support

           0       0.58      0.58      0.58      5000
           1       0.67      0.61      0.64      5000
           2       0.69      0.75      0.72      5000

    accuracy                           0.65     15000
   macro avg       0.65      0.65      0.65     15000
weighted avg       0.65      0.65      0.65     15000



## Linear SVC

In [None]:
# Grid-search the regularisation strength C of LinearSVC on the current
# train/test split and collect the outcome in `result_10_rem`, keyed by the
# model name.
result_10_rem = dict()
m = 'LinearSVC'
# `params` and `param_grid` are two names for the same grid object.
params = dict(C=[0.01, 0.1, 1.0, 10.0, 100.0])
param_grid = params
p = clf_dict[m]
result_10_rem[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 5 candidates, totalling 25 fits
[CV] C=0.01 ..........................................................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.


[CV] .............................. C=0.01, score=0.629, total=  20.8s
[CV] C=0.01 ..........................................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:   20.8s remaining:    0.0s


[CV] .............................. C=0.01, score=0.649, total=  20.2s
[CV] C=0.01 ..........................................................


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:   41.0s remaining:    0.0s


[CV] .............................. C=0.01, score=0.636, total=  19.4s
[CV] C=0.01 ..........................................................
[CV] .............................. C=0.01, score=0.639, total=  20.3s
[CV] C=0.01 ..........................................................
[CV] .............................. C=0.01, score=0.630, total=  20.0s
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.627, total= 2.3min
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.642, total= 2.3min
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.635, total= 2.7min
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.637, total= 2.3min
[CV] C=0.1 ...........................................................
[CV] .



[CV] ............................... C=1.0, score=0.621, total= 6.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.635, total= 6.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.628, total= 6.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.634, total= 6.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.627, total= 6.5min
[CV] C=10.0 ..........................................................
[CV] .............................. C=10.0, score=0.588, total= 7.1min
[CV] C=10.0 ..........................................................
[CV] .............................. C=10.0, score=0.613, total= 7.2min
[CV] C=10.0 ..........................................................
[CV] .

[Parallel(n_jobs=1)]: Done  25 out of  25 | elapsed: 118.3min finished


Best parameters:
{'C': 0.01}
Bestf1_weighted:0.6365623385952945
Train classification report:
              precision    recall  f1-score   support

           0       0.63      0.62      0.62     15000
           1       0.71      0.65      0.68     15000
           2       0.72      0.79      0.75     15000

    accuracy                           0.69     45000
   macro avg       0.69      0.69      0.68     45000
weighted avg       0.69      0.69      0.68     45000

Test classification report:
              precision    recall  f1-score   support

           0       0.58      0.58      0.58      5000
           1       0.67      0.61      0.64      5000
           2       0.69      0.76      0.72      5000

    accuracy                           0.65     15000
   macro avg       0.65      0.65      0.65     15000
weighted avg       0.65      0.65      0.65     15000



## SGD Classifier

In [None]:
# Grid-search SGDClassifier with hinge loss and an elastic-net penalty,
# varying the regularisation strength `alpha` and the L1/L2 mix `l1_ratio`.
# The outcome is stored in `result_10_rem` under the model name.
m = 'SGDClassifier'
param_grid = dict(
    loss=['hinge'],
    alpha=[0.0001, 0.001, 0.01],
    penalty=['elasticnet'],
    l1_ratio=[0, 0.2, 0.7, 1.0],
)
p = clf_dict[m]
result_10_rem[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 12 candidates, totalling 60 fits
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.


[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.624, total= 1.3min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:  1.3min remaining:    0.0s


[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.627, total= 1.4min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:  2.7min remaining:    0.0s


[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.623, total= 1.4min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........
[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.629, total= 1.3min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........
[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.610, total= 1.1min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet, score=0.626, total= 1.5min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet, score=0.637, total= 1.6min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet, score=0.634, total= 1.8min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1

[Parallel(n_jobs=1)]: Done  60 out of  60 | elapsed: 43.5min finished


Best parameters:
{'alpha': 0.001, 'l1_ratio': 0, 'loss': 'hinge', 'penalty': 'elasticnet'}
Bestf1_weighted:0.6353769174431572
Train classification report:
              precision    recall  f1-score   support

           0       0.66      0.51      0.58     15000
           1       0.67      0.70      0.68     15000
           2       0.69      0.81      0.75     15000

    accuracy                           0.68     45000
   macro avg       0.67      0.68      0.67     45000
weighted avg       0.67      0.68      0.67     45000

Test classification report:
              precision    recall  f1-score   support

           0       0.62      0.48      0.54      5000
           1       0.64      0.66      0.65      5000
           2       0.67      0.79      0.72      5000

    accuracy                           0.65     15000
   macro avg       0.64      0.65      0.64     15000
weighted avg       0.64      0.65      0.64     15000



## Random forest classifier

In [None]:
# Grid-search RandomForestClassifier over the number of trees and the maximum
# tree depth; the outcome is stored in `result_10_rem` under the model name.
m = 'RandomForestClassifier'
param_grid = dict(
    n_estimators=[50, 200, 600],
    max_depth=[10, 15, 20],
)
p = clf_dict[m]
result_10_rem[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 9 candidates, totalling 45 fits
[CV] max_depth=10, n_estimators=50 ...................................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.


[CV] ....... max_depth=10, n_estimators=50, score=0.548, total= 1.7min
[CV] max_depth=10, n_estimators=50 ...................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:  1.7min remaining:    0.0s


[CV] ....... max_depth=10, n_estimators=50, score=0.560, total= 1.6min
[CV] max_depth=10, n_estimators=50 ...................................


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:  3.3min remaining:    0.0s


[CV] ....... max_depth=10, n_estimators=50, score=0.554, total= 1.6min
[CV] max_depth=10, n_estimators=50 ...................................
[CV] ....... max_depth=10, n_estimators=50, score=0.554, total= 1.6min
[CV] max_depth=10, n_estimators=50 ...................................
[CV] ....... max_depth=10, n_estimators=50, score=0.547, total= 1.6min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.561, total= 6.5min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.563, total= 6.5min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.565, total= 6.5min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.567, total= 6.5min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] .

KeyboardInterrupt: ignored

The search was stopped manually (hence the `KeyboardInterrupt` above) because training took too long (~20 minutes) with `n_estimators = 600`. The scores were also poor (< 0.6).

# Loading data

Data with the extra columns (body size, number of tags, etc.) included.

In [None]:
# Reload the train/test CSVs, this time keeping the extra columns
# (rem_extra=0). The scaler returned by the training call is handed to the
# test call (train=0) and rebound from that call's return value.
path_train = '/content/drive/MyDrive/EE769Project/glove_sent_encoding_Traindata_10Sent.csv'
path_test = '/content/drive/MyDrive/EE769Project/glove_sent_encoding_Testdata_10Sent.csv'
d_train, y_train, sc_train = get_data(path_train, rem_extra=0)
d_test, y_test, sc_train = get_data(path_test, sc=sc_train, rem_extra=0, train=0)

# Sanity check: print the shape of each feature matrix and label vector,
# one per line.
print(*(part.shape for part in (d_train, d_test, y_train, y_test)), sep='\n')

(45000, 3305)
(15000, 3305)
(45000,)
(15000,)


In [None]:
# Replace both feature tables with SciPy CSR matrices before model fitting.
d_train, d_test = (sparse.csr_matrix(frame) for frame in (d_train, d_test))

## Logistic Regression

In [None]:
# Grid-search LogisticRegression on the data that includes the extra columns.
# Results for this feature set are collected in `result_10`, keyed by model
# name. They are kept separate from `result_10_rem` (the runs without the
# extra columns) so this run does not overwrite an entry stored there.
result_10 = {}
m = 'LogisticRegression'
param_grid = {
    'C': [0.01, 0.1, 1.0, 10.0, 100.0],
    'max_iter': [50, 150, 300, 600],
    'multi_class': ['auto'],
}
p = clf_dict[m]
# Fix: store into `result_10`, the dict initialised above. The original wrote
# to `result_10_rem[m]`, leaving `result_10` empty.
result_10[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 20 candidates, totalling 100 fits
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:   27.6s remaining:    0.0s


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.641, total=  27.6s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:   56.0s remaining:    0.0s


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.656, total=  28.4s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.649, total=  28.0s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.657, total=  29.4s
[CV] C=0.01, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.01, max_iter=50, multi_class=auto, score=0.642, total=  28.9s
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.643, total= 1.0min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.657, total= 1.1min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.649, total= 1.2min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.657, total= 1.1min
[CV] C=0.01, max_iter=150, multi_class=auto ..........................
[CV]  C=0.01, max_iter=150, multi_class=auto, score=0.642, total= 1.2min
[CV] C=0.01, max_iter=300, multi_class=auto ..........................
[CV]  C=0.01, max_iter=300, multi_class=auto, score=0.643, total= 1.0min
[CV] C=0.01, max_iter=300, multi_class=auto ....................

STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.647, total=  27.0s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.666, total=  29.4s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.655, total=  28.4s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.660, total=  28.9s
[CV] C=0.1, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=50, multi_class=auto, score=0.650, total=  28.4s
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.672, total= 1.4min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.688, total= 1.4min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.678, total= 1.4min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.680, total= 1.4min
[CV] C=0.1, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=150, multi_class=auto, score=0.678, total= 1.4min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.673, total= 2.8min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.689, total= 2.8min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.679, total= 2.8min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.682, total= 2.8min
[CV] C=0.1, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=0.1, max_iter=300, multi_class=auto, score=0.678, total= 2.8min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.673, total= 3.2min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.688, total= 3.2min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.679, total= 3.1min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.682, total= 3.3min
[CV] C=0.1, max_iter=600, multi_class=auto ...........................
[CV]  C=0.1, max_iter=600, multi_class=auto, score=0.678, total= 3.0min
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.644, total=  28.4s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.660, total=  28.4s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.655, total=  28.5s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.661, total=  29.9s
[CV] C=1.0, max_iter=50, multi_class=auto ............................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=50, multi_class=auto, score=0.649, total=  28.3s
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.697, total= 1.4min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.707, total= 1.4min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.699, total= 1.4min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.703, total= 1.4min
[CV] C=1.0, max_iter=150, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=150, multi_class=auto, score=0.704, total= 1.4min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.703, total= 2.8min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.716, total= 2.8min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.712, total= 2.8min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.713, total= 2.8min
[CV] C=1.0, max_iter=300, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=300, multi_class=auto, score=0.708, total= 2.8min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.704, total= 5.6min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.716, total= 5.6min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.712, total= 5.7min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.713, total= 5.6min
[CV] C=1.0, max_iter=600, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=1.0, max_iter=600, multi_class=auto, score=0.708, total= 5.5min
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.644, total=  28.0s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.660, total=  28.0s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.655, total=  28.6s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.659, total=  29.0s
[CV] C=10.0, max_iter=50, multi_class=auto ...........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=50, multi_class=auto, score=0.647, total=  28.0s
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.705, total= 1.4min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.706, total= 1.4min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.699, total= 1.4min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.706, total= 1.4min
[CV] C=10.0, max_iter=150, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=150, multi_class=auto, score=0.705, total= 1.4min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.712, total= 2.8min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.722, total= 2.8min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.713, total= 2.8min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.717, total= 2.8min
[CV] C=10.0, max_iter=300, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=300, multi_class=auto, score=0.716, total= 2.8min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.711, total= 5.6min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.723, total= 5.6min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.715, total= 5.6min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.721, total= 5.5min
[CV] C=10.0, max_iter=600, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=10.0, max_iter=600, multi_class=auto, score=0.720, total= 5.6min
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.643, total=  28.5s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.659, total=  27.9s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.655, total=  28.5s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.658, total=  28.4s
[CV] C=100.0, max_iter=50, multi_class=auto ..........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=50, multi_class=auto, score=0.650, total=  27.9s
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.702, total= 1.4min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.705, total= 1.4min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.698, total= 1.4min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.709, total= 1.4min
[CV] C=100.0, max_iter=150, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=150, multi_class=auto, score=0.708, total= 1.4min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.709, total= 2.8min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.718, total= 2.8min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.713, total= 2.8min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.718, total= 2.8min
[CV] C=100.0, max_iter=300, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=300, multi_class=auto, score=0.715, total= 2.7min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.707, total= 5.5min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.720, total= 5.5min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.714, total= 5.6min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.720, total= 5.6min
[CV] C=100.0, max_iter=600, multi_class=auto .........................


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
[Parallel(n_jobs=1)]: Done 100 out of 100 | elapsed: 212.1min finished


[CV]  C=100.0, max_iter=600, multi_class=auto, score=0.719, total= 5.5min


STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression


Best parameters:
{'C': 10.0, 'max_iter': 600, 'multi_class': 'auto'}
Bestf1_weighted:0.7178341071364939
Train classification report:
              precision    recall  f1-score   support

           0       0.76      0.70      0.73     15000
           1       0.81      0.89      0.85     15000
           2       0.82      0.81      0.82     15000

    accuracy                           0.80     45000
   macro avg       0.80      0.80      0.80     45000
weighted avg       0.80      0.80      0.80     45000

Test classification report:
              precision    recall  f1-score   support

           0       0.67      0.62      0.65      5000
           1       0.76      0.83      0.79      5000
           2       0.75      0.73      0.74      5000

    accuracy                           0.73     15000
   macro avg       0.73      0.73      0.73     15000
weighted avg       0.73      0.73      0.73     15000



NameError: ignored

## Linear SVC

In [None]:
# Grid-search LinearSVC over the regularisation strength C and store whatever
# do_gridSearch returns under the model's name in `result_10_rem`.
m = 'LinearSVC'
# `params` is a second name bound to the same dict; nothing in this cell reads
# it, but the binding is kept in case another cell does.
param_grid = params = {'C': [0.01, 0.1, 1.0, 10.0, 100.0]}
p = clf_dict[m]

# In `result_10_rem[m] = do_gridSearch(...)` Python evaluates the right-hand
# side first, so a missing `result_10_rem` only raises NameError *after* the
# whole search has run and its result is lost.
# NOTE(review): the recorded run of this cell ended in a NameError after the
# reports were printed; presumably this container was never created - confirm
# (the error could also originate inside do_gridSearch).
try:
    result_10_rem
except NameError:
    result_10_rem = {}

result_10_rem[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 5 candidates, totalling 25 fits
[CV] C=0.01 ..........................................................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.


[CV] .............................. C=0.01, score=0.666, total=  21.3s
[CV] C=0.01 ..........................................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:   21.3s remaining:    0.0s


[CV] .............................. C=0.01, score=0.683, total=  18.8s
[CV] C=0.01 ..........................................................


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:   40.1s remaining:    0.0s


[CV] .............................. C=0.01, score=0.671, total=  18.9s
[CV] C=0.01 ..........................................................
[CV] .............................. C=0.01, score=0.675, total=  18.9s
[CV] C=0.01 ..........................................................
[CV] .............................. C=0.01, score=0.664, total=  18.5s
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.696, total= 2.0min
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.708, total= 2.1min
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.700, total= 2.1min
[CV] C=0.1 ...........................................................
[CV] ............................... C=0.1, score=0.697, total= 2.2min
[CV] C=0.1 ...........................................................
[CV] .



[CV] ............................... C=1.0, score=0.707, total= 5.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.718, total= 5.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.713, total= 5.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.713, total= 5.5min
[CV] C=1.0 ...........................................................
[CV] ............................... C=1.0, score=0.715, total= 5.5min
[CV] C=10.0 ..........................................................
[CV] .............................. C=10.0, score=0.694, total= 6.1min
[CV] C=10.0 ..........................................................
[CV] .............................. C=10.0, score=0.699, total= 6.2min
[CV] C=10.0 ..........................................................
[CV] .

[Parallel(n_jobs=1)]: Done  25 out of  25 | elapsed: 103.1min finished


Best parameters:
{'C': 1.0}
Bestf1_weighted:0.7130630512915516
Train classification report:
              precision    recall  f1-score   support

           0       0.75      0.67      0.71     15000
           1       0.81      0.87      0.84     15000
           2       0.80      0.83      0.82     15000

    accuracy                           0.79     45000
   macro avg       0.79      0.79      0.79     45000
weighted avg       0.79      0.79      0.79     45000

Test classification report:
              precision    recall  f1-score   support

           0       0.67      0.60      0.63      5000
           1       0.76      0.81      0.79      5000
           2       0.74      0.76      0.75      5000

    accuracy                           0.73     15000
   macro avg       0.72      0.72      0.72     15000
weighted avg       0.72      0.72      0.72     15000



NameError: ignored

## SGD Classifier

In [None]:
# Grid-search SGDClassifier (hinge loss, elastic-net penalty) over alpha and
# l1_ratio, and store whatever do_gridSearch returns under the model's name
# in `result_10_rem`.
m = 'SGDClassifier'
param_grid = {
    'loss': ['hinge'],
    'alpha': [0.0001, 0.001, 0.01],
    'penalty': ['elasticnet'],
    'l1_ratio': [0, 0.2, 0.7, 1.0],
}
p = clf_dict[m]

# In `result_10_rem[m] = do_gridSearch(...)` Python evaluates the right-hand
# side first, so a missing `result_10_rem` only raises NameError *after* the
# whole search has run and its result is lost.
# NOTE(review): the recorded run of this cell ended in a NameError after the
# reports were printed; presumably this container was never created - confirm
# (the error could also originate inside do_gridSearch).
try:
    result_10_rem
except NameError:
    result_10_rem = {}

result_10_rem[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 12 candidates, totalling 60 fits
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.


[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.684, total= 1.2min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:  1.2min remaining:    0.0s


[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.697, total= 1.1min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:  2.3min remaining:    0.0s


[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.684, total= 1.2min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........
[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.687, total= 1.2min
[CV] alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet ........
[CV]  alpha=0.0001, l1_ratio=0, loss=hinge, penalty=elasticnet, score=0.684, total= 1.2min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet, score=0.682, total= 1.5min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet, score=0.678, total= 1.4min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet, score=0.689, total= 1.2min
[CV] alpha=0.0001, l1_ratio=0.2, loss=hinge, penalty=elasticnet ......
[CV]  alpha=0.0001, l1

[Parallel(n_jobs=1)]: Done  60 out of  60 | elapsed: 40.2min finished


Best parameters:
{'alpha': 0.0001, 'l1_ratio': 1.0, 'loss': 'hinge', 'penalty': 'elasticnet'}
Bestf1_weighted:0.7222651132983737
Train classification report:
              precision    recall  f1-score   support

           0       0.81      0.50      0.62     15000
           1       0.76      0.91      0.83     15000
           2       0.73      0.87      0.79     15000

    accuracy                           0.76     45000
   macro avg       0.77      0.76      0.75     45000
weighted avg       0.77      0.76      0.75     45000

Test classification report:
              precision    recall  f1-score   support

           0       0.77      0.48      0.59      5000
           1       0.74      0.89      0.81      5000
           2       0.71      0.83      0.76      5000

    accuracy                           0.73     15000
   macro avg       0.74      0.73      0.72     15000
weighted avg       0.74      0.73      0.72     15000



NameError: ignored

## Random forest classifier

In [None]:
# Grid-search RandomForestClassifier over forest size and tree depth, and
# store whatever do_gridSearch returns under the model's name in
# `result_10_rem`.
m = 'RandomForestClassifier'
param_grid = {
    'n_estimators': [50, 200, 600],
    'max_depth': [10, 15, 20],
}
p = clf_dict[m]

# In `result_10_rem[m] = do_gridSearch(...)` Python evaluates the right-hand
# side first, so a missing `result_10_rem` would only raise NameError *after*
# the whole (long) search has run, losing its result. Create the container up
# front if it does not exist yet.
try:
    result_10_rem
except NameError:
    result_10_rem = {}

result_10_rem[m] = do_gridSearch(p, d_train, y_train, d_test, y_test, param_grid)

Fitting 5 folds for each of 9 candidates, totalling 45 fits
[CV] max_depth=10, n_estimators=50 ...................................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.


[CV] ....... max_depth=10, n_estimators=50, score=0.656, total= 1.6min
[CV] max_depth=10, n_estimators=50 ...................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:  1.6min remaining:    0.0s


[CV] ....... max_depth=10, n_estimators=50, score=0.656, total= 1.6min
[CV] max_depth=10, n_estimators=50 ...................................


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:  3.1min remaining:    0.0s


[CV] ....... max_depth=10, n_estimators=50, score=0.657, total= 1.6min
[CV] max_depth=10, n_estimators=50 ...................................
[CV] ....... max_depth=10, n_estimators=50, score=0.673, total= 1.5min
[CV] max_depth=10, n_estimators=50 ...................................
[CV] ....... max_depth=10, n_estimators=50, score=0.666, total= 1.6min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.663, total= 6.2min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.675, total= 6.1min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.679, total= 6.2min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] ...... max_depth=10, n_estimators=200, score=0.681, total= 6.2min
[CV] max_depth=10, n_estimators=200 ..................................
[CV] .

KeyboardInterrupt: ignored

Stopped training because each fold was taking about 20 minutes.