In [6]:
import pandas as pd
import numpy as np
from sklearn.svm import SVC
from sklearn.preprocessing import StandardScaler,MinMaxScaler
from sklearn.model_selection import GridSearchCV,StratifiedKFold
from sklearn.pipeline import Pipeline

In [3]:
# Load the training split; the first CSV column is used as the row index.
wine_qal_train = pd.read_csv(
    "wine_kaggle_train.csv",
    index_col=0,
)
wine_qal_train.head()

Unnamed: 0_level_0,fixed acidity,volatile acidity,citric acid,residual sugar,chlorides,free sulfur dioxide,total sulfur dioxide,density,pH,sulphates,alcohol,quality
Id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,8.0,0.5,0.39,2.2,0.073,30.0,39.0,0.99572,3.33,0.77,12.1,6
1,9.3,0.3,0.73,2.3,0.092,30.0,67.0,0.99854,3.32,0.67,12.8,6
2,7.1,0.51,0.03,2.1,0.059,3.0,12.0,0.9966,3.52,0.73,11.3,7
3,8.1,0.87,0.22,2.6,0.084,11.0,65.0,0.9973,3.2,0.53,9.8,5
4,8.5,0.36,0.3,2.3,0.079,10.0,45.0,0.99444,3.2,1.36,9.5,6


In [5]:
# Distinct target labels present in the training data.
wine_qal_train["quality"].unique()

array([6, 7, 5, 4, 8, 3], dtype=int64)

In [7]:
# Separate the target column from the feature columns of the training frame.
y_train = wine_qal_train["quality"]
X_train = wine_qal_train.drop(columns="quality")  # Training Dataset

In [9]:
# Load the test split; the first CSV column is used as the row index.
wine_qal_test = pd.read_csv(
    "wine_kaggle_test.csv",
    index_col=0,
)
wine_qal_test.head()

Unnamed: 0_level_0,fixed acidity,volatile acidity,citric acid,residual sugar,chlorides,free sulfur dioxide,total sulfur dioxide,density,pH,sulphates,alcohol
Id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1
2056,7.2,0.51,0.01,2.0,0.077,31.0,54.0,0.99748,3.39,0.59,9.8
2057,7.2,0.755,0.15,2.0,0.102,14.0,35.0,0.99586,3.33,0.68,10.0
2058,8.4,0.46,0.4,2.0,0.065,21.0,50.0,0.99774,3.08,0.65,9.5
2059,8.0,0.47,0.4,1.8,0.056,14.0,25.0,0.9948,3.3,0.65,11.7
2060,6.5,0.34,0.32,2.1,0.044,8.0,94.0,0.99356,3.23,0.48,12.8


In [11]:
# Test Dataset: the test frame is used as-is for the feature matrix
# (X_test is another name for the same object, not a copy).
X_test = wine_qal_test

# 1. Standard scaling + linear-kernel SVM

In [12]:
# Scaler step for the pipeline: standardises each feature.
std_scaler = StandardScaler()

In [13]:
# Linear-kernel SVC. probability=True enables predict_proba, which the
# 'neg_log_loss' scoring used by the grid search relies on.
svm = SVC(
    kernel="linear",
    probability=True,
    random_state=23,
)

In [14]:
# Chain scaler -> classifier so the scaler is re-fitted inside every CV fold.
# Step names ('SCL', 'SVM') are the prefixes used in the parameter grid.
pipe = Pipeline(
    steps=[
        ("SCL", std_scaler),
        ("SVM", svm),
    ]
)

In [15]:
# 5-fold stratified splitter, shuffled with a fixed seed for repeatable folds.
kfold = StratifiedKFold(
    n_splits=5,
    shuffle=True,
    random_state=23,
)

In [16]:
# Candidate values for the SVC regularisation parameter C:
# 10 evenly spaced points from 0.001 to 5 (inclusive).
params = {
    "SVM__C": np.linspace(0.001, 5, 10),
}

In [17]:
# Exhaustive search over the grid, scored by negative log loss on each fold.
gcv = GridSearchCV(
    estimator=pipe,
    param_grid=params,
    cv=kfold,
    scoring="neg_log_loss",
    verbose=3,
)
gcv.fit(X_train, y_train)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
[CV 1/5] END .....................SVM__C=0.001;, score=-1.094 total time=   1.2s
[CV 2/5] END .....................SVM__C=0.001;, score=-1.049 total time=   1.3s
[CV 3/5] END .....................SVM__C=0.001;, score=-1.058 total time=   1.2s
[CV 4/5] END .....................SVM__C=0.001;, score=-1.061 total time=   1.2s
[CV 5/5] END .....................SVM__C=0.001;, score=-1.058 total time=   1.1s
[CV 1/5] END ........SVM__C=0.5564444444444444;, score=-1.102 total time=   1.2s
[CV 2/5] END ........SVM__C=0.5564444444444444;, score=-1.029 total time=   1.2s
[CV 3/5] END ........SVM__C=0.5564444444444444;, score=-1.058 total time=   1.2s
[CV 4/5] END ........SVM__C=0.5564444444444444;, score=-1.053 total time=   1.2s
[CV 5/5] END ........SVM__C=0.5564444444444444;, score=-1.052 total time=   1.2s
[CV 1/5] END ........SVM__C=1.1118888888888887;, score=-1.099 total time=   1.6s
[CV 2/5] END ........SVM__C=1.1118888888888887;,

GridSearchCV(cv=StratifiedKFold(n_splits=5, random_state=23, shuffle=True),
             estimator=Pipeline(steps=[('SCL', StandardScaler()),
                                       ('SVM',
                                        SVC(kernel='linear', probability=True,
                                            random_state=23))]),
             param_grid={'SVM__C': array([1.00000000e-03, 5.56444444e-01, 1.11188889e+00, 1.66733333e+00,
       2.22277778e+00, 2.77822222e+00, 3.33366667e+00, 3.88911111e+00,
       4.44455556e+00, 5.00000000e+00])},
             scoring='neg_log_loss', verbose=3)

In [18]:
# Report the winning grid point and its mean cross-validated score.
print("Best Parameters: ", gcv.best_params_)
print("Best Score: ", gcv.best_score_)

Best Parameters:  {'SVM__C': 2.2227777777777775}
Best Score:  -1.0561656274417708


In [19]:
# Pipeline with the best parameters found by the grid search.
best_model = gcv.best_estimator_

In [20]:
# Class-label predictions for the test features.
y_pred = best_model.predict(X_test)
y_pred

array([5, 5, 5, ..., 5, 5, 5], dtype=int64)

In [21]:
# Build the submission table: test-set index as 'Id' next to the predicted label.
submission = pd.DataFrame(
    {
        "Id": wine_qal_test.index,
        "quality": y_pred,
    }
)
submission.head()

Unnamed: 0,Id,quality
0,2056,5
1,2057,5
2,2058,5
3,2059,6
4,2060,6


In [22]:
# Write the submission file without the DataFrame's positional index.
submission.to_csv(
    "win_qual_std_Scl_svm_linear.csv",
    index=False,
)

In [23]:
# Leaderboard Score
# Score: 0.39382
# Public score: 0.43906

# 2. MinMax scaling + linear-kernel SVM

In [25]:
# Experiment 2 setup: MinMax-scaled features feeding a linear-kernel SVC.
mm_scaler = MinMaxScaler()
svm = SVC(
    kernel="linear",
    probability=True,  # needed for predict_proba / log-loss scoring
    random_state=23,
)
pipe = Pipeline(
    steps=[
        ("SCL", mm_scaler),
        ("SVM", svm),
    ]
)
kfold = StratifiedKFold(n_splits=5, shuffle=True, random_state=23)

# 10 evenly spaced candidates for C between 0.001 and 5.
params = {
    "SVM__C": np.linspace(0.001, 5, 10),
}

In [26]:
# Exhaustive search over the grid, scored by negative log loss on each fold.
gcv = GridSearchCV(
    estimator=pipe,
    param_grid=params,
    cv=kfold,
    scoring="neg_log_loss",
    verbose=3,
)
gcv.fit(X_train, y_train)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
[CV 1/5] END .....................SVM__C=0.001;, score=-1.116 total time=   1.2s
[CV 2/5] END .....................SVM__C=0.001;, score=-1.060 total time=   1.2s
[CV 3/5] END .....................SVM__C=0.001;, score=-1.094 total time=   1.3s
[CV 4/5] END .....................SVM__C=0.001;, score=-1.082 total time=   1.3s
[CV 5/5] END .....................SVM__C=0.001;, score=-1.063 total time=   1.3s
[CV 1/5] END ........SVM__C=0.5564444444444444;, score=-1.091 total time=   1.3s
[CV 2/5] END ........SVM__C=0.5564444444444444;, score=-1.033 total time=   1.2s
[CV 3/5] END ........SVM__C=0.5564444444444444;, score=-1.068 total time=   1.3s
[CV 4/5] END ........SVM__C=0.5564444444444444;, score=-1.055 total time=   1.4s
[CV 5/5] END ........SVM__C=0.5564444444444444;, score=-1.056 total time=   1.3s
[CV 1/5] END ........SVM__C=1.1118888888888887;, score=-1.097 total time=   1.1s
[CV 2/5] END ........SVM__C=1.1118888888888887;,

GridSearchCV(cv=StratifiedKFold(n_splits=5, random_state=23, shuffle=True),
             estimator=Pipeline(steps=[('SCL', MinMaxScaler()),
                                       ('SVM',
                                        SVC(kernel='linear', probability=True,
                                            random_state=23))]),
             param_grid={'SVM__C': array([1.00000000e-03, 5.56444444e-01, 1.11188889e+00, 1.66733333e+00,
       2.22277778e+00, 2.77822222e+00, 3.33366667e+00, 3.88911111e+00,
       4.44455556e+00, 5.00000000e+00])},
             scoring='neg_log_loss', verbose=3)

In [27]:
# Report the winning grid point and its mean cross-validated score.
print("Best Parameters: ", gcv.best_params_)
print("Best Score: ", gcv.best_score_)

Best Parameters:  {'SVM__C': 2.2227777777777775}
Best Score:  -1.0594821507200114


In [28]:
# Pipeline with the best parameters found by the grid search.
best_model = gcv.best_estimator_

In [29]:
# Class-label predictions for the test features.
y_pred = best_model.predict(X_test)
y_pred

array([5, 5, 5, ..., 5, 5, 5], dtype=int64)

In [30]:
# Build the submission table: test-set index as 'Id' next to the predicted label.
submission = pd.DataFrame(
    {
        "Id": wine_qal_test.index,
        "quality": y_pred,
    }
)
submission.head()

Unnamed: 0,Id,quality
0,2056,5
1,2057,5
2,2058,5
3,2059,6
4,2060,6


In [32]:
# Write the submission file without the DataFrame's positional index.
submission.to_csv(
    "win_qual_mm_Scl_svm_linear.csv",
    index=False,
)

In [33]:
# Leaderboard Score
# Score: 0.39669
# Public score: 0.43653

# 3. Standard scaling + RBF (radial) kernel SVM

In [36]:
# Experiment 3: standard-scaled features feeding an RBF-kernel SVC.
std_scaler = StandardScaler()
svm = SVC(
    kernel="rbf",
    probability=True,  # needed for predict_proba / log-loss scoring
    random_state=23,
)
pipe = Pipeline(
    steps=[
        ("SCL", std_scaler),
        ("SVM", svm),
    ]
)
kfold = StratifiedKFold(n_splits=5, shuffle=True, random_state=23)

# Grid: 10 values of C x (10 numeric gammas + the 'scale' and 'auto' presets).
params = {
    "SVM__C": np.linspace(0.001, 5, 10),
    "SVM__gamma": [*np.linspace(0.001, 5, 10), "scale", "auto"],
}

gcv = GridSearchCV(
    estimator=pipe,
    param_grid=params,
    cv=kfold,
    scoring="neg_log_loss",
    verbose=3,
)
gcv.fit(X_train, y_train)

Fitting 5 folds for each of 120 candidates, totalling 600 fits
[CV 1/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.174 total time=   2.1s
[CV 2/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.162 total time=   2.2s
[CV 3/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.125 total time=   2.6s
[CV 4/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.177 total time=   2.1s
[CV 5/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.249 total time=   2.2s
[CV 1/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.176 total time=   2.2s
[CV 2/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.106 total time=   2.5s
[CV 3/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.077 total time=   2.3s
[CV 4/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.085 total time=   2.2s
[CV 5/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.099 total time=   2.3s
[CV 1/5] END SVM__C=0.001, SVM__gamma=1.1118888888888887;, score=-1.176 total

[CV 5/5] END SVM__C=0.5564444444444444, SVM__gamma=2.778222222222222;, score=-1.199 total time=   5.9s
[CV 1/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.225 total time=   6.0s
[CV 2/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.204 total time=   6.3s
[CV 3/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.211 total time=   6.0s
[CV 4/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.206 total time=   6.3s
[CV 5/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.214 total time=   6.1s
[CV 1/5] END SVM__C=0.5564444444444444, SVM__gamma=3.8891111111111107;, score=-1.232 total time=   6.1s
[CV 2/5] END SVM__C=0.5564444444444444, SVM__gamma=3.8891111111111107;, score=-1.216 total time=   5.9s
[CV 3/5] END SVM__C=0.5564444444444444, SVM__gamma=3.8891111111111107;, score=-1.220 total time=   6.2s
[CV 4/5] END SVM__C=0.5564444444444444, SVM__gamma=3.889111111111

[CV 3/5] END SVM__C=1.1118888888888887, SVM__gamma=scale;, score=-1.030 total time=   2.2s
[CV 4/5] END SVM__C=1.1118888888888887, SVM__gamma=scale;, score=-1.028 total time=   2.2s
[CV 5/5] END SVM__C=1.1118888888888887, SVM__gamma=scale;, score=-1.037 total time=   2.2s
[CV 1/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.070 total time=   2.2s
[CV 2/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.036 total time=   2.2s
[CV 3/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.030 total time=   2.3s
[CV 4/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.028 total time=   2.3s
[CV 5/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.037 total time=   2.2s
[CV 1/5] END SVM__C=1.6673333333333331, SVM__gamma=0.001;, score=-1.078 total time=   2.1s
[CV 2/5] END SVM__C=1.6673333333333331, SVM__gamma=0.001;, score=-1.022 total time=   2.3s
[CV 3/5] END SVM__C=1.6673333333333331, SVM__gamma=0.001;, score=-1.055 total time=   2.2s
[CV 

[CV 2/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.148 total time=   4.9s
[CV 3/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.151 total time=   5.0s
[CV 4/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.144 total time=   4.9s
[CV 5/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.156 total time=   5.0s
[CV 1/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.202 total time=   5.4s
[CV 2/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.167 total time=   5.4s
[CV 3/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.173 total time=   5.4s
[CV 4/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.167 total time=   5.4s
[CV 5/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.180 total time=   5.5s
[CV 1/5] END SVM__C=2.2227777777777775, SVM__gamma=2.77822222222

[CV 4/5] END SVM__C=2.778222222222222, SVM__gamma=3.8891111111111107;, score=-1.215 total time=  10.6s
[CV 5/5] END SVM__C=2.778222222222222, SVM__gamma=3.8891111111111107;, score=-1.222 total time=   9.4s
[CV 1/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.235 total time=   8.1s
[CV 2/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.221 total time=   7.6s
[CV 3/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.224 total time=  10.3s
[CV 4/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.222 total time=   8.3s
[CV 5/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.227 total time=   8.5s
[CV 1/5] END SVM__C=2.778222222222222, SVM__gamma=5.0;, score=-1.238 total time=   7.9s
[CV 2/5] END SVM__C=2.778222222222222, SVM__gamma=5.0;, score=-1.224 total time=   7.3s
[CV 3/5] END SVM__C=2.778222222222222, SVM__gamma=5.0;, score=-1.226 total time=   7.7s
[CV 4/5] END SVM__C=

[CV 4/5] END SVM__C=3.8891111111111107, SVM__gamma=0.001;, score=-1.046 total time=   2.3s
[CV 5/5] END SVM__C=3.8891111111111107, SVM__gamma=0.001;, score=-1.046 total time=   2.3s
[CV 1/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.132 total time=   4.3s
[CV 2/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.099 total time=   4.2s
[CV 3/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.106 total time=   4.3s
[CV 4/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.095 total time=   5.2s
[CV 5/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.122 total time=   4.3s
[CV 1/5] END SVM__C=3.8891111111111107, SVM__gamma=1.1118888888888887;, score=-1.160 total time=   5.0s
[CV 2/5] END SVM__C=3.8891111111111107, SVM__gamma=1.1118888888888887;, score=-1.124 total time=   5.2s
[CV 3/5] END SVM__C=3.8891111111111107, SVM__gamma=1.1118888888888887;, score=-1.130 total

[CV 2/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.185 total time=   6.4s
[CV 3/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.192 total time=   6.4s
[CV 4/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.189 total time=   6.4s
[CV 5/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.200 total time=   6.5s
[CV 1/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.223 total time=   8.3s
[CV 2/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.202 total time=   8.4s
[CV 3/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.208 total time=   8.2s
[CV 4/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.204 total time=   7.5s
[CV 5/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.213 total time=   6.9s
[CV 1/5] END SVM__C=4.444555555555556, SVM__gamma=3.8891111111111107;, score=

[CV 3/5] END ......SVM__C=5.0, SVM__gamma=auto;, score=-1.050 total time=   2.6s
[CV 4/5] END ......SVM__C=5.0, SVM__gamma=auto;, score=-1.049 total time=   2.7s
[CV 5/5] END ......SVM__C=5.0, SVM__gamma=auto;, score=-1.067 total time=   2.6s


GridSearchCV(cv=StratifiedKFold(n_splits=5, random_state=23, shuffle=True),
             estimator=Pipeline(steps=[('SCL', StandardScaler()),
                                       ('SVM',
                                        SVC(probability=True,
                                            random_state=23))]),
             param_grid={'SVM__C': array([1.00000000e-03, 5.56444444e-01, 1.11188889e+00, 1.66733333e+00,
       2.22277778e+00, 2.77822222e+00, 3.33366667e+00, 3.88911111e+00,
       4.44455556e+00, 5.00000000e+00]),
                         'SVM__gamma': [0.001, 0.5564444444444444,
                                        1.1118888888888887, 1.6673333333333331,
                                        2.2227777777777775, 2.778222222222222,
                                        3.3336666666666663, 3.8891111111111107,
                                        4.444555555555556, 5.0, 'scale',
                                        'auto']},
             scoring='neg_log_loss', 

In [37]:
# Report the winning grid point and its mean cross-validated score.
print("Best Parameters: ", gcv.best_params_)
print("Best Score: ", gcv.best_score_)

Best Parameters:  {'SVM__C': 0.5564444444444444, 'SVM__gamma': 'scale'}
Best Score:  -1.0354126932900787


In [38]:
# Take the best pipeline from the search and predict class labels for the test features.
best_model = gcv.best_estimator_
y_pred = best_model.predict(X_test)
y_pred

array([5, 6, 6, ..., 5, 5, 5], dtype=int64)

In [39]:
# Build the submission table: test-set index as 'Id' next to the predicted label.
submission = pd.DataFrame(
    {
        "Id": wine_qal_test.index,
        "quality": y_pred,
    }
)
submission.head()

Unnamed: 0,Id,quality
0,2056,5
1,2057,6
2,2058,6
3,2059,6
4,2060,5


In [41]:
# Write the submission file without the DataFrame's positional index.
submission.to_csv(
    "win_qual_std_Scl_svm_rbf.csv",
    index=False,
)

In [40]:
# Leaderboard Score
# Score: 0.45141
# Public score: 0.50007

# 4. MinMax scaling + RBF (radial) kernel SVM

In [42]:
# Experiment 4: MinMax-scaled features feeding an RBF-kernel SVC.
# MinMaxScaler is the scaler class imported at the top of the notebook.
mm_scaler = MinMaxScaler()
svm = SVC(
    kernel='rbf',
    probability=True,  # needed for predict_proba / log-loss scoring
    random_state=23,
)
# Scaling lives inside the pipeline so it is re-fitted on each CV training fold.
pipe = Pipeline([('SCL', mm_scaler), ('SVM', svm)])
kfold = StratifiedKFold(n_splits=5, shuffle=True, random_state=23)

# Grid: 10 values of C x (10 numeric gammas + the 'scale' and 'auto' presets).
params = {
    'SVM__C': np.linspace(0.001, 5, 10),
    'SVM__gamma': list(np.linspace(0.001, 5, 10)) + ['scale', 'auto'],
}

gcv = GridSearchCV(pipe, param_grid=params, cv=kfold, scoring='neg_log_loss', verbose=3)
gcv.fit(X_train, y_train)

Fitting 5 folds for each of 120 candidates, totalling 600 fits
[CV 1/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.221 total time=   2.4s
[CV 2/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.110 total time=   2.2s
[CV 3/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.156 total time=   2.3s
[CV 4/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.117 total time=   2.2s
[CV 5/5] END ...SVM__C=0.001, SVM__gamma=0.001;, score=-1.109 total time=   2.3s
[CV 1/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.118 total time=   2.3s
[CV 2/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.056 total time=   2.3s
[CV 3/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.087 total time=   2.3s
[CV 4/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.072 total time=   2.5s
[CV 5/5] END SVM__C=0.001, SVM__gamma=0.5564444444444444;, score=-1.058 total time=   2.3s
[CV 1/5] END SVM__C=0.001, SVM__gamma=1.1118888888888887;, score=-1.107 total

[CV 5/5] END SVM__C=0.5564444444444444, SVM__gamma=2.778222222222222;, score=-1.025 total time=   2.2s
[CV 1/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.068 total time=   2.1s
[CV 2/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.041 total time=   2.2s
[CV 3/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.037 total time=   2.2s
[CV 4/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.025 total time=   2.2s
[CV 5/5] END SVM__C=0.5564444444444444, SVM__gamma=3.3336666666666663;, score=-1.028 total time=   2.2s
[CV 1/5] END SVM__C=0.5564444444444444, SVM__gamma=3.8891111111111107;, score=-1.068 total time=   2.1s
[CV 2/5] END SVM__C=0.5564444444444444, SVM__gamma=3.8891111111111107;, score=-1.043 total time=   2.2s
[CV 3/5] END SVM__C=0.5564444444444444, SVM__gamma=3.8891111111111107;, score=-1.037 total time=   2.3s
[CV 4/5] END SVM__C=0.5564444444444444, SVM__gamma=3.889111111111

[CV 3/5] END SVM__C=1.1118888888888887, SVM__gamma=scale;, score=-1.033 total time=   2.6s
[CV 4/5] END SVM__C=1.1118888888888887, SVM__gamma=scale;, score=-1.023 total time=   2.7s
[CV 5/5] END SVM__C=1.1118888888888887, SVM__gamma=scale;, score=-1.022 total time=   3.2s
[CV 1/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.075 total time=   2.5s
[CV 2/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.021 total time=   2.3s
[CV 3/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.069 total time=   2.2s
[CV 4/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.050 total time=   2.3s
[CV 5/5] END SVM__C=1.1118888888888887, SVM__gamma=auto;, score=-1.049 total time=   2.4s
[CV 1/5] END SVM__C=1.6673333333333331, SVM__gamma=0.001;, score=-1.122 total time=   2.2s
[CV 2/5] END SVM__C=1.6673333333333331, SVM__gamma=0.001;, score=-1.049 total time=   2.4s
[CV 3/5] END SVM__C=1.6673333333333331, SVM__gamma=0.001;, score=-1.090 total time=   3.3s
[CV 

[CV 2/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.032 total time=   2.4s
[CV 3/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.034 total time=   2.5s
[CV 4/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.023 total time=   2.5s
[CV 5/5] END SVM__C=2.2227777777777775, SVM__gamma=1.6673333333333331;, score=-1.019 total time=   2.5s
[CV 1/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.066 total time=   2.4s
[CV 2/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.039 total time=   2.4s
[CV 3/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.034 total time=   2.5s
[CV 4/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.028 total time=   2.4s
[CV 5/5] END SVM__C=2.2227777777777775, SVM__gamma=2.2227777777777775;, score=-1.027 total time=   2.5s
[CV 1/5] END SVM__C=2.2227777777777775, SVM__gamma=2.77822222222

[CV 4/5] END SVM__C=2.778222222222222, SVM__gamma=3.8891111111111107;, score=-1.035 total time=   2.6s
[CV 5/5] END SVM__C=2.778222222222222, SVM__gamma=3.8891111111111107;, score=-1.052 total time=   2.6s
[CV 1/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.073 total time=   2.9s
[CV 2/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.055 total time=   2.7s
[CV 3/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.046 total time=   2.6s
[CV 4/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.039 total time=   2.6s
[CV 5/5] END SVM__C=2.778222222222222, SVM__gamma=4.444555555555556;, score=-1.056 total time=   2.6s
[CV 1/5] END SVM__C=2.778222222222222, SVM__gamma=5.0;, score=-1.075 total time=   2.5s
[CV 2/5] END SVM__C=2.778222222222222, SVM__gamma=5.0;, score=-1.058 total time=   2.6s
[CV 3/5] END SVM__C=2.778222222222222, SVM__gamma=5.0;, score=-1.049 total time=   2.7s
[CV 4/5] END SVM__C=

[CV 4/5] END SVM__C=3.8891111111111107, SVM__gamma=0.001;, score=-1.083 total time=   2.4s
[CV 5/5] END SVM__C=3.8891111111111107, SVM__gamma=0.001;, score=-1.070 total time=   2.4s
[CV 1/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.057 total time=   2.4s
[CV 2/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.021 total time=   2.5s
[CV 3/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.043 total time=   2.5s
[CV 4/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.026 total time=   2.5s
[CV 5/5] END SVM__C=3.8891111111111107, SVM__gamma=0.5564444444444444;, score=-1.014 total time=   2.6s
[CV 1/5] END SVM__C=3.8891111111111107, SVM__gamma=1.1118888888888887;, score=-1.063 total time=   2.4s
[CV 2/5] END SVM__C=3.8891111111111107, SVM__gamma=1.1118888888888887;, score=-1.028 total time=   2.4s
[CV 3/5] END SVM__C=3.8891111111111107, SVM__gamma=1.1118888888888887;, score=-1.036 total

[CV 2/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.050 total time=   2.5s
[CV 3/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.041 total time=   2.5s
[CV 4/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.034 total time=   2.6s
[CV 5/5] END SVM__C=4.444555555555556, SVM__gamma=2.778222222222222;, score=-1.046 total time=   2.5s
[CV 1/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.075 total time=   2.5s
[CV 2/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.055 total time=   2.5s
[CV 3/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.045 total time=   2.6s
[CV 4/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.039 total time=   2.6s
[CV 5/5] END SVM__C=4.444555555555556, SVM__gamma=3.3336666666666663;, score=-1.054 total time=   2.7s
[CV 1/5] END SVM__C=4.444555555555556, SVM__gamma=3.8891111111111107;, score=

[CV 3/5] END ......SVM__C=5.0, SVM__gamma=auto;, score=-1.060 total time=   2.5s
[CV 4/5] END ......SVM__C=5.0, SVM__gamma=auto;, score=-1.042 total time=   2.5s
[CV 5/5] END ......SVM__C=5.0, SVM__gamma=auto;, score=-1.040 total time=   2.5s


GridSearchCV(cv=StratifiedKFold(n_splits=5, random_state=23, shuffle=True),
             estimator=Pipeline(steps=[('SCL', MinMaxScaler()),
                                       ('SVM',
                                        SVC(probability=True,
                                            random_state=23))]),
             param_grid={'SVM__C': array([1.00000000e-03, 5.56444444e-01, 1.11188889e+00, 1.66733333e+00,
       2.22277778e+00, 2.77822222e+00, 3.33366667e+00, 3.88911111e+00,
       4.44455556e+00, 5.00000000e+00]),
                         'SVM__gamma': [0.001, 0.5564444444444444,
                                        1.1118888888888887, 1.6673333333333331,
                                        2.2227777777777775, 2.778222222222222,
                                        3.3336666666666663, 3.8891111111111107,
                                        4.444555555555556, 5.0, 'scale',
                                        'auto']},
             scoring='neg_log_loss', ve

In [43]:
# Report the winning grid point and its mean cross-validated score.
print("Best Parameters: ", gcv.best_params_)
print("Best Score: ", gcv.best_score_)

Best Parameters:  {'SVM__C': 5.0, 'SVM__gamma': 0.5564444444444444}
Best Score:  -1.0312897379357935


In [44]:
# Take the best pipeline from the search and predict class labels for the test features.
best_model = gcv.best_estimator_
y_pred = best_model.predict(X_test)
y_pred

array([5, 6, 5, ..., 5, 5, 5], dtype=int64)

In [45]:
# Build the submission table: test-set index as 'Id' next to the predicted label.
submission = pd.DataFrame(
    {
        "Id": wine_qal_test.index,
        "quality": y_pred,
    }
)
submission.head()

Unnamed: 0,Id,quality
0,2056,5
1,2057,6
2,2058,5
3,2059,6
4,2060,5


In [46]:
# Write the submission file without the DataFrame's positional index.
submission.to_csv(
    "win_qual_mm_Scl_svm_rbf.csv",
    index=False,
)

In [47]:
# Leaderboard Score
# Score: 0.43059
# Public score: 0.47177

# Leaderboard Score

## Standard Scaler SVM_Linear

#### Score: 0.39382
#### Public score: 0.43906

## MinMax Scaler SVM_Linear

#### Score: 0.39669
#### Public score: 0.43653

## Standard Scaler SVM_rbf

#### Score: 0.45141
#### Public score: 0.50007

## MinMax Scaler SVM_rbf

#### Score: 0.43059
#### Public score: 0.47177