In [5]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split

from sklearn.datasets import load_breast_cancer

In [6]:
# Load the scikit-learn breast-cancer dataset. Despite the name `df`, this is
# the loader's dict-like container (read later via df['data'] / df.data), not
# a pandas DataFrame.
df = load_breast_cancer()

In [7]:
# Peek at the raw feature matrix (a NumPy array; its repr is auto-truncated).
df.data

array([[1.799e+01, 1.038e+01, 1.228e+02, ..., 2.654e-01, 4.601e-01,
        1.189e-01],
       [2.057e+01, 1.777e+01, 1.329e+02, ..., 1.860e-01, 2.750e-01,
        8.902e-02],
       [1.969e+01, 2.125e+01, 1.300e+02, ..., 2.430e-01, 3.613e-01,
        8.758e-02],
       ...,
       [1.660e+01, 2.808e+01, 1.083e+02, ..., 1.418e-01, 2.218e-01,
        7.820e-02],
       [2.060e+01, 2.933e+01, 1.401e+02, ..., 2.650e-01, 4.087e-01,
        1.240e-01],
       [7.760e+00, 2.454e+01, 4.792e+01, ..., 0.000e+00, 2.871e-01,
        7.039e-02]])

In [8]:
# Features as a DataFrame with named columns; labels are kept as the raw
# target array from the dataset container.
x = pd.DataFrame(data=df['data'], columns=df['feature_names'])
y = df['target']

In [9]:
# Hold out 20% of the rows for evaluation; the fixed random_state makes the
# split repeatable across runs.
x_train, x_test, y_train, y_test = train_test_split(
    x,
    y,
    test_size=0.2,
    random_state=100,
)

In [10]:
from sklearn.svm import SVC

In [11]:
# Baseline model: support-vector classifier with library-default hyperparameters.
# NOTE(review): the features are fed in unscaled; SVMs are sensitive to feature
# scale, so a StandardScaler pipeline may be worth evaluating — TODO confirm.
svc = SVC()

In [12]:
# Train the baseline on the training split (fit returns the estimator itself,
# which is what the cell displays).
svc.fit(X=x_train, y=y_train)

SVC()

In [13]:
# Predict labels for the held-out rows.
preds = svc.predict(X=x_test)

In [14]:
from sklearn.metrics import classification_report

In [15]:
# Per-class precision / recall / F1 on the test split. print() is deliberate:
# the report is a pre-formatted multi-line string.
print(classification_report(y_true=y_test, y_pred=preds))

              precision    recall  f1-score   support

           0       0.98      0.90      0.94        49
           1       0.93      0.98      0.96        65

    accuracy                           0.95       114
   macro avg       0.95      0.94      0.95       114
weighted avg       0.95      0.95      0.95       114



In [16]:
from sklearn.model_selection import GridSearchCV

In [17]:
# Search space for the grid search: 4 values of C x 5 values of gamma
# (20 candidate combinations).
params = dict(
    C=[0.1, 1, 10, 100],
    gamma=[1, 0.1, 0.01, 0.001, 0.0001],
)

In [19]:
# Exhaustive cross-validated search over `params`. refit=True retrains the
# best candidate on everything passed to fit(); verbose=True prints progress.
grid = GridSearchCV(
    estimator=SVC(),
    param_grid=params,
    refit=True,
    verbose=True,
)

In [20]:
# Run the search on the training split only, so the test split stays unseen
# during hyperparameter selection.
grid.fit(X=x_train, y=y_train)

Fitting 5 folds for each of 20 candidates, totalling 100 fits


GridSearchCV(estimator=SVC(),
             param_grid={'C': [0.1, 1, 10, 100],
                         'gamma': [1, 0.1, 0.01, 0.001, 0.0001]},
             verbose=True)

In [21]:
# Hyperparameter combination that achieved the best mean cross-validated score.
grid.best_params_

{'C': 10, 'gamma': 0.0001}

In [22]:
# Mean cross-validated score of the best parameter combination (measured on
# the training split's CV folds, not on the held-out test split).
grid.best_score_

0.945054945054945

In [23]:
# Build the tuned classifier straight from the search result instead of
# hand-copying the winning values, so this cell stays correct if the grid,
# the data or the split seed ever changes.
# NOTE: this rebinds `svc`, replacing the baseline model defined earlier.
svc = SVC(**grid.best_params_)

In [24]:
# Train the tuned classifier on the training split.
svc.fit(X=x_train, y=y_train)

SVC(C=10, gamma=0.0001)

In [25]:
# Predict the held-out rows with the tuned model (rebinds `preds`).
preds = svc.predict(X=x_test)

In [26]:
# Test-split report for the tuned model, for comparison with the baseline.
print(classification_report(y_true=y_test, y_pred=preds))

              precision    recall  f1-score   support

           0       0.94      0.96      0.95        49
           1       0.97      0.95      0.96        65

    accuracy                           0.96       114
   macro avg       0.95      0.96      0.96       114
weighted avg       0.96      0.96      0.96       114

