In [1]:

import pandas as pd
import numpy as np


In [2]:
import matplotlib.pyplot as plt
import seaborn as sns


In [3]:
from sklearn.datasets import load_breast_cancer

In [4]:
# Load scikit-learn's bundled breast cancer dataset into a dict-like object.
cancer = load_breast_cancer()


In [5]:
# List the fields exposed by the loaded dataset object.
cancer.keys()

dict_keys(['data', 'target', 'frame', 'target_names', 'DESCR', 'feature_names', 'filename', 'data_module'])

In [6]:
# Wrap the raw feature matrix in a DataFrame whose columns carry the
# dataset's own feature names.
data_feat = pd.DataFrame(
    data=cancer['data'],
    columns=cancer['feature_names'],
)

In [7]:
# Summarise the feature frame: row count, column names, non-null counts and dtypes.
data_feat.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 569 entries, 0 to 568
Data columns (total 30 columns):
 #   Column                   Non-Null Count  Dtype  
---  ------                   --------------  -----  
 0   mean radius              569 non-null    float64
 1   mean texture             569 non-null    float64
 2   mean perimeter           569 non-null    float64
 3   mean area                569 non-null    float64
 4   mean smoothness          569 non-null    float64
 5   mean compactness         569 non-null    float64
 6   mean concavity           569 non-null    float64
 7   mean concave points      569 non-null    float64
 8   mean symmetry            569 non-null    float64
 9   mean fractal dimension   569 non-null    float64
 10  radius error             569 non-null    float64
 11  texture error            569 non-null    float64
 12  perimeter error          569 non-null    float64
 13  area error               569 non-null    float64
 14  smoothness error         5

In [8]:
# Human-readable class names for the labels.
# NOTE(review): presumably target value i corresponds to target_names[i]
# (0 -> 'malignant', 1 -> 'benign') — confirm against the dataset docs.
cancer['target_names']

array(['malignant', 'benign'], dtype='<U9')

In [9]:
from sklearn.model_selection import train_test_split

In [10]:
# Feature matrix and label vector.
x, y = data_feat, cancer['target']

# Hold out 20% of the rows for evaluation; the fixed random_state keeps the
# split repeatable across runs.
x_Train, x_test, y_train, y_test = train_test_split(
    x,
    y,
    test_size=0.2,
    random_state=101,
)

In [11]:
from sklearn.svm import SVC

In [12]:
# Baseline classifier: SVC with every hyperparameter left at its default.
# NOTE(review): the features are passed in unscaled; SVMs are generally
# sensitive to feature scale, so standardising first is worth trying — confirm.
model = SVC()


In [13]:
# Fit the baseline SVC on the training split only.
model.fit(x_Train,y_train)

In [15]:
# Predict labels for the held-out test rows with the baseline model.
predictions = model.predict(x_test)

In [17]:
from sklearn.metrics import classification_report, confusion_matrix

In [18]:
# Baseline evaluation on the test split: confusion matrix first, then the
# per-class precision/recall/F1 report, each starting on its own line.
print(
    confusion_matrix(y_test, predictions),
    classification_report(y_test, predictions),
    sep='\n',
)

[[36  6]
 [ 0 72]]
              precision    recall  f1-score   support

           0       1.00      0.86      0.92        42
           1       0.92      1.00      0.96        72

    accuracy                           0.95       114
   macro avg       0.96      0.93      0.94       114
weighted avg       0.95      0.95      0.95       114



In [20]:
from sklearn.model_selection import GridSearchCV


In [21]:
# Candidate hyperparameter values for the grid search:
# 5 values of C x 5 values of gamma = 25 combinations.
param_grid = {
    'C': [0.1, 1, 10, 100, 1000],
    'gamma': [1, 0.1, 0.01, 0.001, 0.0001],
}

In [22]:
# Exhaustive search over param_grid using a fresh SVC as the base estimator.
# verbose=3 makes the search log a line per cross-validation fit.
grid = GridSearchCV(
    estimator=SVC(),
    param_grid=param_grid,
    verbose=3,
)

In [23]:
# Run the cross-validated search on the training split only; the recorded log
# reports 5 folds for each of 25 candidates (125 fits in total).
grid.fit(x_Train, y_train)

Fitting 5 folds for each of 25 candidates, totalling 125 fits
[CV 1/5] END ....................C=0.1, gamma=1;, score=0.626 total time=   0.1s
[CV 2/5] END ....................C=0.1, gamma=1;, score=0.626 total time=   0.0s
[CV 3/5] END ....................C=0.1, gamma=1;, score=0.626 total time=   0.0s
[CV 4/5] END ....................C=0.1, gamma=1;, score=0.626 total time=   0.0s
[CV 5/5] END ....................C=0.1, gamma=1;, score=0.626 total time=   0.0s
[CV 1/5] END ..................C=0.1, gamma=0.1;, score=0.626 total time=   0.0s
[CV 2/5] END ..................C=0.1, gamma=0.1;, score=0.626 total time=   0.0s
[CV 3/5] END ..................C=0.1, gamma=0.1;, score=0.626 total time=   0.0s
[CV 4/5] END ..................C=0.1, gamma=0.1;, score=0.626 total time=   0.0s
[CV 5/5] END ..................C=0.1, gamma=0.1;, score=0.626 total time=   0.0s
[CV 1/5] END .................C=0.1, gamma=0.01;, score=0.626 total time=   0.0s
[CV 2/5] END .................C=0.1, gamma=0.01

In [24]:
# Hyperparameter combination selected by the search.
grid.best_params_

{'C': 10, 'gamma': 0.0001}

In [25]:
# Estimator object configured with the selected hyperparameters.
grid.best_estimator_

In [26]:
# Predict labels for the held-out test rows via the fitted grid-search object.
grid_predict = grid.predict(x_test)

In [27]:
# Evaluation of the grid-search predictions on the test split: confusion
# matrix first, then the per-class precision/recall/F1 report.
print(
    confusion_matrix(y_test, grid_predict),
    classification_report(y_test, grid_predict),
    sep='\n',
)

[[36  6]
 [ 0 72]]
              precision    recall  f1-score   support

           0       1.00      0.86      0.92        42
           1       0.92      1.00      0.96        72

    accuracy                           0.95       114
   macro avg       0.96      0.93      0.94       114
weighted avg       0.95      0.95      0.95       114

