In [18]:
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix

In [19]:
# Load scikit-learn's bundled breast-cancer dataset: feature matrix and labels.
breast_cancer = load_breast_cancer()
X, y = breast_cancer.data, breast_cancer.target
feature_names = breast_cancer.feature_names

# Only these three columns are used as model inputs.
selected_features = ['worst compactness', 'worst concavity', 'worst area']

# Map every feature name to its column position in X, then resolve the
# selected names to column indices (order follows `selected_features`).
feature_indices = dict(zip(feature_names, range(len(feature_names))))
feature_indices_to_use = [feature_indices[col] for col in selected_features]

# Keep all rows, but only the selected columns.
X_selected = X[:, feature_indices_to_use]


In [26]:
# 60% of the samples go to training and the remainder is held out for testing;
# the fixed seed makes the split repeatable across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X_selected,
    y,
    train_size=0.6,
    random_state=9,
)

In [27]:
# Fit the scaler on the training split only, then apply that same fitted
# transformation to both splits so the test data never influences the scaling.
scaler = StandardScaler().fit(X_train)
X_train_scaled = scaler.transform(X_train)
X_test_scaled = scaler.transform(X_test)

In [28]:
# Linear-kernel SVM trained on the standardized training split
# (`fit` returns the estimator itself, so the call can be chained).
svm_linear = SVC(kernel='linear', random_state=9).fit(X_train_scaled, y_train)

# Predicted class labels for the held-out samples.
y_pred_linear = svm_linear.predict(X_test_scaled)

What is the accuracy of the classification model with a linear kernel?

In [29]:
# Score the linear model's predictions against the true test labels.
linear_accuracy = accuracy_score(y_test, y_pred_linear)

# Label and value are printed on separate lines.
print("lin accuracy", linear_accuracy, sep="\n")

lin accuracy
0.9385964912280702


What is the accuracy of the classification model with a radial basis function (RBF)
kernel and the regularization parameter set to C=2?

In [30]:
# RBF-kernel SVM with C=2, trained on the same standardized training split
# as the linear model so the two accuracies are directly comparable.
svm_rbf = SVC(kernel='rbf', C=2, random_state=9).fit(X_train_scaled, y_train)

# Predict the held-out samples and score against the true labels.
y_pred_rbf = svm_rbf.predict(X_test_scaled)
rbf_accuracy = accuracy_score(y_test, y_pred_rbf)

# Label and value are printed on separate lines.
print("radial basis func accuracy", rbf_accuracy, sep="\n")

radial basis func accuracy
0.9429824561403509
