In [1]:
from sklearn import datasets
import numpy as np

# Load both datasets with as_frame=True so that .data and .target come back
# as pandas objects (later cells select feature columns from .data).
data_breast_cancer = datasets.load_breast_cancer(as_frame=True)
data_iris = datasets.load_iris(as_frame=True)

In [2]:
from sklearn.model_selection import train_test_split

In [3]:
# Select the two features by name instead of by position: the selection is
# self-documenting and no longer depends on column order. These are the
# columns found at positions 3 and 4 of the breast-cancer frame.
X = data_breast_cancer.data[["mean area", "mean smoothness"]]
y = data_breast_cancer.target

# Hold out 20% of the samples for testing; the fixed seed keeps the split
# reproducible across runs.
(
    breast_cancer_X_train,
    breast_cancer_X_test,
    breast_cancer_y_train,
    breast_cancer_y_test,
) = train_test_split(X, y, test_size=0.2, random_state=42)

In [4]:
from sklearn.pipeline import Pipeline
from sklearn.preprocessing import StandardScaler
from sklearn.svm import LinearSVC

In [5]:
# Baseline: the linear SVM is fitted directly on the raw feature values.
# Pipeline.fit returns the pipeline itself, so construction and fitting chain.
svm_clf = Pipeline(
    steps=[
        ("linear_svc", LinearSVC(C=1, loss="hinge", random_state=42)),
    ]
).fit(breast_cancer_X_train, breast_cancer_y_train)

# Same classifier, but the features are standardised before reaching it.
svm_clf_scaled = Pipeline(
    steps=[
        ("scaler", StandardScaler()),
        ("linear_svc", LinearSVC(C=1, loss="hinge", random_state=42)),
    ]
).fit(breast_cancer_X_train, breast_cancer_y_train)

# Trailing expression so the cell still displays the fitted scaled pipeline.
svm_clf_scaled



Pipeline(steps=[('scaler', StandardScaler()),
                ('linear_svc', LinearSVC(C=1, loss='hinge', random_state=42))])

In [6]:
# Accuracy of the unscaled pipeline on the training and the held-out split.
train_svm_clf_score = svm_clf.score(breast_cancer_X_train, breast_cancer_y_train)
test_svm_clf_score = svm_clf.score(breast_cancer_X_test, breast_cancer_y_test)

# Same two measurements for the pipeline that standardises features first.
train_svm_clf_scaled_score = svm_clf_scaled.score(breast_cancer_X_train, breast_cancer_y_train)
test_svm_clf_scaled_score = svm_clf_scaled.score(breast_cancer_X_test, breast_cancer_y_test)

In [7]:
import pickle

# Fixed order: unscaled train, unscaled test, scaled train, scaled test.
scores = [
    train_svm_clf_score,
    test_svm_clf_score,
    train_svm_clf_scaled_score,
    test_svm_clf_scaled_score,
]
print(scores)

# Persist the list of accuracies as a pickle in the working directory.
with open('bc_acc.pkl', 'wb') as acc_file:
    pickle.dump(scores, acc_file)

[0.6285714285714286, 0.6228070175438597, 0.8923076923076924, 0.9298245614035088]


In [8]:
# Select the two petal measurements by name instead of by position: the
# selection is self-documenting and no longer depends on column order. These
# are the columns found at positions 2 and 3 of the iris frame.
X = data_iris.data[["petal length (cm)", "petal width (cm)"]]
# Binary target: True for class 2 (virginica in this dataset's target_names),
# False for the other two classes.
y = (data_iris.target == 2)

# Hold out 20% of the samples for testing; the fixed seed keeps the split
# reproducible across runs.
iris_X_train, iris_X_test, iris_y_train, iris_y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

In [9]:
# Baseline: the linear SVM is fitted directly on the raw petal measurements.
# Pipeline.fit returns the pipeline itself, so construction and fitting chain.
svm_clf_i = Pipeline(
    steps=[
        ("linear_svc", LinearSVC(C=1, loss="hinge", random_state=42)),
    ]
).fit(iris_X_train, iris_y_train)

# Same classifier, but the features are standardised before reaching it.
svm_clf_i_scaled = Pipeline(
    steps=[
        ("scaler", StandardScaler()),
        ("linear_svc", LinearSVC(C=1, loss="hinge", random_state=42)),
    ]
).fit(iris_X_train, iris_y_train)

# Trailing expression so the cell still displays the fitted scaled pipeline.
svm_clf_i_scaled



Pipeline(steps=[('scaler', StandardScaler()),
                ('linear_svc', LinearSVC(C=1, loss='hinge', random_state=42))])

In [10]:
# NOTE: these four names were bound to the breast-cancer scores in an earlier
# cell; running this cell rebinds them to the iris results.

# Accuracy of the unscaled iris pipeline on the training and held-out split.
train_svm_clf_score = svm_clf_i.score(iris_X_train, iris_y_train)
test_svm_clf_score = svm_clf_i.score(iris_X_test, iris_y_test)

# Same two measurements for the pipeline that standardises features first.
train_svm_clf_scaled_score = svm_clf_i_scaled.score(iris_X_train, iris_y_train)
test_svm_clf_scaled_score = svm_clf_i_scaled.score(iris_X_test, iris_y_test)

In [11]:
# Fixed order: unscaled train, unscaled test, scaled train, scaled test.
scores = [
    train_svm_clf_score,
    test_svm_clf_score,
    train_svm_clf_scaled_score,
    test_svm_clf_scaled_score,
]
print(scores)

# Persist the list of accuracies as a pickle in the working directory.
with open('iris_acc.pkl', 'wb') as acc_file:
    pickle.dump(scores, acc_file)

[0.9416666666666667, 1.0, 0.9416666666666667, 1.0]
