In [2]:
import numpy as np
import pandas as pd
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LinearRegression, LogisticRegression
from sklearn.metrics import mean_squared_error

# --- Data ---------------------------------------------------------------
# scikit-learn's breast-cancer dataset: X is the feature matrix and y holds
# the class label of each sample.
data = load_breast_cancer()
X, y = data.data, data.target

# Hold out 20% of the samples for evaluation; the fixed seed keeps the split
# reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# --- Preprocessing ------------------------------------------------------
# The scaler is fitted on the training split only, and those same
# statistics are then applied to both splits.
sc = StandardScaler().fit(X_train)
X_train_std = sc.transform(X_train)
X_test_std = sc.transform(X_test)

# --- Models -------------------------------------------------------------
# Both estimators are trained on the same standardized features and the
# same labels, so their errors below are directly comparable.
lr = LinearRegression().fit(X_train_std, y_train)
clf = LogisticRegression().fit(X_train_std, y_train)

# --- Predictions --------------------------------------------------------
# Linear regression yields a raw real-valued prediction per test sample.
preds_lr = lr.predict(X_test_std)
# predict_proba returns one column per class; column 1 is kept so the
# logistic model is scored on a probability rather than on a hard label.
preds_log = clf.predict_proba(X_test_std)[:, 1]

# --- Evaluation ---------------------------------------------------------
# Mean squared error of each model's output against the true test labels.
mse_linear = mean_squared_error(y_test, preds_lr)
mse_logistic = mean_squared_error(y_test, preds_log)

print(f"MSE Linear Regression: {mse_linear:.5f}")
print(f"MSE Logistic Regression: {mse_logistic:.5f}")

MSE Linear Regression: 0.06411
MSE Logistic Regression: 0.01670
