## Testing the Accuracy of the Model Before and After Standardizing the Features

A KNN model is evaluated on scikit-learn's breast cancer dataset to check whether its accuracy changes when the features of the dataset are standardized (scaled) using StandardScaler.

In [1]:
from sklearn import datasets
from sklearn.model_selection import cross_val_score
from sklearn.neighbors import KNeighborsClassifier
from numpy import mean

# Fetch the breast cancer data and pull out the feature matrix and labels
df = datasets.load_breast_cancer()
X, y = df.data, df.target

# Baseline classifier: KNN with default settings, trained on unscaled features
model = KNeighborsClassifier()

# 10-fold cross-validated accuracy, using every available core
cv_options = {'scoring': 'accuracy', 'cv': 10, 'n_jobs': -1}
scores = cross_val_score(model, X, y, **cv_options)

# Report the accuracy averaged over the folds
mean_accuracy = mean(scores)
print(f'Accuracy: {mean_accuracy:.2f}')

Accuracy: 0.93


In [2]:
from numpy import mean
from sklearn import datasets
from sklearn.model_selection import cross_val_score
from sklearn.neighbors import KNeighborsClassifier
from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import StandardScaler

# loading dataset and configuring features and target variables
df = datasets.load_breast_cancer()
X = df.data
y = df.target

# Standardizing features
# The scaler is NOT fitted on the full dataset here. Calling
# scaler.fit_transform(X) before cross-validation would let every held-out
# fold contribute to the mean/variance used to scale its own training data
# (data leakage), which biases the reported accuracy upwards.
scaler = StandardScaler()

# Instantiating model
model = KNeighborsClassifier()

# Chain scaling and classification into a single estimator. cross_val_score
# clones and refits the whole pipeline for each split, so the scaler only
# sees the training folds and is then applied to the held-out fold.
pipeline = make_pipeline(scaler, model)

# Evaluating the model (raw X is passed in; scaling happens inside each fold)
scores = cross_val_score(pipeline, X, y, scoring='accuracy', cv=10, n_jobs=-1)

# Model's average score
print(f'Accuracy: {mean(scores):.2f}')

Accuracy: 0.97
