<a href="https://colab.research.google.com/github/sirikuragayathri/samsung.md/blob/main/KNN.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import numpy as np
import time
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.neighbors import KNeighborsClassifier
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score, classification_report, roc_auc_score

In [2]:
# Load the breast cancer dataset
df = load_breast_cancer()

X = df.data

y = df.target


In [3]:

# Split data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42, stratify=y)


In [4]:
# Feature Scaling is critical for KNN and SVM
scaler = StandardScaler()

X_train_scaled = scaler.fit_transform(X_train)

X_test_scaled = scaler.transform(X_test)

In [5]:
# Initialize and train the KNN Classifier
start_time_knn = time.time()

knn_model = KNeighborsClassifier(n_neighbors=5)

knn_model.fit(X_train_scaled, y_train)

end_time_knn = time.time()


In [6]:
# Make predictions and evaluate
y_pred_knn = knn_model.predict(X_test_scaled)

accuracy_knn = accuracy_score(y_test, y_pred_knn)

roc_auc_knn = roc_auc_score(y_test, y_pred_knn)

training_time_knn = end_time_knn - start_time_knn


In [7]:
print("=== K-Nearest Neighbors (KNN) ===")
print(f"Accuracy: {accuracy_knn:.4f}")

print(f"ROC AUC Score: {roc_auc_knn:.4f}")

print(f"Training Time: {training_time_knn:.4f} seconds")

print("\nClassification Report:")
print(classification_report(y_test, y_pred_knn))

=== K-Nearest Neighbors (KNN) ===
Accuracy: 0.9591
ROC AUC Score: 0.9453
Training Time: 0.0016 seconds

Classification Report:
              precision    recall  f1-score   support

           0       1.00      0.89      0.94        64
           1       0.94      1.00      0.97       107

    accuracy                           0.96       171
   macro avg       0.97      0.95      0.96       171
weighted avg       0.96      0.96      0.96       171



In [8]:
# Initialize and train the SVM Classifier
start_time_svm = time.time()
svm_model = SVC(kernel='rbf',
                C=1.0,
                gamma='scale',
                random_state=42)

svm_model.fit(X_train_scaled, y_train)

end_time_svm = time.time()

In [9]:
# Make predictions and evaluate
y_pred_svm = svm_model.predict(X_test_scaled)

accuracy_svm = accuracy_score(y_test, y_pred_svm)

roc_auc_svm = roc_auc_score(y_test, y_pred_svm)

training_time_svm = end_time_svm - start_time_svm

In [10]:
print("\n=== Support Vector Machine (SVM) ===")
print(f"Accuracy: {accuracy_svm:.4f}")

print(f"ROC AUC Score: {roc_auc_svm:.4f}")

print(f"Training Time: {training_time_svm:.4f} seconds")

print("\nClassification Report:")
print(classification_report(y_test, y_pred_svm))


=== Support Vector Machine (SVM) ===
Accuracy: 0.9766
ROC AUC Score: 0.9750
Training Time: 0.0191 seconds

Classification Report:
              precision    recall  f1-score   support

           0       0.97      0.97      0.97        64
           1       0.98      0.98      0.98       107

    accuracy                           0.98       171
   macro avg       0.98      0.98      0.98       171
weighted avg       0.98      0.98      0.98       171

