# Cancer Cell Classification using Scikit‑learn
This notebook walks through data exploration, model training, and evaluation.

In [None]:
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score, confusion_matrix, ConfusionMatrixDisplay
import pandas as pd
import matplotlib.pyplot as plt

## Load dataset

In [None]:
# Load the bundled breast cancer dataset and pull out the feature matrix and labels.
data = load_breast_cancer()
X = data.data
y = data.target

# DESCR is reStructuredText; in recent scikit-learn releases it opens with a
# link-target line (".. _breast_cancer_dataset:"), so the first raw line is an
# anchor rather than the dataset title. Print the first non-blank line that is
# not an RST directive instead (falls back to an empty string if none exists).
print(next(
    (line.strip() for line in data.DESCR.splitlines()
     if line.strip() and not line.lstrip().startswith('..')),
    '',
))

## DataFrame preview

In [None]:
# Wrap the raw feature matrix in a DataFrame with named columns for inspection.
df = pd.DataFrame(data=X, columns=data.feature_names)
df.head(5)  # first five rows, rendered as the cell's output

## Train‑test split

In [None]:
# Hold out 33% of the samples for evaluation. Stratifying on y keeps the class
# proportions the same in the training and test partitions, so the test metrics
# are not skewed by an uneven class mix; the fixed seed makes the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.33, random_state=42, stratify=y
)

## Train Naive Bayes model

In [None]:
# Fit a Gaussian Naive Bayes classifier on the training partition.
# fit() returns the estimator itself, so construction and fitting are chained;
# the bare name on the last line keeps the estimator repr as the cell output.
model = GaussianNB().fit(X_train, y_train)
model

## Evaluate model

In [None]:
# Score the fitted classifier on the held-out test partition only.
y_pred = model.predict(X_test)
acc = accuracy_score(y_test, y_pred)
print(f'Accuracy: {acc*100:.2f}%')

# Pin the matrix's label order to the classes the model was fitted on, so its
# shape does not depend on which labels happen to appear in y_test / y_pred and
# stays consistent with the display labels taken from data.target_names.
cm = confusion_matrix(y_test, y_pred, labels=model.classes_)

# Draw on an explicit Axes so the figure can be titled and stands on its own.
fig, ax = plt.subplots()
ConfusionMatrixDisplay(confusion_matrix=cm, display_labels=data.target_names).plot(ax=ax)
ax.set_title('GaussianNB confusion matrix (test set)')
plt.show()