In [None]:
# model_evaluation.ipynb

## IMPORT LIBRARIES

In [None]:
import numpy as np
import pandas as pd
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split, cross_val_score
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import classification_report, confusion_matrix


## LOAD BREAST CANCER DATA SET

In [None]:
# Fetch the bundled breast-cancer dataset and wrap it in pandas objects:
# y is the label vector (named "target"), X the feature matrix with one
# named column per feature.
data = load_breast_cancer()
y = pd.Series(data.target, name="target")
X = pd.DataFrame(data=data.data, columns=data.feature_names)

## SPLIT DATA INTO TRAINING & TEST SETS

In [None]:
# Hold out 20% of the rows for testing. stratify=y keeps the class ratio of
# the full dataset in both partitions, so the hold-out metrics are not skewed
# by an unlucky draw; random_state pins the shuffle for reproducibility.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
    stratify=y,
)


## DEFINE RANDOM FOREST CLASSIFIER MODEL

In [None]:
# 200-tree random forest with no explicit depth limit (max_depth=None);
# the seed is fixed so the model can be rebuilt reproducibly.
clf = RandomForestClassifier(random_state=42, n_estimators=200, max_depth=None)

## FIT RANDOM FOREST CLASSIFIER & PREDICT ON TEST SET

In [None]:
# Train on the training partition, then label the held-out rows.
# fit() returns the fitted estimator itself, so the two calls can be chained.
y_pred = clf.fit(X_train, y_train).predict(X_test)

## PRINT SUMMARIES, CONFUSION MATRIX, & CROSS-VALIDATION SCORES

In [None]:
# Hold-out metrics for the fitted model.
# sep="" stops print() from inserting its default space right after the
# newline, which would shift the first line of each multi-line table by one
# column and misalign it with the rows below.
print("Classification report:\n", classification_report(y_test, y_pred), sep="")
print("Confusion matrix:\n", confusion_matrix(y_test, y_pred), sep="")

# 5-fold cross-validation over the full dataset (X, y). cross_val_score fits
# fresh clones of clf per fold, so the already-fitted clf is left untouched.
cv_scores = cross_val_score(clf, X, y, cv=5, scoring="accuracy")
print("Cross-validated accuracy:", cv_scores.mean())
# The mean alone hides fold-to-fold variation; report the spread as well.
print("Cross-validated accuracy std:", cv_scores.std())