In [3]:
# Import necessary libraries
from sklearn.datasets import load_breast_cancer
from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score, confusion_matrix
import pandas as pd

# --- Data loading ------------------------------------------------------------
# Fetch the bundled breast-cancer dataset object; its `.data`,
# `.feature_names` and `.target` attributes are consumed below.
data = load_breast_cancer()

# Feature matrix: the raw measurements, one labelled column per entry in
# data.feature_names. This is the model input.
X = pd.DataFrame(data=data.data, columns=data.feature_names)

# Label vector built from data.target; this is what the model learns to predict.
# NOTE(review): scikit-learn documents this dataset's encoding as
# 0 = malignant, 1 = benign -- confirm via data.target_names before
# interpreting the confusion matrix printed at the end.
y = pd.Series(data.target)

# --- Train/test split --------------------------------------------------------
# Hold out 30% of the rows for evaluation; the fixed seed keeps the partition
# reproducible between runs.
TEST_FRACTION = 0.3
RANDOM_SEED = 42
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=TEST_FRACTION,
    random_state=RANDOM_SEED,
)

# --- Model training ----------------------------------------------------------
# Depth-limited random forest. fit() hands back the fitted estimator itself,
# so construction and training can be chained into a single expression.
N_TREES = 100
MAX_TREE_DEPTH = 10
rf = RandomForestClassifier(
    n_estimators=N_TREES,
    max_depth=MAX_TREE_DEPTH,
    random_state=RANDOM_SEED,
).fit(X_train, y_train)

# --- Evaluation --------------------------------------------------------------
# Score the held-out rows only; the training rows play no part in the metrics.
y_pred = rf.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
# Per scikit-learn's documented convention, rows are true classes and columns
# are predicted classes.
conf_matrix = confusion_matrix(y_test, y_pred)

# --- Report ------------------------------------------------------------------
# Accuracy is a fraction in [0, 1]; scale it to a percentage for display.
print("Accuracy of the Random Forest model: {:.2f}%".format(100 * accuracy))
print("Confusion Matrix:")
print(conf_matrix)


Accuracy of the Random Forest model: 97.08%
Confusion Matrix:
[[ 59   4]
 [  1 107]]
