In [1]:
# breast_cancer_model.ipynb

import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, f1_score
from sklearn.preprocessing import LabelEncoder

# Load the breast cancer dataset bundled with scikit-learn
from sklearn.datasets import load_breast_cancer
data = load_breast_cancer()

# Feature table, with the dataset's own target kept alongside as 'target'
df = pd.DataFrame(data.data, columns=data.feature_names).assign(target=data.target)

# Simulated 'priority' label: low, medium, high.
# NOTE: the label is drawn at random and never looks at any feature column,
# so the classifier below has no signal to learn from. Scores close to chance
# (about 1/3 for three equally likely classes) are the expected outcome here.
np.random.seed(42)  # fixed seed so the simulated labels are reproducible
priority_levels = ['low', 'medium', 'high']
df['priority'] = np.random.choice(priority_levels, size=df.shape[0])

# Integer-encode the string labels; the fitted encoder is kept so that
# predictions can be mapped back to their names later.
label_encoder = LabelEncoder()
df['priority_encoded'] = label_encoder.fit_transform(df['priority'])

# Model inputs: every column except the two label columns and the original
# target. Model output: the encoded priority.
non_feature_columns = ['priority', 'priority_encoded', 'target']
X = df.drop(non_feature_columns, axis='columns')
y = df['priority_encoded']

# Hold out 20% of the rows for evaluation (seeded split)
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1,
)

# Fit a 100-tree random forest on the training portion (fit() returns the
# estimator itself, so construction and training can be chained)
clf = RandomForestClassifier(n_estimators=100, random_state=1).fit(X_train, y_train)

# Predict priorities for the held-out rows
y_pred = clf.predict(X_test)

# Score the predictions; F1 is averaged across classes weighted by support
acc = accuracy_score(y_test, y_pred)
f1 = f1_score(y_test, y_pred, average='weighted')

print(f"Accuracy: {acc:.2f}")
print(f"F1 Score: {f1:.2f}")


Accuracy: 0.33
F1 Score: 0.34
