# In [None]:
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, roc_auc_score, classification_report
import pandas as pd
import joblib

# Read the labeled samples from disk.
labeled_data = pd.read_csv('../data/labeled_data.csv')

# 'Disease' is the prediction target; every other column is used as a feature.
features = labeled_data.drop(columns='Disease')
target = labeled_data['Disease']

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split
# reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    features,
    target,
    test_size=0.2,
    random_state=42,
)

# Both classifiers share the same hyperparameters: 100 trees, fixed seed.
forest_params = {'n_estimators': 100, 'random_state': 42}

# Alzheimer's: fit on the training split, then persist the fitted forest.
alzheimers_model = RandomForestClassifier(**forest_params).fit(X_train, y_train)
joblib.dump(alzheimers_model, '../models/alzheimers_model.pkl')

# Huntington's: fit and persist in the same way.
# NOTE(review): this uses the same training split, the same 'Disease' target
# and the same seed as the Alzheimer's model above, so the two fitted forests
# should be identical. Confirm whether a Huntington's-specific target or
# dataset was intended here.
huntingtons_model = RandomForestClassifier(**forest_params).fit(X_train, y_train)
joblib.dump(huntingtons_model, '../models/huntingtons_model.pkl')

# Evaluate the Alzheimer's model on the held-out split.
y_pred = alzheimers_model.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)

# ROC AUC measures how well the model *ranks* samples, so it must be computed
# from continuous scores. Feeding it hard class predictions collapses the ROC
# curve to a single threshold and misreports the AUC (and raises outright for
# a target with more than two classes).
y_score = alzheimers_model.predict_proba(X_test)
if y_score.shape[1] == 2:
    # Binary target: score with the probability of the greater-labelled class
    # (column 1 of predict_proba, i.e. alzheimers_model.classes_[1]).
    roc_auc = roc_auc_score(y_test, y_score[:, 1])
else:
    # Multiclass target: one-vs-rest AUC over the full probability matrix;
    # `labels` pins the column order to the model's class order.
    roc_auc = roc_auc_score(
        y_test,
        y_score,
        multi_class='ovr',
        labels=alzheimers_model.classes_,
    )

print(f"Alzheimer's Model Accuracy: {accuracy}")
print(f"Alzheimer's Model AUC: {roc_auc}")
print(classification_report(y_test, y_pred))
