In [1]:
import pandas as pd
from sklearn.ensemble import RandomForestRegressor
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_absolute_error, mean_squared_error

# ---------------------------------------------------------------------------
# Wait-time regression demo: build a tiny frame, hold out part of it, fit a
# random forest on the rest and report MSE / MAE on the held-out rows.
# ---------------------------------------------------------------------------

# Knobs shared by the split and the model so both are reproducible.
SEED = 42
TEST_FRACTION = 0.2
FEATURE_COLUMNS = ["CapacityUtilization", "DayOfWeek", "HistoricalWaitTime"]
TARGET_COLUMN = "WaitTime"

# Example observations, one list entry per row.
data = pd.DataFrame(
    {
        # Hospital capacity utilization, expressed as a ratio.
        "CapacityUtilization": [0.8, 0.6, 0.9, 0.4],
        # Day of the week, numerically encoded.
        "DayOfWeek": [1, 3, 4, 5],
        # Historical average wait time, in minutes.
        "HistoricalWaitTime": [30, 45, 20, 60],
        # Actually observed wait time -- the regression target.
        "WaitTime": [35, 50, 25, 55],
    }
)

# Model inputs (column order kept as listed above) and the value to predict.
features = data.loc[:, FEATURE_COLUMNS]
target = data[TARGET_COLUMN]

# Hold out a fraction of the rows for evaluation.
# NOTE: with only four rows and a 0.2 test fraction the hold-out set is a
# single row, so MSE is simply MAE squared and neither number is a reliable
# estimate of model quality -- this cell only illustrates the workflow.
X_train, X_test, y_train, y_test = train_test_split(
    features,
    target,
    test_size=TEST_FRACTION,
    random_state=SEED,
)

# Build the 100-tree forest and fit it on the training rows
# (`fit` returns the estimator itself, so the chained form is equivalent).
rf_model = RandomForestRegressor(n_estimators=100, random_state=SEED).fit(
    X_train, y_train
)

# Predict wait times for the held-out rows.
predictions = rf_model.predict(X_test)

# Score the predictions against the observed targets.
mse = mean_squared_error(y_test, predictions)
mae = mean_absolute_error(y_test, predictions)

# Report both metrics, one per line.
report = (
    ("Mean Squared Error:", mse),
    ("Mean Absolute Error:", mae),
)
for label, value in report:
    print(label, value)


Mean Squared Error: 156.25
Mean Absolute Error: 12.5
