# 💊 $12M Cost-Cut Rx — Healthcare Analytics Demo
This notebook demonstrates Pareto analysis and claim denial prediction modeling using sample data.

In [None]:

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import roc_auc_score

# Read the sample claims extract into a DataFrame. The path is relative to the
# notebook's working directory.
df = pd.read_csv(filepath_or_buffer='sample_claims_data.csv')

# Preview the first five rows (head()'s default) as the cell output.
df.head(n=5)


## 📊 Pareto Analysis — Identifying High-Cost Members

In [None]:

# Rank rows from highest to lowest total cost and attach each row's running
# share of overall spend as a percentage (0-100).
df_sorted = (
    df.sort_values('total_cost', ascending=False)
      .assign(
          cum_perc=lambda ranked: ranked['total_cost'].cumsum()
          / ranked['total_cost'].sum() * 100
      )
)

# The 95th percentile of total cost is the cut-off for the top 5% of rows;
# rows at or above it are flagged with 1, all others with 0. The flag is
# written onto `df` itself so later cells can use it.
threshold = df['total_cost'].quantile(0.95)
df['high_cost_flag'] = df['total_cost'].ge(threshold).astype(int)

# Pareto curve: cumulative spend share against rank position, with a dashed
# reference line at 80% of spend.
fig, ax = plt.subplots(figsize=(8, 5))
rank_positions = np.arange(len(df_sorted))
ax.plot(rank_positions, df_sorted['cum_perc'], label='Cumulative % of Spend')
ax.axhline(80, color='r', linestyle='--', label='80% Line')
ax.set_title('Pareto Curve: Cumulative Spend Distribution')
ax.set_xlabel('Patients (sorted by total cost)')
ax.set_ylabel('Cumulative % of Spend')
ax.legend()
fig.tight_layout()
plt.show()


## 🤖 Predictive Model — Claim Denial Prediction

In [None]:

# Predictor columns and target for the denial model.
# NOTE(review): the code below treats `denied_claim` as a two-class label (it
# reads column 1 of predict_proba and computes a single-score ROC AUC) —
# confirm the column is encoded 0/1.
features = ['age', 'chronic_conditions', 'ed_visits', 'total_cost']
X = df[features]
y = df['denied_claim']

# Train/test split: hold out 20% of rows for evaluation.
# Stratifying on the target keeps the class proportions the same in the train
# and test sets. Without it, a rare positive class can end up under-represented
# or absent in the hold-out set, which makes the AUC unstable or causes
# roc_auc_score to raise when only one class is present in y_test.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)

# Train model: 100-tree random forest, seeded so reruns give the same result.
model = RandomForestClassifier(n_estimators=100, random_state=42)
model.fit(X_train, y_train)

# Column 1 of predict_proba is the probability of the second entry in
# model.classes_ (the positive class when labels are 0/1).
y_pred_prob = model.predict_proba(X_test)[:, 1]

# Evaluate: area under the ROC curve on the held-out rows.
auc = roc_auc_score(y_test, y_pred_prob)
print(f'Model AUC: {auc:.3f}')


## 💡 Insights
- The Pareto principle confirms a small cohort drives most spend.
- Predictive modeling enables proactive denial prevention.
- This notebook represents an end-to-end healthcare analytics workflow.

**Next Steps:** Integrate real data, expand features, and publish dashboards for leadership insights.