## Real-World Case Studies

### Finance - Fraud Detection Models:
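**Description**: Analyze a (synthetic) financial transaction dataset, define SLAs
(service-level agreements) for data completeness and for the accuracy of anomaly
flags against known fraud labels, and check that both SLAs are met to ensure high
data quality for fraud detection models.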

In [1]:
import pandas as pd
import numpy as np
from sklearn.ensemble import IsolationForest

# Build a synthetic transaction dataset, flag anomalies with an Isolation
# Forest, and evaluate two SLAs: data completeness and flag accuracy.

# --- Configuration -----------------------------------------------------------
SEED = 42                                # shared by data generation and the model
N_LEGIT = 980                            # rows labelled is_fraud == 0
N_FRAUD = 20                             # rows labelled is_fraud == 1
N_TRANSACTIONS = N_LEGIT + N_FRAUD

accuracy_sla = 99       # minimum % of rows where `anomaly` equals `is_fraud`
completeness_sla = 95   # minimum % of non-null cells, averaged over columns

# --- Synthetic data ----------------------------------------------------------
# A seeded generator makes the cell reproducible under Restart & Run All;
# drawing from the unseeded global np.random state gave different data
# (and potentially a different SLA verdict) on every run.
rng = np.random.default_rng(SEED)

data = pd.DataFrame({
    "transaction_id": range(1, N_TRANSACTIONS + 1),
    # Legitimate amounts cluster around 100, fraudulent ones around 1000.
    "amount": np.concatenate([
        rng.normal(100, 20, N_LEGIT),
        rng.normal(1000, 100, N_FRAUD),
    ]),
    # Upper bound is exclusive, i.e. ages fall in [30, 1000).
    "account_age_days": rng.integers(30, 1000, size=N_TRANSACTIONS),
    "is_fraud": [0] * N_LEGIT + [1] * N_FRAUD,
})

# --- Completeness ------------------------------------------------------------
# Mean of the per-column non-null fractions, as a percentage. Computed before
# the `anomaly` column is added so only the input columns are measured.
completeness = data.notnull().mean().mean() * 100

# --- Anomaly detection -------------------------------------------------------
# Contamination is set to the known fraud share of the synthetic data (0.02).
model = IsolationForest(contamination=N_FRAUD / N_TRANSACTIONS, random_state=SEED)

# fit_predict returns +1 for inliers and -1 for outliers; store the result
# once, already converted to the same 0/1 encoding as `is_fraud`.
raw_labels = model.fit_predict(data[["amount", "account_age_days"]])
data["anomaly"] = (raw_labels == -1).astype(int)

# --- SLA evaluation ----------------------------------------------------------
# Percentage of rows where the flag matches the label.
# NOTE: with 980 of 1000 rows labelled 0, flagging nothing would already score
# 98%, so the 99% threshold leaves little headroom above that baseline.
accuracy = (data["anomaly"] == data["is_fraud"]).mean() * 100

# Cast to plain bool so the displayed tuple reads (True, True) rather than
# numpy boolean reprs.
completeness_pass = bool(completeness >= completeness_sla)
accuracy_pass = bool(accuracy >= accuracy_sla)

(completeness_pass, accuracy_pass)


(True, True)