# AI Governance Experiment Report

This notebook provides a standardized way to visualize and analyze the results of AI governance experiments conducted using the ACGS scaffold.

In [None]:
import json

import matplotlib.pyplot as plt
import seaborn as sns

from src.evaluators.metrics import GovernanceEvaluator

# Load the raw experiment logs. The path is relative, so it resolves against
# the kernel's working directory. The encoding is pinned to UTF-8 (the standard
# JSON interchange encoding) so the read does not depend on the platform's
# locale default.
with open("../reports/baseline_results.json", "r", encoding="utf-8") as f:
    logs = json.load(f)

# Wrap the logs in the project's evaluator and compute the summary metrics;
# later cells read `evaluator.df` and `metrics["audit_latency"]`.
evaluator = GovernanceEvaluator(logs)
metrics = evaluator.calculate_metrics()

## 1. Governance Effectiveness (Blocked Rate vs False Positive Rate)

In [None]:
# Bar chart of row counts: one group per `type` value, split by `action`.
df = evaluator.df
fig, ax = plt.subplots(figsize=(10, 6))
sns.countplot(data=df, x="type", hue="action", ax=ax)
ax.set_title("Action Distribution by Task Type")
plt.show()

## 2. Decision Latency Analysis

In [None]:
# Histogram (with KDE overlay) of the `latency_ms` column, annotated with the
# p50/p95/p99 values read from the precomputed metrics.
fig, ax = plt.subplots(figsize=(10, 6))
sns.histplot(df["latency_ms"], kde=True, ax=ax)
# Each percentile key doubles as its legend label.
for pct, line_color in (("p50", "blue"), ("p95", "orange"), ("p99", "red")):
    ax.axvline(
        metrics["audit_latency"][pct],
        color=line_color,
        linestyle="--",
        label=pct,
    )
ax.set_title("Decision Latency Distribution (ms)")
ax.legend()
plt.show()

## 3. Statistical Significance and Power Analysis
**TODO:** This section is not yet implemented; it will use SciPy for rigorous hypothesis testing.