# 02 — Analysis using AHS data

Load analysis-ready AHS data and run the **shared econometric pipeline** from `scripts/core_metrics.py` (OLS, HC3, WLS, log-level, diagnostics). No SFA; drivers/barriers only.

In [None]:
import os
import sys
import pandas as pd

# Resolve the repository root: when the working directory is the "notebooks"
# folder the root is its parent; otherwise the working directory itself is used.
_cwd = os.getcwd()
REPO_ROOT = os.path.dirname(_cwd) if os.path.basename(_cwd) == "notebooks" else _cwd

# Make scripts/ importable so core_metrics resolves. The membership check keeps
# sys.path from accumulating duplicate entries when this cell is re-run.
_scripts_dir = os.path.join(REPO_ROOT, "scripts")
if _scripts_dir not in sys.path:
    sys.path.insert(0, _scripts_dir)
from core_metrics import run_ols_pipeline, interpret_effect

# Location of the analysis-ready CSV under data/processed.
DATA_PROCESSED = os.path.join(REPO_ROOT, "data", "processed")
path_ahs = os.path.join(DATA_PROCESSED, "ahs_analysis_ready.csv")
if not os.path.isfile(path_ahs):
    # REPO_ROOT is derived from the working directory, so report the exact path
    # that was checked; a wrong launch directory is then easy to spot.
    raise FileNotFoundError(
        "Run 01_ingestion_AHS.ipynb first and save ahs_analysis_ready.csv "
        f"(expected at: {path_ahs})"
    )
df = pd.read_csv(path_ahs)
print("Loaded:", df.shape)

In [None]:
# Pass "_total_hh" as the weight column only when the loaded frame has it;
# otherwise hand the pipeline None.
weight_column = None
if "_total_hh" in df.columns:
    weight_column = "_total_hh"

results = run_ols_pipeline(df, target_col="Multigen_Rate", weight_col=weight_column)

# Report fit quality and sample size from the "ols_robust" result.
robust_fit = results["ols_robust"]
print("OLS (HC3) R²:", robust_fit.rsquared)
print("N:", int(robust_fit.nobs))

In [None]:
# Display the first 15 rows of the coefficient table, limited to the label,
# robust coefficient, robust SE, robust p-value and significance columns.
coef_columns = ["Label", "Robust_Coef", "Robust_SE", "Robust_pval", "Significance"]
results["coef_table"][coef_columns].head(15)

In [None]:
# Display the first 10 rows of the beta table, limited to the label,
# beta coefficient, p-value and significance columns.
beta_columns = ["Label", "Beta_Coef", "Beta_pval", "Significance"]
results["beta_table"][beta_columns].head(10)