# IHDP Dataset Analysis

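This notebook analyzes the IHDP (Infant Health and Development Program) dataset with causal inference methods: it loads the data, then runs the project's estimation pipeline with the `ipw`, `psm`, `dr`, and `dml` estimators and prints the results.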



In [None]:
# Notebook setup: extend the import path, load the numeric stack, silence
# warnings, and fix the random seed.
#
# '..' is appended so that modules in the parent directory can be imported
# (presumably the project's `src` package — TODO confirm). A relative entry
# is resolved against the current working directory, so this assumes the
# notebook is launched from its own folder.
import sys
sys.path.append('..')

import numpy as np
import pandas as pd
from pathlib import Path
import warnings
# Suppress every warning for the rest of the session to keep cell output
# compact. NOTE(review): this is a blanket filter, so warnings that signal
# real problems are hidden as well.
warnings.filterwarnings('ignore')

# Seed NumPy's global random number generator. The value is kept in a named
# constant so the same seed can be handed to other code that accepts one.
RANDOM_SEED = 42
np.random.seed(RANDOM_SEED)


In [None]:
from src.data_loader import download_ihdp
from src.dowhy_pipeline import run_full_pipeline

# Obtain the IHDP file via the project's loader; whatever download_ihdp()
# returns is handed directly to pandas as the CSV location.
data_path = download_ihdp()
data = pd.read_csv(data_path)

# Quick sanity check: report the size of the loaded table.
n_rows, n_cols = data.shape
print(f"Loaded {n_rows} rows, {n_cols} columns")


In [None]:
# Run the full estimation pipeline on IHDP.
# Note: the pipeline is given the dataset *name*; the `data` frame loaded
# earlier in the notebook is not passed to it.
estimator_names = ["ipw", "psm", "dr", "dml"]
results_dir = Path("../results")

results = run_full_pipeline(
    dataset_name="ihdp",
    estimators=estimator_names,
    output_dir=results_dir,
    random_state=RANDOM_SEED,
)

# Show the complete results without pandas' display truncation.
print("\nResults:")
print(results.to_string())
