In [None]:
import sys
from pathlib import Path

# Resolve the project root. This assumes the kernel's working directory is the
# notebook's own folder (analysis/), so the root is that folder's parent.
PROJECT_ROOT = Path.cwd().resolve().parent

# Make the project root importable. The guard keeps the cell idempotent:
# re-running it no longer prepends a duplicate entry each time, while still
# guaranteeing that the root is the first entry on sys.path.
if sys.path[:1] != [str(PROJECT_ROOT)]:
    sys.path.insert(0, str(PROJECT_ROOT))

In [None]:
from scripts.analyse_results import (
    analyse_results,
    describe_recommendation,
    describe_k_breakdown,
    describe_track_breakdown,
)

# Location of the experiment results table consumed by the analysis below.
RESULTS_CSV = f"{PROJECT_ROOT}/outputs/experiments/mut_vs_dnase_full_1/results.csv"

# Step 1 - run the analysis; mode="auto" lets it choose between pearson and rf.
out = analyse_results(
    RESULTS_CSV,
    mode="auto",
    require_mela_top_perm=False,
)

# Step 2 - print the narrative summaries (strings), each followed by a blank
# line except the last one.
print(describe_recommendation(out), end="\n\n")
print(describe_k_breakdown(out), end="\n\n")
print(describe_track_breakdown(out))

# Step 3 - pull the structured pieces out of the result for further exploration.
# Recommended configuration (pandas Series).
best = out["best_overall"]
# Mela win rates by k and mode (DataFrame).
k_summary = out["k_summary"]
# Best configuration for each k (DataFrame).
best_by_k = out["best_by_k_df"]
# Best configuration for each track strategy (DataFrame).
best_by_track = out["best_by_track_df"]
# Best configuration for each (k, track) pair (DataFrame).
best_by_k_track = out["best_by_k_track_df"]


In [None]:
# Re-run the analysis with the winner metric pinned explicitly instead of
# letting mode="auto" decide: first "rf", then "pearson".
# NOTE(review): require_mela_top_perm is not passed here, whereas the auto run
# above passes False, so the callee's default applies - confirm this is intended.
out_rf, out_pearson = (
    analyse_results(RESULTS_CSV, mode=forced_mode)
    for forced_mode in ("rf", "pearson")
)

# Print the narrative recommendation for each forced mode, rf first.
for _forced_out in (out_rf, out_pearson):
    print(describe_recommendation(_forced_out))


In [None]:
# Display the best-per-(k, track) table taken from out["best_by_k_track_df"];
# as the cell's last bare expression it is rendered with the notebook's rich repr.
best_by_k_track