# Generate baseline dataset (no interventions)

This notebook generates a *synthetic* dataset of **infected vs time** using a simple SIR model with **no interventions**.

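Outputs:
- `data/processed/scenarios/baseline_no_intervention.csv` — the simulated dataset
- `sir_baseline_infected_vs_time.png` — the infected-vs-time plot, saved in the directory returned by `figures_dir(final=True)`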

See `docs/SCENARIO_DATASETS.md` for the full scenario plan.


In [None]:
from pathlib import Path

import matplotlib.pyplot as plt

from epidemiology_project.paths import processed_data_dir, figures_dir
from epidemiology_project.sir import SirParams, simulate_sir


## Parameters


In [None]:
# Run settings, passed to simulate_sir() as `I0` and `days` in the Simulate cell.
I0 = 100    # presumably the initial number of infected individuals; confirm against simulate_sir
days = 200  # presumably the simulation length in days; confirm against simulate_sir

# Model parameters (adjust as desired).
# NOTE(review): N / beta / gamma presumably follow the usual SIR meaning
# (population size, transmission rate, recovery rate); confirm against SirParams.
params = SirParams(
    N=1_000_000,
    beta=0.28,
    gamma=0.10,
)


## Simulate


In [None]:
# Run the simulation for the baseline scenario with the parameters defined above.
df = simulate_sir(
    params=params,
    I0=I0,
    days=days,
    scenario='baseline_no_intervention',
)

# Show the first rows as the cell output (rich display, no print needed).
df.head()


## Save dataset


In [None]:
# Build the full target path first, then derive the directory from it.
out_path = processed_data_dir() / 'scenarios' / 'baseline_no_intervention.csv'
out_dir = out_path.parent

# Make sure the scenarios directory exists; safe to re-run.
out_dir.mkdir(parents=True, exist_ok=True)

# Write the simulated dataset without the index column.
df.to_csv(out_path, index=False)

# Display where the file was written.
out_path


## Plot: infected vs time


In [None]:
# Plot the 'I' column of the simulated dataset against its 'date' column.
fig, ax = plt.subplots(figsize=(10, 4))
ax.plot(df['date'], df['I'], label='Infected (I)')
ax.set_title('Baseline (no interventions): infected vs time')
ax.set_xlabel('Date')
ax.set_ylabel('People infected (model)')
ax.legend()  # the line is labelled above; without a legend that label is never shown
ax.grid(True, alpha=0.3)
fig.tight_layout()

# Save the figure. savefig() does not create missing directories, so make sure
# the target directory exists first (a no-op when it is already there).
fig_path = figures_dir(final=True) / 'sir_baseline_infected_vs_time.png'
fig_path.parent.mkdir(parents=True, exist_ok=True)
fig.savefig(fig_path, dpi=200)

# Display where the figure was written.
fig_path
