# FZ8 PREP (2020 - 2022)

In [1]:
"""
Convert every sheet of the legacy workbook `_fz8_pdf_2020-2022.xlsx`
into a header-less CSV file.

Context
-------
The 2020-2022 data were delivered as a single “PDF-layout” Excel file.
Here we do **no parsing** – we simply dump raw cell values so that they
can later be merged with the 2023-2025 data (which *are* parsed).

Output location
---------------
../data/raw/fz8/csv/fz_8.<N>_2020-2022_raw.csv
where <N> is the sheet number (1 … 16).

All cells are stored as text (`dtype=str`); the CSV has **no header**.
"""

# paths
from pathlib import Path
import pandas as pd
from openpyxl import load_workbook

DATA_DIR = Path("../data/raw/fz8")
XLSX     = DATA_DIR / "_fz8_pdf_2020-2022.xlsx"

# extract
# openpyxl is used only to list the sheet names.  A read-only workbook keeps
# its file handle open until close() is called, so release it as soon as the
# names have been collected (even if reading them fails).
wb = load_workbook(XLSX, read_only=True)
try:
    sheet_names = list(wb.sheetnames)
finally:
    wb.close()

# Make sure the target folder exists so to_csv does not fail on a fresh
# checkout where ../data/raw/fz8/csv has not been created yet.
out_dir = DATA_DIR / "csv"
out_dir.mkdir(parents=True, exist_ok=True)

# Open the workbook once for pandas and reuse it for every sheet instead of
# re-opening the file per iteration; the context manager closes it on exit.
with pd.ExcelFile(XLSX) as xls:
    for sheet in sheet_names:
        # Raw dump: every cell as text, no header row interpreted.
        df = pd.read_excel(xls, sheet_name=sheet, dtype=str, header=None)

        # Sheet name looks like “8.2 DONE” → take “8.2” part, then keep the
        # digits after the dot as the table number used in the file name.
        number = sheet.split()[0]
        csv_name = f"fz_8.{number.split('.')[1]}_2020-2022_raw.csv"

        out_path = out_dir / csv_name
        df.to_csv(out_path, index=False, header=False)
        print(f"✓ {out_path.name}  ←  sheet «{sheet}»")

print("\nReady.")

✓ fz_8.2_2020-2022_raw.csv  ←  sheet «8.2 DONE»
✓ fz_8.3_2020-2022_raw.csv  ←  sheet «8.3 DONE»
✓ fz_8.6_2020-2022_raw.csv  ←  sheet «8.6 DONE»
✓ fz_8.7_2020-2022_raw.csv  ←  sheet «8.7 DONE»
✓ fz_8.8_2020-2022_raw.csv  ←  sheet «8.8 DONE»
✓ fz_8.9_2020-2022_raw.csv  ←  sheet «8.9 DONE»
✓ fz_8.16_2020-2022_raw.csv  ←  sheet «8.16 DONE»

Ready.
