# In [None]:
from pathlib import Path
import pandas as pd
import kagglehub

# Dataset handle passed to kagglehub.dataset_download() in main().
DATASET = "rohitgrewal/global-superstore-data"

def main() -> None:
    """Download the dataset and export every workbook sheet to its own CSV.

    Steps:
      1. Download ``DATASET`` via ``kagglehub`` and list the top-level files.
      2. Locate an ``.xlsx`` workbook anywhere under the download directory.
      3. Read every sheet and write ``data/raw/<sheet name>.csv`` (relative
         to the current working directory), without the index column.
      4. Print the list of CSV files that were actually written.

    Raises:
        FileNotFoundError: If no ``.xlsx`` file exists under the download
            directory.
    """
    path = kagglehub.dataset_download(DATASET)
    data_path = Path(path)

    print(f"Downloaded to: {data_path}")
    print("Files:")
    for p in data_path.iterdir():
        print(" -", p.name)

    # rglob yields entries in filesystem-dependent order; sorting makes the
    # choice of workbook reproducible when more than one .xlsx is present.
    excel_files = sorted(data_path.rglob("*.xlsx"))
    if not excel_files:
        raise FileNotFoundError(f"No .xlsx file found in {data_path}")

    excel_file = excel_files[0]
    print(f"Using Excel file: {excel_file}")

    # sheet_name=None makes pandas return a {sheet name: DataFrame} mapping
    # covering every sheet in the workbook.
    sheets = pd.read_excel(excel_file, sheet_name=None, engine="openpyxl")

    out_dir = Path("data/raw")
    out_dir.mkdir(parents=True, exist_ok=True)

    saved_paths = []
    for sheet_name, df in sheets.items():
        csv_path = out_dir / f"{sheet_name}.csv"
        df.to_csv(csv_path, index=False)
        print(f"Saved: {csv_path}")
        saved_paths.append(csv_path)

    # Report the files that were really written instead of a fixed list, so
    # the instructions stay correct if the workbook's sheets differ.
    print("\nDone. Now upload the CSVs to SQLite Online:")
    for csv_path in saved_paths:
        # as_posix() keeps the forward-slash form on every platform.
        print(f" - {csv_path.as_posix()}")

# Run the download/export only when executed as a script, not on import.
if __name__ == "__main__":
    main()

