# Notebook 31 - Annotated Methodology Table
This notebook builds a structured overview of the key notebooks in the pipeline, listing each step's inputs, outputs, method type, and purpose, and exports it as CSV and LaTeX for the thesis documentation.

In [1]:
import pandas as pd
import os

# Output folder
output_folder = "thesis_outputs"
os.makedirs(output_folder, exist_ok=True)

# Define pipeline steps manually
pipeline_steps = [
    {"notebook": "01_preview_data", "step": "Preview Raw Files", "inputs": "Raw Excel Snapshots", "outputs": "Preview summary", "method": "Manual Inspection", "purpose": "Understand data layout and headers"},
    {"notebook": "02_standardize_columns", "step": "Clean Headers", "inputs": "All raw files", "outputs": "Clean CSVs", "method": "Column renaming", "purpose": "Standardize tables for downstream use"},
    {"notebook": "03_merge_metadata", "step": "Merge Product Info", "inputs": "Clean CSVs", "outputs": "Merged product table", "method": "Joins", "purpose": "Enrich sales/waste with categories"},
    {"notebook": "04_prepare_semantic_matching", "step": "Text Normalization", "inputs": "Product + Recipe names", "outputs": "Embeddings", "method": "Sentence-BERT", "purpose": "Enable semantic comparison"},
    {"notebook": "05_evaluate_matching_methods", "step": "Match Evaluation", "inputs": "Recipe-product pairs", "outputs": "Precision scores", "method": "Exact, Fuzzy, Semantic", "purpose": "Compare match strategies"},
    {"notebook": "06_ontology_alignment", "step": "Concept Mapping", "inputs": "Ingredients + Products", "outputs": "Ontology tags", "method": "Manual rules + embeddings", "purpose": "Align to shared food taxonomy"},
    {"notebook": "07_to_10", "step": "Store-Level Meal Box Planning", "inputs": "Products + recipes + store data", "outputs": "Meal box plan", "method": "Matching + prioritization", "purpose": "Prepare deployment strategy"},
    {"notebook": "14_to_24", "step": "Waste Reduction Simulation", "inputs": "Meal plans + waste logs", "outputs": "KPIs per strategy", "method": "Concept join + simulation", "purpose": "Quantify avoided waste"},
    {"notebook": "27", "step": "Deployment Summary", "inputs": "Ranked plan + inventories", "outputs": "Per-store summaries", "method": "Join + export", "purpose": "Enable operational deployment"},
    {"notebook": "28_to_30", "step": "Appendix and Reporting Tables", "inputs": "Final results", "outputs": "CSV + LaTeX + PNGs", "method": "Export formatting", "purpose": "Support thesis transparency"}
]

df_pipeline = pd.DataFrame(pipeline_steps)
df_pipeline.to_csv(os.path.join(output_folder, "annotated_methodology_table.csv"), index=False)
df_pipeline.to_latex(os.path.join(output_folder, "annotated_methodology_table.tex"), index=False, escape=False)

print("Saved annotated methodology table to:", output_folder)
df_pipeline


Saved annotated methodology table to: thesis_outputs


Unnamed: 0,notebook,step,inputs,outputs,method,purpose
0,01_preview_data,Preview Raw Files,Raw Excel Snapshots,Preview summary,Manual Inspection,Understand data layout and headers
1,02_standardize_columns,Clean Headers,All raw files,Clean CSVs,Column renaming,Standardize tables for downstream use
2,03_merge_metadata,Merge Product Info,Clean CSVs,Merged product table,Joins,Enrich sales/waste with categories
3,04_prepare_semantic_matching,Text Normalization,Product + Recipe names,Embeddings,Sentence-BERT,Enable semantic comparison
4,05_evaluate_matching_methods,Match Evaluation,Recipe-product pairs,Precision scores,"Exact, Fuzzy, Semantic",Compare match strategies
5,06_ontology_alignment,Concept Mapping,Ingredients + Products,Ontology tags,Manual rules + embeddings,Align to shared food taxonomy
6,07_to_10,Store-Level Meal Box Planning,Products + recipes + store data,Meal box plan,Matching + prioritization,Prepare deployment strategy
7,14_to_24,Waste Reduction Simulation,Meal plans + waste logs,KPIs per strategy,Concept join + simulation,Quantify avoided waste
8,27,Deployment Summary,Ranked plan + inventories,Per-store summaries,Join + export,Enable operational deployment
9,28_to_30,Appendix and Reporting Tables,Final results,CSV + LaTeX + PNGs,Export formatting,Support thesis transparency
