In [4]:
import pandas as pd
import os

# 1. Load Data
# Access the 'data' folder in the parent directory
target_path = '../data/cafe_sales_data_en.csv'

try:
    df = pd.read_csv(target_path)
    df['Date'] = pd.to_datetime(df['Date']) # Convert to datetime object
    print(f"‚úÖ Data successfully loaded! Path: {target_path}")
    print(f"Total Records: {len(df):,}")

    # -------------------------------------------------------
    # 2. Validation: Sandwich Launch Effect (Pre vs Post July)
    # -------------------------------------------------------

    # Split data based on launch date (July 1st)
    pre_sandwich = df[df['Date'] < '2023-07-01']
    post_sandwich = df[df['Date'] >= '2023-07-01']

    # Calculate average daily transactions (Customer Traffic)
    avg_pre = pre_sandwich.groupby('Date').size().mean()
    avg_post = post_sandwich.groupby('Date').size().mean()

    print(f"\n[üìä Validation Result: Sandwich Launch Effect]")
    print(f"1. Pre-Launch (Jan-Jun) Avg Traffic: {avg_pre:.1f}")
    print(f"2. Post-Launch (Jul-Dec) Avg Traffic: {avg_post:.1f}")

    # Calculate Growth Rate
    growth_rate = ((avg_post - avg_pre) / avg_pre) * 100
    print(f"3. üìà Growth Rate: {growth_rate:.1f}% (Sandwich Effect + Seasonality)")

    # -------------------------------------------------------
    # 3. Validation: Monthly Sandwich Sales Integrity
    # -------------------------------------------------------
    # Check if sandwich sales are strictly zero before July
    sandwich_counts = df[df['Category'] == 'Sandwich'].groupby(df['Date'].dt.month).size()
    print(f"\n[ü•™ Monthly Sandwich Sales Volume]")
    print(sandwich_counts)

except FileNotFoundError:
    print("‚ùå File not found. Please check the directory structure.")

‚úÖ Data successfully loaded! Path: ../data/cafe_sales_data_en.csv
Total Records: 27,853

[üìä Validation Result: Sandwich Launch Effect]
1. Pre-Launch (Jan-Jun) Avg Traffic: 69.7
2. Post-Launch (Jul-Dec) Avg Traffic: 82.8
3. üìà Growth Rate: 18.7% (Sandwich Effect + Seasonality)

[ü•™ Monthly Sandwich Sales Volume]
Date
7     320
8     300
9     268
10    301
11    300
12    190
dtype: int64
