In [1]:
import random
from datetime import datetime, timedelta
from pathlib import Path

import numpy as np
import pandas as pd

# === 1) Folder path where you want to save ===
# Destination directory for every CSV file written by the sections below.
# Edit this value to match your own machine before running the script.
folder = "/Users/chriswinge/desktop/Job Projects/Sierra Nevada"  # <<-- change to your folder

def random_dates(start, end, n=10):
    """Draw ``n`` random timestamps, at one-second resolution, from ``[start, end)``.

    Args:
        start: Inclusive lower bound. Anything ``pd.Timestamp`` accepts
            (a ``pd.Timestamp``, a ``datetime`` or an ISO date string).
        end: Exclusive upper bound, same accepted types as ``start``.
        n: Number of timestamps to draw.

    Returns:
        A ``pd.DatetimeIndex`` holding ``n`` values.

    Raises:
        ValueError: Raised by ``np.random.randint`` when ``start`` is not
            at least one whole second before ``end``.
    """
    # Timestamp.value is nanoseconds since the epoch; reduce to whole seconds.
    start_s = pd.Timestamp(start).value // 10**9
    end_s = pd.Timestamp(end).value // 10**9
    # Ask for int64 explicitly: the platform default integer can be 32-bit,
    # which cannot represent epoch seconds after January 2038.
    seconds = np.random.randint(start_s, end_s, size=n, dtype=np.int64)
    return pd.to_datetime(seconds, unit="s")

# === 2) sales_scan_data.csv ===
# 200 mock scan rows. `markets`, `brands` and `packages` are defined here and
# reused by the sections that follow.
dates = pd.date_range("2024-01-01", "2024-12-31", freq="W")
markets = ["CA", "PA", "TX", "CO", "NC"]
brands = ["Sierra Nevada Pale Ale", "Sierra Nevada Hazy IPA", "Sierra Nevada Torpedo", "Competitor IPA", "Competitor Lager"]
packages = ["6pk Cans", "12pk Bottles", "Single Draft"]

sales_scan_data = pd.DataFrame({
    "Date": np.random.choice(dates, 200),
    "Account": np.random.choice(["Safeway", "Whole Foods", "Kroger", "Publix", "Costco"], 200),
    "Market": np.random.choice(markets, 200),
    "Brand": np.random.choice(brands, 200),
    "Package": np.random.choice(packages, 200),
    "Units_Sold": np.random.randint(20, 500, 200),
    "Dollars_Sold": np.random.uniform(200, 5000, 200).round(2),
    "Promoted": np.random.choice(["Y", "N"], 200, p=[0.3, 0.7])
})
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
sales_scan_data.to_csv(Path(folder) / "sales_scan_data.csv", index=False)

# === 3) consumer_insights_survey.csv ===
# 100 mock survey respondents, one row each.
consumer_insights = pd.DataFrame({
    "Respondent_ID": range(1, 101),
    "Age": np.random.randint(21, 65, 100),
    "Gender": np.random.choice(["Male", "Female", "Non-Binary"], 100),
    "Market": np.random.choice(markets, 100),
    "Favorite_Brand": np.random.choice(brands, 100),
    "Purchase_Frequency": np.random.choice(["Weekly", "Monthly", "Occasionally"], 100),
    "Occasion": np.random.choice(["At-Home", "Bar", "Event"], 100),
    "Sustainability_Importance": np.random.randint(1, 6, 100)  # Likert 1-5
})
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
consumer_insights.to_csv(Path(folder) / "consumer_insights_survey.csv", index=False)

# === 4) pricing_comparison.csv ===
# 50 mock price points per market / brand / package combination.
pricing = pd.DataFrame({
    "Market": np.random.choice(markets, 50),
    "Brand": np.random.choice(brands, 50),
    "Package": np.random.choice(packages, 50),
    "Price_Per_Unit": np.random.uniform(1.0, 3.5, 50).round(2),
    "Promotion_Discount (%)": np.random.choice([0, 5, 10, 15, 20], 50),
})
# Derive the flag from the brand name instead of drawing it independently,
# so a Sierra Nevada brand is never labelled as a competitor (or vice versa).
pricing["Competitor"] = np.where(pricing["Brand"].str.startswith("Competitor"), "Y", "N")
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
pricing.to_csv(Path(folder) / "pricing_comparison.csv", index=False)

# === 5) planogram_data.csv ===
# 50 mock shelf-layout rows.
planogram = pd.DataFrame({
    "Account": np.random.choice(["Safeway", "Whole Foods", "Kroger", "Publix", "Costco"], 50),
    "Market": np.random.choice(markets, 50),
    "Shelf_Space_Linear_Feet": np.random.uniform(2, 20, 50).round(1),
    "Brand": np.random.choice(brands, 50),
    "Package": np.random.choice(packages, 50),
    "Facings": np.random.randint(1, 10, 50),
    "Sales_Per_Facing": np.random.uniform(50, 500, 50).round(2)
})
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
planogram.to_csv(Path(folder) / "planogram_data.csv", index=False)

# === 6) distribution_data.csv ===
# 50 mock authorization / on-shelf status rows.
distribution = pd.DataFrame({
    "Market": np.random.choice(markets, 50),
    "Account": np.random.choice(["Safeway", "Whole Foods", "Kroger", "Publix", "Costco"], 50),
    "Brand": np.random.choice(brands, 50),
    "Package": np.random.choice(packages, 50),
    "Authorized": np.random.choice(["Y", "N"], 50, p=[0.9, 0.1]),
    "On_Shelf": np.random.choice(["Y", "N"], 50, p=[0.85, 0.15]),
    "Out_Of_Stock_Days": np.random.randint(0, 15, 50)
})
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
distribution.to_csv(Path(folder) / "distribution_data.csv", index=False)

# === 7) promotion_results.csv ===
# 40 mock promotions; start dates step by 7 days and each end date is the
# start date plus 7 days.
promotion = pd.DataFrame({
    "Market": np.random.choice(markets, 40),
    "Account": np.random.choice(["Safeway", "Whole Foods", "Kroger", "Publix", "Costco"], 40),
    "Brand": np.random.choice(brands, 40),
    "Promotion_Type": np.random.choice(["Display", "Price Cut", "BOGO", "Digital Ad"], 40),
    "Start_Date": pd.date_range("2024-01-01", periods=40, freq="7D"),
    "End_Date": pd.date_range("2024-01-08", periods=40, freq="7D"),
    "Incremental_Units": np.random.randint(50, 1000, 40),
    "ROI": np.random.uniform(0.5, 5.0, 40).round(2)
})
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
promotion.to_csv(Path(folder) / "promotion_results.csv", index=False)

# === 8) market_trends.csv ===
# 30 mock category-trend rows; year, quarter, market and category are drawn
# independently, so combinations may repeat.
market_trends = pd.DataFrame({
    "Year": np.random.choice([2022, 2023, 2024], 30),
    "Quarter": np.random.choice([1, 2, 3, 4], 30),
    "Market": np.random.choice(markets, 30),
    "Category": np.random.choice(["IPA", "Lager", "Non-Alcoholic", "Flavored Beer"], 30),
    "Growth_Rate (%)": np.random.uniform(-5, 15, 30).round(2),
    "SNBC_Share (%)": np.random.uniform(2, 15, 30).round(2),
    "Competitor_Share (%)": np.random.uniform(2, 15, 30).round(2)
})
# Join with pathlib rather than `+`: `folder` has no trailing separator, so
# string concatenation would fuse the directory name and the file name.
market_trends.to_csv(Path(folder) / "market_trends.csv", index=False)

print("✅ Mock Sierra Nevada datasets created and saved!")


✅ Mock Sierra Nevada datasets created and saved!
