In [7]:
import pandas as pd
import numpy as np

In [8]:
# Pin NumPy's global RNG state so every fresh run draws the same simulated values.
SEED = 42
np.random.seed(SEED)

In [9]:
# Simulate the raw daily inputs used to build the sales table.
#
# The random draws below consume NumPy's global RNG in this exact order
# (marketing spend, seasonality, price, competitor sales); reordering them
# changes every generated value for a given seed.
#
# Normal draws are unbounded below, so a few samples would otherwise come out
# negative, which is meaningless for spend, price and sales volumes. Each series
# is floored at zero *after* drawing, so the RNG stream (and every non-negative
# sample) is exactly what the unfloored draw would have produced.
n = 1000  # Number of data points (one per calendar day)
dates = pd.date_range(start="2020-01-01", periods=n, freq="D")  # n consecutive days from 2020-01-01
marketing_spend = np.maximum(np.random.normal(5000, 2000, n), 0.0)  # mean 5000, sd 2000, floored at 0
seasonality = np.random.choice([1, 2, 3, 4], size=n)  # factor in {1, 2, 3, 4}, drawn independently of the date
price = np.maximum(np.random.normal(20, 5, n), 0.0)  # mean 20, sd 5, floored at 0
competitor_sales = np.maximum(np.random.normal(10000, 5000, n), 0.0)  # mean 10000, sd 5000, floored at 0


In [14]:
# Target variable: a fixed-weight linear mix of the four drivers plus Gaussian
# noise (mean 0, sd 500). The result is not clipped.
sales_noise = np.random.normal(0, 500, n)
sales = (
    0.5 * marketing_spend
    + 0.3 * seasonality
    + 0.1 * price
    + 0.1 * competitor_sales
    + sales_noise
)


In [16]:
# Assemble the simulated series into a single table.
# The mapping's insertion order determines the column order of the frame.
column_values = {
    "Date": dates,
    "Marketing Spend": marketing_spend,
    "Seasonality": seasonality,
    "Product Price": price,
    "Competitor Sales": competitor_sales,
    "Sales": sales,
}
data = pd.DataFrame(column_values)

In [18]:
# Preview the first five rows of the assembled table.
data.head(5)


Unnamed: 0,Date,Marketing Spend,Seasonality,Product Price,Competitor Sales,Sales
0,2020-01-01,5993.428306,3,18.173392,9582.810151,4943.983596
1,2020-01-02,4723.471398,4,20.923402,2751.773902,1947.211458
2,2020-01-03,6295.377076,1,13.264369,5390.700934,3941.179689
3,2020-01-04,8046.059713,4,15.14193,4980.21314,5268.321918
4,2020-01-05,4531.693251,3,26.00207,11036.336647,4508.70537


In [22]:
# Write the table to a CSV file in the working directory.
# index=False keeps the row index out of the file.
output_path = "simulated_sales_data.csv"
data.to_csv(output_path, index=False)