# Week 7 Statistical Business Analysis

This notebook covers all required tasks: descriptive statistics, histograms, density plots, t-tests, correlation, confidence intervals, box plots, violin plots, a correlation heatmap, and a multi-panel subplot figure.

In [None]:
import pandas as pd
import numpy as np

# Seed NumPy's global generator so the synthetic sample is reproducible.
np.random.seed(42)

# Two separate draws of 300 values each. The order (spend first, then
# sales) must be kept, otherwise the seeded values would change.
_spend_draws = np.random.normal(loc=5000, scale=1500, size=300)
_sales_draws = np.random.normal(loc=20000, scale=6000, size=300)

data = pd.DataFrame(
    {
        "Marketing_Spend": _spend_draws,
        "Sales": _sales_draws,
    }
)

# Persist the sample next to the notebook (no index column), then preview it.
data.to_csv("data.csv", index=False)
data.head()

In [None]:
# Descriptive statistics for each column of `data`
# (count, mean, std, min, quartiles, max).
data.describe()

In [None]:
# Pairwise correlation matrix between the columns of `data`
# (pandas uses the Pearson coefficient by default).
data.corr()

In [None]:
from scipy import stats

# Split the sales figures into two groups at the median marketing spend:
# group1 = spend at or above the median, group2 = spend below it.
median_spend = data["Marketing_Spend"].median()
group1 = data.loc[data["Marketing_Spend"].ge(median_spend), "Sales"]
group2 = data.loc[data["Marketing_Spend"].lt(median_spend), "Sales"]

# Independent two-sample t-test on the mean sales of the two groups
# (SciPy's default assumes equal variances).
stats.ttest_ind(group1, group2)

In [None]:
# Point estimate and standard error of the mean for the Sales column.
sales_mean, sales_sem = data["Sales"].mean(), stats.sem(data["Sales"])

# 95% t-based confidence interval for the mean, with n - 1 degrees of freedom.
stats.t.interval(0.95, len(data) - 1, loc=sales_mean, scale=sales_sem)

In [None]:
import matplotlib.pyplot as plt

# Draw the Sales histogram on the current Axes (created on demand).
ax = plt.gca()
ax.hist(data["Sales"])
ax.set_title("Sales Histogram")
plt.show()

In [None]:
# Kernel density estimate of the Sales column.
data["Sales"].plot.density(title="Sales Density")
plt.show()

In [None]:
# Side-by-side box plots of marketing spend and sales.
# The `labels=` keyword of boxplot is deprecated since Matplotlib 3.9
# (renamed to `tick_labels`), so the tick labels are set explicitly instead;
# this works on both old and new Matplotlib versions. Boxes are drawn at
# x positions 1..N by default.
plt.boxplot([data["Marketing_Spend"], data["Sales"]])
plt.xticks([1, 2], ["Marketing Spend", "Sales"])
plt.title("Box Plot")
plt.show()

In [None]:
# Side-by-side violin plots of marketing spend and sales.
# Violins are drawn at x positions 1..N by default; label them so the
# reader can tell which distribution is which.
plt.violinplot([data["Marketing_Spend"], data["Sales"]])
plt.xticks([1, 2], ["Marketing Spend", "Sales"])
plt.title("Violin Plot")
plt.show()

In [None]:
import matplotlib.pyplot as plt
# Heatmap of the pairwise correlation matrix.
# The matrix is computed once and its column/index names are used as tick
# labels; without them the axes only show the raw positions 0, 1, ...
corr = data.corr()
plt.imshow(corr)
plt.colorbar()
plt.xticks(range(len(corr.columns)), corr.columns)
plt.yticks(range(len(corr.index)), corr.index)
plt.title("Heatmap")
plt.show()

In [None]:
# 2x2 overview figure: histogram, line plot, scatter plot and box plot.
fig, axs = plt.subplots(nrows=2, ncols=2, figsize=(10, 8))
(hist_ax, line_ax), (scatter_ax, box_ax) = axs

# Top-left: distribution of Sales.
hist_ax.hist(data["Sales"])
hist_ax.set_title("Histogram")

# Top-right: Sales plotted against the row index.
line_ax.plot(data["Sales"])
line_ax.set_title("Line Plot")

# Bottom-left: Sales versus Marketing_Spend.
scatter_ax.scatter(data["Marketing_Spend"], data["Sales"])
scatter_ax.set_title("Scatter")

# Bottom-right: box plot of Sales.
box_ax.boxplot(data["Sales"])
box_ax.set_title("Box")

# Adjust spacing so titles and tick labels do not overlap, then render.
plt.tight_layout()
plt.show()