In [1]:
import pandas as pd
from scipy import stats

def segment_sales(frame, segment):
    """Return the non-missing 'Sales' values for one customer segment.

    Args:
        frame: DataFrame with a 'Segment' column and a 'Sales' column.
        segment: Value of 'Segment' to select (e.g. 'Consumer').

    Returns:
        The 'Sales' Series of the matching rows with missing values dropped.

    Raises:
        ValueError: If fewer than two non-missing observations remain. A
            t-test on such a group can only yield NaN, which would otherwise
            be silently reported as "no significant difference".
    """
    # Single .loc selection instead of chained indexing (df[mask]['Sales']).
    sales = frame.loc[frame['Segment'] == segment, 'Sales'].dropna()
    if len(sales) < 2:
        raise ValueError(
            f"Need at least 2 non-missing Sales values for segment "
            f"{segment!r}, found {len(sales)}."
        )
    return sales


def conclusion_lines(p_value, alpha=0.05):
    """Return the (conclusion, insight, recommendation) report lines.

    Args:
        p_value: P-value produced by the hypothesis test.
        alpha: Significance level; H0 is rejected when ``p_value < alpha``.

    Returns:
        A tuple of three strings to print, in order.
    """
    # NaN compares False against everything, so without this guard an invalid
    # test result would fall through to the "FAIL TO REJECT" branch.
    if pd.isna(p_value):
        return (
            "Conclusion: INCONCLUSIVE - the test did not produce a valid P-Value.",
            "Insight: The data could not be tested (e.g. zero variance in both segments).",
            "Recommendation: Check the Sales data for each segment before drawing conclusions.",
        )
    if p_value < alpha:
        return (
            "Conclusion: REJECT Null Hypothesis.",
            "Insight: There is a STATISTICALLY SIGNIFICANT difference in spending behavior between Consumer and Corporate segments.",
            "Recommendation: Marketing strategies should be tailored differently for each segment.",
        )
    return (
        "Conclusion: FAIL TO REJECT Null Hypothesis.",
        "Insight: There is NO significant difference in spending behavior between Consumer and Corporate segments.",
        "Recommendation: A unified marketing approach can be used for both segments as their spending patterns are similar.",
    )


# The guard is true both in a notebook cell and when run as a script, so the
# globals below (df, consumer_sales, t_stat, p_value, alpha, ...) are still
# defined for any later cells; it only keeps the helpers importable.
if __name__ == "__main__":
    # 1. Load the cleaned dataset
    # Ensure 'cleaned_data.csv' is in the same directory
    df = pd.read_csv('cleaned_data.csv')

    # 2. Define the Groups for Analysis
    # We are comparing Sales between 'Consumer' and 'Corporate' segments
    consumer_sales = segment_sales(df, 'Consumer')
    corporate_sales = segment_sales(df, 'Corporate')

    # 3. Perform Statistical Hypothesis Testing (T-Test)
    # Null Hypothesis (H0): There is no difference in average sales between the two segments.
    # Alternate Hypothesis (H1): There is a significant difference in average sales.
    # NOTE(review): ttest_ind defaults to equal_var=True (Student's t-test).
    # If the segments' variances or sizes differ a lot, consider
    # equal_var=False (Welch's t-test) - confirm with the analyst.
    t_stat, p_value = stats.ttest_ind(consumer_sales, corporate_sales)

    # 4. Print the Results
    print("---------------------------------------------------")
    print("Statistical Hypothesis Testing Results")
    print("---------------------------------------------------")
    print(f"T-Statistic: {t_stat:.4f}")
    print(f"P-Value:     {p_value:.4f}")
    print("---------------------------------------------------")

    # 5. Business Conclusion based on P-Value
    # We use a significance level (alpha) of 0.05 (5%)
    alpha = 0.05

    for report_line in conclusion_lines(p_value, alpha):
        print(report_line)

---------------------------------------------------
Statistical Hypothesis Testing Results
---------------------------------------------------
T-Statistic: -0.5896
P-Value:     0.5555
---------------------------------------------------
Conclusion: FAIL TO REJECT Null Hypothesis.
Insight: There is NO significant difference in spending behavior between Consumer and Corporate segments.
Recommendation: A unified marketing approach can be used for both segments as their spending patterns are similar.
