Mizzare Corporation has collected data on customer satisfaction levels for two types of smart home devices: Smart Thermostats and Smart Lights. They want to determine if there's a significant association between the type of device purchased and the customer's satisfaction level.

In [1]:
import numpy as np
import pandas as pd
import scipy.stats as stats

In [2]:
## Hypothesis statement
## H0: There is no association between the type of device purchased and the customer's satisfaction level.
## H1: There is an association between the type of device purchased and the customer's satisfaction level.

In [3]:
# Observed contingency table of customer counts (5 rows x 2 columns).
# NOTE(review): presumably each row is a satisfaction level and the two
# columns are the device types (Smart Thermostat, Smart Light) — confirm
# the row/column order against the data source.
observed = np.array(
    [
        [50, 70],
        [80, 100],
        [60, 90],
        [30, 50],
        [20, 50],
    ]
)

In [4]:
# Marginal totals of the observed table: one sum per row (axis=1),
# one sum per column (axis=0), and the sum over every cell.
row_totals = np.sum(observed, axis=1)
col_totals = np.sum(observed, axis=0)
grand_total = np.sum(observed)

In [5]:
# Expected count for each cell if the two variables were independent:
# (row total * column total) / grand total.
expected = np.multiply.outer(row_totals, col_totals) / grand_total

In [6]:
# Pearson chi-square statistic: sum over all cells of
# (observed - expected)^2 / expected.
chi_square_statistic = np.sum(np.square(observed - expected) / expected)

In [7]:
# Degrees of freedom for the test: (number of rows - 1) * (number of columns - 1).
# Note: `df` here is the degrees of freedom, not a pandas DataFrame.
df = (len(observed) - 1) * (len(observed[0]) - 1)

In [8]:
# Significance level for the test.
alpha = 0.05
# Critical value: the (1 - alpha) quantile of the chi-square distribution
# with `df` degrees of freedom.
critical_value = stats.chi2.ppf(1 - alpha, df=df)

In [9]:
# P-value: probability of a chi-square value at least as large as the
# observed statistic under `df` degrees of freedom.
# Use the survival function (sf = 1 - cdf, computed directly) instead of
# `1 - cdf(...)`: subtracting from 1 loses precision in the upper tail and
# collapses to exactly 0.0 for large statistics.
p_value = stats.chi2.sf(chi_square_statistic, df)

In [10]:
# Decision rule: reject H0 only when the statistic exceeds the critical value.
conclusion = (
    "Reject the null hypothesis: There is a significant association between device type and customer satisfaction."
    if chi_square_statistic > critical_value
    else "Fail to reject the null hypothesis: There is no significant association between device type and customer satisfaction."
)


In [11]:
# Report the test summary, one item per line.
print(
    f"Chi-Square Statistic: {chi_square_statistic:.2f}",
    f"Critical Value: {critical_value:.2f}",
    f"P-value: {p_value:.4f}",
    f"Conclusion: {conclusion}",
    sep="\n",
)

Chi-Square Statistic: 5.64
Critical Value: 9.49
P-value: 0.2278
Conclusion: Fail to reject the null hypothesis: There is no significant association between device type and customer satisfaction.
