Chi-Square Test of Independence

In [3]:
import numpy as np
import scipy.stats as stats
import pandas as pd

# --- Hypotheses --------------------------------------------------------------
# Null (H0):        smart home device type and customer satisfaction are
#                   not associated.
# Alternative (H1): smart home device type and customer satisfaction are
#                   associated.

# --- Observed counts ---------------------------------------------------------
# One row per satisfaction level, one column per device type.
labels = [
    'Very Satisfied',
    'Satisfied',
    'Neutral',
    'Unsatisfied',
    'Very Unsatisfied',
]
devices = ['Smart Thermostat', 'Smart Light']
data = np.array([
    [50, 70],
    [80, 100],
    [60, 90],
    [30, 50],
    [20, 50],
])

df = pd.DataFrame(data, index=labels, columns=devices)
print("Contingency Table:\n", df)

# --- Test statistic ----------------------------------------------------------
# The result unpacks as (statistic, p-value, degrees of freedom, expected counts).
test_result = stats.chi2_contingency(df)
chi2_stat, p_value, dof, expected = test_result

# Re-label the expected counts so they print in the same layout as the
# observed table.
expected_df = pd.DataFrame(expected, index=labels, columns=devices)

print(f"Chi-Square Statistic: {chi2_stat}")
print(f"P-value: {p_value}")
print(f"Degrees of Freedom: {dof}")
print("Expected Frequencies:\n", expected_df)

# --- Critical value ----------------------------------------------------------
# Upper-tail cutoff of the chi-square distribution at significance level alpha.
alpha = 0.05
upper_quantile = 1 - alpha
critical_value = stats.chi2.ppf(upper_quantile, dof)
print(f"Critical Value at alpha=0.05: {critical_value}")

# --- Decision ----------------------------------------------------------------
# H0 is rejected only when the statistic lies strictly above the critical value.
reject_null = chi2_stat > critical_value
verdict = (
    "Reject the null hypothesis: There is a significant association between device type and satisfaction."
    if reject_null
    else "Fail to reject the null hypothesis: No significant association between device type and satisfaction."
)
print(verdict)


Contingency Table:
                   Smart Thermostat  Smart Light
Very Satisfied                  50           70
Satisfied                       80          100
Neutral                         60           90
Unsatisfied                     30           50
Very Unsatisfied                20           50
Chi-Square Statistic: 5.638227513227513
P-value: 0.22784371130697179
Degrees of Freedom: 4
Expected Frequencies:
                   Smart Thermostat  Smart Light
Very Satisfied                48.0         72.0
Satisfied                     72.0        108.0
Neutral                       60.0         90.0
Unsatisfied                   32.0         48.0
Very Unsatisfied              28.0         42.0
Critical Value at alpha=0.05: 9.487729036781154
Fail to reject the null hypothesis: No significant association between device type and satisfaction.


# Hypothesis Testing