In [5]:
# Import necessary libraries
import pandas as pd
from scipy.stats import chi2_contingency, chi2

# Step 1: Define the observed counts as a contingency table.
# Rows are satisfaction levels, columns are device types.
data = pd.DataFrame(
    {
        'Smart Thermostat': [50, 80, 60, 30, 20],
        'Smart Light': [70, 100, 90, 50, 50],
    },
    index=['Very Satisfied', 'Satisfied', 'Neutral', 'Unsatisfied', 'Very Unsatisfied'],
)

# Step 2: State the hypotheses.
# Null Hypothesis (H0): There is no association between the type of device and customer satisfaction.
# Alternative Hypothesis (H1): There is an association between the type of device and customer satisfaction.

# Step 3: Perform the chi-square test of independence.
# chi2_contingency returns the test statistic, the p-value, the degrees of
# freedom and the table of expected frequencies under H0.
# NOTE: per the SciPy documentation, the Yates continuity correction is only
# applied when dof == 1, so it does not affect this 5x2 table (dof == 4).
chi2_stat, p_value, dof, expected = chi2_contingency(data)

# Step 4: Define the significance level and the matching critical value
# (the upper (1 - alpha) quantile of the chi-square distribution with `dof`
# degrees of freedom).
alpha = 0.05
critical_value = chi2.ppf(1 - alpha, dof)

# Step 5: Decide by comparing the statistic against the critical value.
if chi2_stat > critical_value:
    conclusion = "Reject the null hypothesis: There is a significant association between device type and satisfaction level."
else:
    conclusion = "Fail to reject the null hypothesis: No significant association between device type and satisfaction level."

# Step 6: Print the results.
# The critical-value label is built from `alpha` so the report can never
# disagree with the significance level actually used in Step 4.
separator = "--------------------------------------------------------------------------"
critical_label = f"Critical Value (at alpha = {alpha}):"

print("Chi-Square Test Analysis for Association between Device Type and Customer Satisfaction")
print(separator)
print("Chi-Square Statistic:", chi2_stat)
print("P-value:", p_value)
print("Degrees of Freedom:", dof)
print(critical_label, critical_value)
print("Conclusion:", conclusion)
print(separator)

# Additional information for the report: the expected frequency of each cell
# under H0, relabelled with the same rows/columns as the observed table.
print("\nExpected Frequencies Table:")
print(pd.DataFrame(expected, index=data.index, columns=data.columns))


Chi-Square Test Analysis for Association between Device Type and Customer Satisfaction
--------------------------------------------------------------------------
Chi-Square Statistic: 5.638227513227513
P-value: 0.22784371130697179
Degrees of Freedom: 4
Critical Value (at alpha = 0.05): 9.487729036781154
Conclusion: Fail to reject the null hypothesis: No significant association between device type and satisfaction level.
--------------------------------------------------------------------------

Expected Frequencies Table:
                  Smart Thermostat  Smart Light
Very Satisfied                48.0         72.0
Satisfied                     72.0        108.0
Neutral                       60.0         90.0
Unsatisfied                   32.0         48.0
Very Unsatisfied              28.0         42.0
