In [1]:
import pandas as pd
import scipy.stats as stats
from statsmodels.stats.multicomp import pairwise_tukeyhsd

In [2]:
# Read the exported survey responses (one row per respondent) into a DataFrame
data = pd.read_csv(filepath_or_buffer="results.csv")

In [3]:
# Clean Q4: keep only the respondents who answered Q4, then collect the
# distinct answers, which act as the grouping factor for the tests below.
# NOTE: the trailing space is part of the column header in the CSV.
q4_column = "Which type of scenes held your attention better? "
answered_q4 = data[q4_column].notna()
data = data[answered_q4]
q4_groups = data[q4_column].unique()

In [8]:
def run_anova_test(column_name, df=None,
                   group_column="Which type of scenes held your attention better? ",
                   alpha=0.05):
    """Run a one-way ANOVA on one response column and, if significant, Tukey HSD.

    Rows with a missing group label or a missing response are excluded before
    testing. Without that filter a single NaN makes ``stats.f_oneway`` return
    ``nan`` for both statistics, so the significance check is False and the
    post-hoc test is silently skipped.

    Parameters
    ----------
    column_name : str
        Column holding the numeric response to compare across groups.
    df : pandas.DataFrame, optional
        Frame to analyse. Defaults to the notebook-level ``data`` frame.
    group_column : str, optional
        Column holding the group label. Defaults to the Q4 question (the
        trailing space is part of the column header).
    alpha : float, optional
        Significance level used both to decide whether to run the post-hoc
        test and as the family-wise error rate passed to Tukey HSD.

    Returns
    -------
    None
        Results are printed.

    Raises
    ------
    ValueError
        If fewer than two groups remain after dropping incomplete rows, or if
        a response value cannot be converted to float.
    """
    frame = data if df is None else df

    # Use exactly the same complete rows for the ANOVA and for the post-hoc
    # test so the two analyses cannot disagree about which answers count.
    paired = frame[[group_column, column_name]].dropna()
    scores = paired[column_name].astype(float)
    labels = paired[group_column]

    # sort=False keeps the groups in order of first appearance.
    samples = [values for _, values in scores.groupby(labels, sort=False)]
    if len(samples) < 2:
        raise ValueError(
            f"Need at least two groups with data to run an ANOVA on "
            f"{column_name!r}; found {len(samples)}."
        )

    # One-way ANOVA
    f_stat, p_value = stats.f_oneway(*samples)
    print(f"\n--- ANOVA for {column_name} ---")
    print(f"F-statistic: {f_stat:.2f}, p-value: {p_value:.4f}")

    # Post-hoc Tukey HSD test only if the omnibus ANOVA is significant
    if p_value < alpha:
        posthoc = pairwise_tukeyhsd(scores, labels, alpha=alpha)
        print(posthoc)


In [9]:
# Run the ANOVA (plus post-hoc, when significant) for Q1 and Q5.
# The strings must match the CSV column headers exactly, including the
# double space in Q1 and the embedded newline in Q5.
for question in (
    "How engaged were you during scenes that included Pepper’s arm gestures?  (1: Not engaged → 5: Highly engaged)",
    "How did scenes with arm gestures compare to ones without, in making you feel immersed?\n(1: Less immersive → 5: More immersive)",
):
    run_anova_test(question)


--- ANOVA for How engaged were you during scenes that included Pepper’s arm gestures?  (1: Not engaged → 5: Highly engaged) ---
F-statistic: 17.81, p-value: 0.0001
                    Multiple Comparison of Means - Tukey HSD, FWER=0.05                    
         group1                     group2           meandiff p-adj   lower   upper  reject
-------------------------------------------------------------------------------------------
           No difference    Scenes with arm gestures   2.5333 0.0005  1.1759  3.8908   True
           No difference Scenes without arm gestures   0.6667 0.5633 -0.9795  2.3128  False
Scenes with arm gestures Scenes without arm gestures  -1.8667 0.0017 -3.0072 -0.7262   True
-------------------------------------------------------------------------------------------

--- ANOVA for How did scenes with arm gestures compare to ones without, in making you feel immersed?
(1: Less immersive → 5: More immersive) ---
F-statistic: 14.01, p-value: 0.0003
         