# In [None]:
# Jupyter Notebook Cell 1: Load Data
import pandas as pd

# Read the three processed CSV files, in order, into one DataFrame each:
# parsed JSON logs, parsed surveys, and labeled transcripts.
json_logs, surveys, transcripts = (
    pd.read_csv(csv_path)
    for csv_path in (
        "data/processed/json_logs_parsed.csv",
        "data/processed/surveys_parsed.csv",
        "data/processed/transcripts_labeled.csv",
    )
)

# Jupyter Notebook Cell 2: Merge Data
# Only these columns are carried from each table into the merged frame.
log_columns = ['team_id', 'timestamp', 'game_score', 'advice_type']
survey_columns = ['team_id', 'cohesion_score']

# Join the two tables on team_id. No `how` is given, so pandas uses its
# default inner join and keeps only team_ids present in both tables.
# NOTE(review): if surveys has more than one row per team_id, every log row
# is repeated once per matching survey row -- confirm surveys is one row per team.
merged = json_logs[log_columns].merge(surveys[survey_columns], on='team_id')

# Jupyter Notebook Cell 3: Statistical Test
from scipy.stats import spearmanr

# Spearman rank correlation between game_score and cohesion_score.
#
# spearmanr propagates NaN by default, so a single missing value in either
# column would make both the coefficient and the p-value NaN. Run the test
# only on rows where both values are present.
# NOTE(review): merged presumably holds one row per log entry, so a team with
# more log rows contributes more pairs -- confirm that weighting is intended.
paired = merged[['game_score', 'cohesion_score']].dropna()

corr, p_value = spearmanr(paired['game_score'], paired['cohesion_score'])
print(f"Spearman’s ρ: {corr:.2f}, p = {p_value:.3f}")

# Jupyter Notebook Cell 4: Visualization
import os

import seaborn as sns
import matplotlib.pyplot as plt

# Scatter of game score against cohesion score, one point per merged row,
# colored by advice type.
sns.scatterplot(data=merged, x='game_score', y='cohesion_score', hue='advice_type')
plt.title("Game Score vs. Cohesion Score by Advice Type")

# savefig does not create missing directories; make sure the output folder
# exists so a fresh checkout does not fail with FileNotFoundError.
output_path = "results/correlation_plot.png"
os.makedirs(os.path.dirname(output_path), exist_ok=True)
plt.savefig(output_path)