In [None]:
from pathlib import Path

import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns
from scipy.stats import ttest_ind

# Read the screen-time / mood spreadsheet into `df` and preview the first rows.
dataset_path = 'data/screen_time_mood_data.xlsx'
df = pd.read_excel(dataset_path)
df.head()


In [None]:
# Screen Time Distribution
# Histogram of the Total_Screen_Minutes column, shown inline and saved as a PNG.
chart_path = Path('charts/screen_time_distribution.png')
# savefig does not create missing folders, so make sure the output directory
# exists; exist_ok keeps this cell safe to re-run.
chart_path.parent.mkdir(parents=True, exist_ok=True)

fig, ax = plt.subplots(figsize=(8, 5))
ax.hist(df['Total_Screen_Minutes'], bins=20, edgecolor='black')
ax.set_title('Distribution of Total Daily Screen Time')
ax.set_xlabel('Screen Time (minutes)')
ax.set_ylabel('Frequency')
fig.savefig(chart_path)
plt.show()


In [None]:
# Stress Score Distribution
# Histogram of the Stress_Score column, shown inline and saved as a PNG.
chart_path = Path('charts/stress_distribution.png')
# savefig does not create missing folders, so make sure the output directory
# exists; exist_ok keeps this cell safe to re-run.
chart_path.parent.mkdir(parents=True, exist_ok=True)

fig, ax = plt.subplots(figsize=(8, 5))
ax.hist(df['Stress_Score'], bins=10, edgecolor='black')
ax.set_title('Distribution of Stress Scores')
ax.set_xlabel('Stress Score')
ax.set_ylabel('Frequency')
fig.savefig(chart_path)
plt.show()


In [None]:
# Correlation Matrix
# Pairwise correlations (pandas default: Pearson) between screen time, stress
# and mood, drawn as an annotated heatmap, saved as a PNG, and displayed as a
# table via the cell's last expression.
corr = df[['Total_Screen_Minutes', 'Stress_Score', 'Mood_Score']].corr()

chart_path = Path('charts/correlation_matrix.png')
# savefig does not create missing folders, so make sure the output directory
# exists; exist_ok keeps this cell safe to re-run.
chart_path.parent.mkdir(parents=True, exist_ok=True)

fig, ax = plt.subplots(figsize=(6, 5))
# Pin the colour scale to the full correlation range. Left to auto-scale, the
# limits come from the data (the diagonal is always 1), so the neutral midpoint
# of the diverging 'coolwarm' map would not line up with r = 0.
sns.heatmap(corr, annot=True, cmap='coolwarm', fmt=".2f", vmin=-1, vmax=1, ax=ax)
ax.set_title('Correlation Matrix')
fig.savefig(chart_path)
plt.show()
corr


In [None]:
# Hypothesis Testing
# Compare stress and mood scores between high and low screen-time groups using
# Welch's t-test (equal_var=False: the groups are not assumed to share a variance).
SCREEN_THRESHOLD_MINUTES = 240  # group split point; 240 minutes = 4 hours

# Rows whose screen time is missing land in neither group, because comparisons
# against NaN evaluate to False.
high_screen = df[df['Total_Screen_Minutes'] > SCREEN_THRESHOLD_MINUTES]
low_screen = df[df['Total_Screen_Minutes'] <= SCREEN_THRESHOLD_MINUTES]

# Stress Score T-test
# Missing scores are dropped per group first: ttest_ind propagates NaN by
# default, so a single missing value would turn both t and p into NaN.
stress_tstat, stress_pval = ttest_ind(
    high_screen['Stress_Score'].dropna(),
    low_screen['Stress_Score'].dropna(),
    equal_var=False,
)

# Mood Score T-test
mood_tstat, mood_pval = ttest_ind(
    high_screen['Mood_Score'].dropna(),
    low_screen['Mood_Score'].dropna(),
    equal_var=False,
)

print('Stress Score T-test: t =', round(stress_tstat, 3), ', p =', round(stress_pval, 4))
print('Mood Score T-test: t =', round(mood_tstat, 3), ', p =', round(mood_pval, 4))
