# Weight Management Project
Exploratory Data Analysis & Hypothesis Testing

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy.stats import ttest_ind


# Read the dataset from the CSV file in the working directory.
df = pd.read_csv(filepath_or_buffer="weight_mgmt_dataset.csv")

# Show the first five rows as a quick sanity check of the loaded columns.
df.head(n=5)

In [None]:
# Summary statistics for the DataFrame, rounded to two decimal places.
df.describe().round(decimals=2)

In [None]:
# Line chart of the 'Weight' column against the 'Date' column, one marker
# per row of the DataFrame.
plt.figure(figsize=(12, 6))
# The column key is 'Weight'; a stray ')' inside the key raises KeyError.
plt.plot(df['Date'], df['Weight'], marker='o')
# Rotate the date tick labels so neighbouring labels do not overlap.
plt.xticks(rotation=45)
plt.title('Weight Changing Over Time')
plt.xlabel('Date')
plt.ylabel('Weight')
plt.grid(True)
plt.tight_layout()
plt.show()

In [None]:
# Pairwise correlation matrix of every column except 'Date'.
corr = df.drop('Date', axis=1).corr()

# Draw the matrix as an annotated heatmap on a dedicated 8x5 figure.
fig, ax = plt.subplots(figsize=(8, 5))
sns.heatmap(
    corr,
    annot=True,       # print the coefficient inside each cell
    fmt='.2f',        # two decimal places per annotation
    cmap='coolwarm',
    linewidths=.5,
    ax=ax,
)
ax.set_title('Correlation Heatmap')
fig.tight_layout()
plt.show()

In [None]:
# Split the weight readings by whether any gym time was logged in the row.
# Missing weights are dropped up front: Series.mean() already skips NaN, but
# ttest_ind propagates NaN by default, which would make the test result NaN
# while the printed averages still look valid.
gym_days = df.loc[df['Gym (min)'] > 0, 'Weight'].dropna()
no_gym_days = df.loc[df['Gym (min)'] == 0, 'Weight'].dropna()

# equal_var=False selects Welch's t-test, which does not assume that the two
# groups share the same variance.
t_stat, p_val = ttest_ind(no_gym_days, gym_days, equal_var=False)
print(f"Average Weight (Gym Days): {gym_days.mean():.2f} kg")
print(f"Average Weight (No-Gym Days): {no_gym_days.mean():.2f} kg")
print(f"T-statistic: {t_stat:.3f}")
print(f"P-value: {p_val:.4f}")
if np.isnan(p_val):
    # A NaN p-value means the test is undefined (for example, a group with
    # too few readings); it must not be reported as "not significant".
    print('T-test result is undefined (NaN); check group sizes and variance')
elif p_val < 0.05:
    print('Difference is statistically significant (p < 0.05)')
else:
    print('No statistically significant differences (p >= 0.05)')

**Conclusion:** The exploratory analysis shows a general downward trend in weight over the observation period. Welch's t-test did not reveal a statistically significant difference in mean weight between gym and no-gym days (p ≥ 0.05), which suggests that calorie intake might play a stronger role than gym minutes alone within this short observation window.