# 🧠 Exploratory Data Analysis: Calories Burnt Prediction
This notebook performs exploratory data analysis (EDA) on the calories dataset (`data/calories.csv`) to uncover patterns and trends in calorie expenditure during workouts.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Apply seaborn's white-grid theme to every figure drawn below.
sns.set_theme(style='whitegrid')

## 📥 Load Dataset

In [None]:
# Load the workout records; the relative path is resolved against the
# notebook's current working directory.
calories_df = pd.read_csv(filepath_or_buffer='data/calories.csv')
# Preview the first five rows as the cell's rich output.
calories_df.head(n=5)

## 🔍 Initial Inspection

In [None]:
# Print column dtypes, non-null counts and memory usage.
calories_df.info()
# Count missing values per column; as the last expression it is the cell's output.
calories_df.isna().sum()

## 📊 Feature Distributions

In [None]:
# Columns whose distributions are plotted, one histogram each.
numeric_cols = ['Age', 'Height', 'Weight', 'Duration', 'Heart_Rate', 'Body_Temp', 'Calories']

# A 3x3 grid yields nine panels; flatten it so panels are addressable by position.
fig, axes = plt.subplots(nrows=3, ncols=3, figsize=(16, 12))
axes = axes.flatten()

# Pair each column with its panel and draw a histogram with a KDE overlay.
for ax, col in zip(axes, numeric_cols):
    sns.histplot(calories_df[col], kde=True, ax=ax, color='skyblue')
    ax.set(title=f'Distribution of {col}', xlabel=col, ylabel='Frequency')

# Remove the panels left over after the last column so no empty axes are drawn.
for unused_ax in axes[len(numeric_cols):]:
    fig.delaxes(unused_ax)

plt.tight_layout()
plt.show()

## 📉 Scatter Plots: Features vs Calories

In [None]:
# Columns plotted on the x-axis against Calories, one panel each.
features = ['Age', 'Weight', 'Duration', 'Heart_Rate', 'Body_Temp', 'Height']

# 2x3 grid: exactly one panel per entry in `features`.
fig, axes = plt.subplots(2, 3, figsize=(18, 10))
axes = axes.flatten()

for ax, col in zip(axes, features):
    sns.scatterplot(data=calories_df, x=col, y='Calories', ax=ax, color='orange')
    ax.set_title(f'{col} vs Calories')

plt.tight_layout()
plt.show()

## 🔥 Correlation Heatmap

In [None]:
# Pairwise correlations across the numeric columns only.
# NOTE(review): numeric_only=True keeps every numeric column, including any
# identifier-like column the CSV may contain — confirm that is intended.
corr_matrix = calories_df.corr(numeric_only=True)

# Draw on an explicit Axes rather than pyplot's implicit current figure.
heatmap_fig, heatmap_ax = plt.subplots(figsize=(10, 6))
sns.heatmap(corr_matrix, annot=True, cmap='coolwarm', linewidths=0.5, ax=heatmap_ax)
heatmap_ax.set_title('Correlation Heatmap')
plt.show()

## 📌 Summary of EDA Findings
- The dataset is complete: the `isnull().sum()` check in the Initial Inspection section reports no missing values.
- Calories is strongly and positively correlated with Duration, Heart_Rate, and Body_Temp.
- Calories is only weakly correlated with Age and Height.
- The histograms, scatter plots, and correlation heatmap reveal clear patterns that can guide feature selection for model training.