# Exploratory Data Analysis (EDA)
This notebook explores the wireless sensor network (WSN) dataset, visualizes feature distributions, and investigates relationships between features and targets.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Load the dataset from a relative path into the DataFrame used by the
# cells below.
data_path = '../data/wsn_dataset.csv'
df = pd.read_csv(data_path)

# Preview the first rows to sanity-check the load.
df.head()

## Dataset Info and Missing Values

In [None]:
# Print a per-column summary (dtype and non-null count).
df.info()

# Count missing values in each column; as the last expression in the cell,
# this is what the notebook displays.
df.isna().sum()

## Feature Distributions

In [None]:
# Select every numeric column regardless of bit width. Listing only
# 'float64' and 'int64' would silently skip columns stored as, e.g.,
# int32 or float32.
numeric_cols = df.select_dtypes(include='number').columns

# Draw one histogram per numeric column on a single 12x8 inch figure.
df[numeric_cols].hist(figsize=(12, 8))
plt.tight_layout()  # adjust subplot spacing so titles and tick labels fit
plt.show()

## Categorical Feature Counts

In [None]:
# Columns plotted as categorical variables.
categorical_cols = ['Node_ID', 'Congestion_Status', 'Latency_Category']

for column in categorical_cols:
    # Bar chart of how many rows fall into each distinct value of the column.
    axes = sns.countplot(data=df, x=column)
    axes.set_title(f'{column} Distribution')
    plt.show()

## Correlation Heatmap

In [None]:
# Pairwise correlations, computed over the numeric columns only.
corr_matrix = df.corr(numeric_only=True)

# Annotated heatmap of the correlation matrix on a 10x7 inch figure.
fig, ax = plt.subplots(figsize=(10, 7))
sns.heatmap(corr_matrix, annot=True, cmap='coolwarm', ax=ax)
ax.set_title('Correlation Heatmap')
plt.show()

## Pairplot for Key Features

In [None]:
# Pairwise scatter plots of the selected features, with points coloured by
# their Latency_Category value.
key_features = ['Packet_Size', 'Energy_Level', 'Link_Quality', 'PDR']
sns.pairplot(data=df, vars=key_features, hue='Latency_Category')
plt.show()