# Exploratory Data Analysis (EDA) Template
This notebook provides a reusable template for performing EDA on any tabular dataset that can be loaded from a CSV file into a pandas DataFrame; it is particularly suitable for Kaggle datasets.

In [None]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import plotly.express as px

# Use seaborn's 'whitegrid' style for the plots drawn below.
sns.set(style='whitegrid')
# IPython magic (not plain Python): render matplotlib figures inline in the notebook.
%matplotlib inline

## Load the Dataset

In [None]:
# Location of the CSV file to analyse -- replace 'your_dataset.csv' with your dataset file.
csv_path = 'your_dataset.csv'
df = pd.read_csv(csv_path)

# Preview the first rows as the cell output.
df.head()

## Basic Dataset Information

In [None]:
# Print the per-column dtype and non-null count summary.
df.info()

# Descriptive statistics, transposed so that each described column becomes a row.
summary_stats = df.describe()
summary_stats.transpose()

## Missing Values

In [None]:
# Count the null entries in each column, then keep only the columns that have any.
null_counts = df.isna().sum()
missing = null_counts[null_counts > 0]

# Show the affected columns, largest count first.
missing.sort_values(ascending=False)

## Data Types Overview

In [None]:
# Tally how many columns there are of each dtype.
dtype_counts = df.dtypes.value_counts()
dtype_counts

## Distribution of Numerical Features

In [None]:
# Names of all numeric columns; the cells below reuse `num_cols`.
num_cols = df.select_dtypes(include=[np.number]).columns

# One 30-bin histogram per numeric column, drawn on a shared 15x10 figure.
numeric_frame = df[num_cols]
numeric_frame.hist(bins=30, figsize=(15, 10), edgecolor='black')
plt.tight_layout()

## Correlation Heatmap

In [None]:
# Open a 12x8 figure for the heatmap.
plt.figure(figsize=(12, 8))

# Pairwise correlations of the numeric columns, annotated to two decimals.
corr_matrix = df[num_cols].corr()
sns.heatmap(corr_matrix, cmap='coolwarm', annot=True, fmt='.2f')

## Feature Distributions with Seaborn

In [None]:
# Example: histogram with a KDE overlay for a single column
# (here the first numeric column; swap in any column of interest).
first_numeric = num_cols[0]
sns.histplot(df[first_numeric], kde=True)

## Interactive Visualization with Plotly

In [None]:
# Example: interactive scatter plot of the first two numeric columns.
# A third numeric column, when there is one, drives the marker colour.
if len(num_cols) >= 2:
    fig = px.scatter(
        df,
        x=num_cols[0],
        y=num_cols[1],
        color=num_cols[2] if len(num_cols) > 2 else None,
    )
else:
    # num_cols[1] would raise IndexError with fewer than two numeric columns,
    # so skip the plot with a message instead of crashing the notebook run.
    fig = None
    print('Skipping scatter plot: at least two numeric columns are required.')

# Keep the figure as the cell's last expression so the notebook renders it
# (a value of None renders nothing).
fig

## Categorical Features Analysis

In [None]:
# Treat object-dtype columns (typically strings) and pandas 'category' columns
# as categorical; selecting only 'object' would skip columns already stored
# with the category dtype.
cat_cols = df.select_dtypes(include=['object', 'category']).columns

# Print the frequency of each distinct value, one categorical column at a time.
for col in cat_cols:
    print(f'\nValue counts for {col}:')
    print(df[col].value_counts())