# Exploratory Data Analysis Template

- **Dataset**: [Dataset name]
- **Date**: [YYYY-MM-DD]
- **Analyst**: [Analyst name]

## Objective
[What question are we answering?]

In [None]:
# Import libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy import stats

# Set style
sns.set_style('whitegrid')
plt.rcParams['figure.figsize'] = (12, 6)

%matplotlib inline

## 1. Data Loading

In [None]:
# Read the dataset from disk (replace 'data.csv' with the real file path)
df = pd.read_csv('data.csv')

# Sanity check: print the (rows, columns) tuple, then preview the first
# rows as the cell's rich output
dataset_shape = df.shape
print(f"Shape: {dataset_shape}")
df.head()

## 2. Data Quality Assessment

In [None]:
# Data types: one entry per column with its pandas dtype
print("Data Types:")
print(df.dtypes)

# Missing values: count nulls per column and report only affected columns.
# The result is printed explicitly because a bare expression is displayed
# only when it is the last statement of a cell; in the middle of a cell it
# would produce no output.
print("\nMissing Values:")
missing = df.isnull().sum()
missing_nonzero = missing[missing > 0]
if missing_nonzero.empty:
    # Say so explicitly rather than printing an empty Series repr
    print("None")
else:
    print(missing_nonzero)

# Duplicates: number of rows flagged by DataFrame.duplicated()
# (by default, rows that repeat an earlier row across all columns)
print(f"\nDuplicates: {df.duplicated().sum()}")

## 3. Statistical Summary

In [None]:
# Summary statistics via pandas' default describe() call, kept in a
# named variable and shown as the cell's rich output
summary_stats = df.describe()
summary_stats

## 4. Distribution Analysis

In [None]:
# Numeric columns (also used by the correlation section)
numeric_cols = df.select_dtypes(include=[np.number]).columns

# Plot distributions: one two-panel figure per numeric column
for col in numeric_cols:
    # Work on the non-missing values only
    values = df[col].dropna()

    # An all-missing column has nothing to draw; skip it instead of
    # producing an empty (or failing) figure.
    if values.empty:
        print(f"Skipping {col}: no non-missing values")
        continue

    fig, axes = plt.subplots(1, 2, figsize=(12, 4))

    # Histogram with KDE
    sns.histplot(values, kde=True, ax=axes[0])
    axes[0].set_title(f'Distribution of {col}')

    # Box plot
    sns.boxplot(x=values, ax=axes[1])
    axes[1].set_title(f'Box Plot of {col}')

    fig.tight_layout()
    plt.show()

    # Release the figure explicitly: pyplot keeps figures registered until
    # they are closed, which adds up when the dataset has many columns.
    plt.close(fig)

## 5. Correlation Analysis

In [None]:
# Pairwise correlations between the numeric columns (pandas' default
# corr() settings)
numeric_frame = df[numeric_cols]
corr_matrix = numeric_frame.corr()

# Annotated heatmap drawn on an explicit Axes; the diverging colormap is
# centred on zero and cells are kept square
fig, ax = plt.subplots(figsize=(10, 8))
sns.heatmap(
    corr_matrix,
    annot=True,
    fmt='.2f',
    cmap='coolwarm',
    center=0,
    square=True,
    ax=ax,
)
ax.set_title('Correlation Matrix')
plt.show()

## 6. Key Findings

### Finding 1
[Description]

### Finding 2
[Description]

### Finding 3
[Description]

## 7. Recommendations

1. [Recommendation 1]
2. [Recommendation 2]
3. [Recommendation 3]