# ZIP Code EDA Project
This notebook performs exploratory data analysis on a synthetic dataset containing ZIP codes, states, cities, and user counts.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Apply seaborn's 'whitegrid' theme to every figure drawn in this notebook.
# set_theme() is the preferred interface; sns.set() is only an alias for it
# that seaborn documents as possibly being removed in the future.
sns.set_theme(style='whitegrid')

In [None]:
# Load the dataset and preview the first rows.
# ZIP codes are identifiers, not quantities: read them as strings so that
# leading zeros (e.g. '02134') are preserved and the column is not treated
# as a number by later numeric summaries and plots.
data = pd.read_csv('sample_zip_data.csv', dtype={'ZIP Code': str})
data.head()

In [None]:
# Dataset overview: prints each column's name, non-null count and dtype,
# followed by the frame's memory usage
data.info()

In [None]:
# Summary statistics for every column.
# The default describe() only reports numeric columns, so text columns such
# as 'State' would be left out entirely. include='all' adds their
# count / unique / top / freq rows; statistics that do not apply to a
# column's type are shown as NaN.
data.describe(include='all')

In [None]:
# Number of missing entries in each column
data.isna().sum()

In [None]:
# The ten ZIP codes with the highest total user count, largest first
top_zip = (
    data
    .groupby(by='ZIP Code')['Users']
    .sum()
    .sort_values(ascending=False)
    .iloc[:10]
)
top_zip

In [None]:
# Total users per state, ordered from the largest total to the smallest
state_dist = (
    data
    .groupby(by='State')['Users']
    .sum()
    .sort_values(ascending=False)
)
state_dist

In [None]:
# Plot: Top 10 ZIP Codes by Users (horizontal bars, highest total first)
fig, ax = plt.subplots(figsize=(10, 6))
# ZIP codes are labels, not quantities. If they were parsed as integers, both
# axes would be numeric and seaborn would default to vertical bars, treating
# the user counts as the categories and the ZIP codes as the bar lengths.
# Casting the labels to str and pinning orient='h' guarantees one bar per
# ZIP code, drawn in the ranked order of top_zip.
# NOTE: seaborn >= 0.13 emits a FutureWarning for `palette` without `hue`.
sns.barplot(
    x=top_zip.values,
    y=top_zip.index.astype(str),
    orient='h',
    palette='viridis',
    ax=ax,
)
ax.set_title('Top 10 ZIP Codes by Users')
ax.set_xlabel('User Count')
ax.set_ylabel('ZIP Code')
fig.tight_layout()
plt.show()

In [None]:
# Plot: Total Users by State (one vertical bar per state, largest total first)
fig, ax = plt.subplots(figsize=(8, 5))
sns.barplot(
    x=state_dist.index,
    y=state_dist.values,
    palette='muted',
    ax=ax,
)
ax.set_title('User Distribution by State')
ax.set_xlabel('State')
ax.set_ylabel('User Count')
fig.tight_layout()
plt.show()