# 📊 Data Visualization Notebook
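This notebook visualizes the cleaned IMDb movies dataset (`imdb_movies_cleaned.csv`) with three plots: the distribution of ratings, the ten most frequent genres, and ratings plotted against year.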

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the cleaned IMDb CSV (path is relative to the working directory) into `df`
df = pd.read_csv(filepath_or_buffer='imdb_movies_cleaned.csv')

In [None]:
# Histogram of the 'Rating' column: 20 bins with a KDE curve overlaid
fig, ax = plt.subplots(figsize=(8, 5))
sns.histplot(data=df['Rating'], bins=20, kde=True, ax=ax)
ax.set(
    title='Distribution of IMDb Ratings',
    xlabel='Rating',
    ylabel='Count',
)
plt.show()

In [None]:
# Bar chart of the ten most frequent values in the 'Genre' column.
# Nothing is drawn when the dataset has no 'Genre' column.
if 'Genre' in df.columns:
    genre_counts = df['Genre'].value_counts().head(10)
    ax = genre_counts.plot.bar(figsize=(10, 5), title='Top 10 Genres')
    ax.set_ylabel('Number of Movies')
    plt.show()

In [None]:
# Scatter plot of 'Rating' against 'Year'; points are half-transparent (alpha=0.5)
fig, ax = plt.subplots(figsize=(10, 6))
sns.scatterplot(data=df, x='Year', y='Rating', alpha=0.5, ax=ax)
ax.set(
    title='IMDb Rating Over Years',
    xlabel='Year',
    ylabel='Rating',
)
plt.show()