# 📊 Netflix Data Analytics – Beginner Version
Created by **Suman Rajput** | 📅 June 29, 2025

This beginner-friendly project explores the Netflix dataset using basic data analysis techniques in Python.  
We’ll analyze trends in content type, country, categories, and more – using dark mode visualizations.

---


In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Theme order matters: sns.set() rewrites matplotlib's rcParams (figure/axes
# face colours, text colours, ...). Calling it *after* plt.style.use() would
# overwrite the dark background, so the seaborn theme is applied first and the
# matplotlib dark style is layered on top of it.
sns.set(style="darkgrid")
plt.style.use('dark_background')

# Load the raw catalogue; the CSV is expected in the working directory.
df = pd.read_csv("netflix_titles.csv")

# Parse the "date added" strings into datetimes. Surrounding whitespace is
# stripped first: with errors='coerce' any string that does not match the
# inferred date format is silently turned into NaT, and a padded value such as
# " August 4, 2017" would be lost that way.
# NOTE(review): assumes `date_added` is a text column — confirm for your copy
# of the dataset.
df['date_added'] = pd.to_datetime(df['date_added'].str.strip(), errors='coerce')

# Year component used by the "content added over the years" chart.
# Rows whose date could not be parsed (NaT) get NaN here.
df['year_added'] = df['date_added'].dt.year
df.head()


In [None]:
# Bar chart with one bar per distinct value of the `type` column.
plt.figure(figsize=(6, 4))
# Passing `palette` without `hue` is deprecated in seaborn 0.13 and slated for
# removal; the documented replacement is to map the same column to `hue` and
# switch off the (redundant) legend. Requires seaborn >= 0.13.
sns.countplot(data=df, x='type', hue='type', palette='cool', legend=False)
plt.title('Distribution of Content Types')
plt.show()


In [None]:
# Count titles per individual country.
# A single `country` cell may list several countries separated by commas
# (co-productions). Counting the raw strings would treat every combination as
# its own "country" and under-count each real one, so the cell is split into
# one row per country before counting.
# NOTE(review): assumes comma-separated country names, as in the public
# netflix_titles.csv — confirm against your copy of the data.
countries = (
    df['country']
    .dropna()
    .str.split(',')
    .explode()
    .str.strip()
)
# Drop empty fragments left behind by stray leading/trailing commas.
countries = countries[countries != '']

# value_counts() already sorts descending and ignores missing values, so no
# extra dropna() is needed before taking the first ten.
top_countries = countries.value_counts().head(10)

top_countries.plot(kind='bar', figsize=(8, 4), color='orange')
plt.title('Top 10 Countries with Most Content')
plt.ylabel('Number of Titles')
plt.show()


In [None]:
# Number of titles per `year_added` value, ordered chronologically by
# sorting on the index (the year) instead of on the counts.
year_counts = df['year_added'].value_counts()
content_by_year = year_counts.sort_index()

# Series.plot() hands back the Axes it drew on; the title and y-label are set
# on that object directly.
ax = content_by_year.plot(
    kind='line',
    marker='o',
    color='lime',
    figsize=(10, 4),
)
ax.set_title('Content Added Over the Years')
ax.set_ylabel('Titles Added')
plt.show()


In [None]:
from collections import Counter

# `listed_in` holds several labels per title joined by ', '. Split each cell
# into its labels, flatten them into one list, and keep the ten most frequent.
categories = df['listed_in'].dropna().str.split(', ')
flat_categories = [cat for sublist in categories for cat in sublist]
top_categories = dict(Counter(flat_categories).most_common(10))

# Horizontal bars: label on the y-axis, count on the x-axis.
genre_names = list(top_categories)
genre_counts = list(top_categories.values())
# Passing `palette` without `hue` is deprecated in seaborn 0.13 and slated for
# removal; map the labels to `hue` as well and hide the redundant legend.
# Requires seaborn >= 0.13.
sns.barplot(
    x=genre_counts,
    y=genre_names,
    hue=genre_names,
    palette='viridis',
    legend=False,
)
plt.title('Top 10 Genres / Categories')
plt.show()
