In [None]:
# === Load Libraries ===
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import plotly.express as px

# === Load Data ===
df = pd.read_csv("../data/netflix_titles.csv")

# === Basic Cleaning ===
# Normalise the raw date strings before parsing: stray leading/trailing
# whitespace is enough to break pandas' inferred date format, and a single
# bad value would otherwise abort the whole notebook with a ValueError.
raw_date_added = df['date_added'].str.strip()

# errors='coerce' turns anything that still cannot be parsed into NaT
# instead of raising; rows that were already missing stay missing.
df['date_added'] = pd.to_datetime(raw_date_added, errors='coerce')

# Surface (rather than silently hide) values that were present in the CSV
# but could not be interpreted as dates.
n_unparsed = int((df['date_added'].isna() & raw_date_added.notna()).sum())
if n_unparsed:
    print(f"Warning: {n_unparsed} 'date_added' value(s) could not be parsed and were set to NaT")

# Calendar year / month in which each title was added (NaN where the date
# is missing).
df['year_added'] = df['date_added'].dt.year
df['month_added'] = df['date_added'].dt.month

# === Movies vs TV Shows ===
# Draw the per-category row counts of the `type` column on an explicit Axes.
type_fig, type_ax = plt.subplots()
sns.countplot(x="type", data=df, ax=type_ax)
type_ax.set_title("Movies vs TV Shows on Netflix")
plt.show()

# === Content Growth by Year ===
# `year_added` is float whenever any row lacks a date (NaN cannot live in an
# int column), which makes the bar labels read "2019.0". Drop the missing
# years and cast to int so the x-axis shows plain years. value_counts()
# already ignores NaN, so the counts themselves are unchanged.
titles_per_year = (
    df['year_added']
    .dropna()
    .astype(int)
    .value_counts()
    .sort_index()  # chronological order rather than most-frequent-first
)
growth_ax = titles_per_year.plot(kind='bar', figsize=(10, 5))
growth_ax.set_title("Content Added to Netflix Over Time")
growth_ax.set_xlabel("Year Added")
growth_ax.set_ylabel("Number of Titles")
plt.show()

# === Top 10 Countries ===
# NOTE(review): `country` is treated here as a comma-separated list (same
# layout this notebook assumes for `listed_in`) - confirm against the CSV.
# Counting the raw string would rank each distinct *combination* of countries
# as its own entry, so split the field and count every country individually.
# If the column only ever holds a single country, the split is a no-op.
country_names = df['country'].dropna().str.split(',').explode().str.strip()
# Discard empty fragments left behind by stray or trailing commas.
country_names = country_names[country_names != '']
top_countries = country_names.value_counts().head(10)

# Pass x/y explicitly so the axes get meaningful labels instead of the
# generic ones plotly derives from a bare Series.
country_fig = px.bar(
    x=top_countries.index,
    y=top_countries.values,
    labels={'x': 'Country', 'y': 'Number of Titles'},
    title="Top Countries with Most Netflix Titles",
)
country_fig.show()

# === Popular Genres ===
# Split each `listed_in` entry on commas, give every piece its own row, and
# trim the whitespace that surrounds the separators.
genre_lists = df['listed_in'].str.split(',')
genres = genre_lists.explode().str.strip()

# Bar chart of the ten most frequent values.
top_genres = genres.value_counts().head(10)
genre_ax = top_genres.plot(kind='bar')
genre_ax.set_title("Top 10 Netflix Genres")
plt.show()
