# 🎬 Netflix Data Cleaning & Analysis Project
This project analyzes data from Netflix's library of movies and TV shows. We'll clean the data and explore some trends using Python.

In [None]:
# Step 1: Import libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np

# Apply seaborn's 'darkgrid' style to the plots drawn below
sns.set(style='darkgrid')

# Read the Netflix titles CSV (path is relative to the working directory)
# and show the first rows as a quick sanity check
csv_path = 'netflix_titles.csv'
df = pd.read_csv(csv_path)
df.head()

## Step 2: Data Overview

In [None]:
# Print a concise summary of the DataFrame (columns, non-null counts, dtypes)
# to see which columns have gaps before cleaning
df.info()

## Step 3: Handle Missing Values

In [None]:
# Count the missing entries in each column
df.isna().sum()

In [None]:
# Rows lacking any of these key fields are removed outright
required_columns = ['title', 'type', 'release_year']
df.dropna(subset=required_columns, inplace=True)

# Every remaining gap, in any column, gets the placeholder 'Unknown'
df.fillna(value='Unknown', inplace=True)

## Step 4: Convert Date Column

In [None]:
# Convert 'date_added' to datetime.
# Surrounding whitespace is stripped first: recent pandas versions infer one
# date format from the first parseable value, so an entry such as
# ' August 4, 2017' (leading space) would not match that format and, with
# errors='coerce', would silently turn into NaT instead of a real date.
# NOTE(review): the public netflix_titles.csv is reported to contain such
# padded dates — confirm against your copy of the file.
date_text = df['date_added']
if not pd.api.types.is_datetime64_any_dtype(date_text):
    # Skip the string clean-up when the cell is re-run on an already
    # converted column (the .str accessor is not available on datetimes).
    date_text = date_text.astype(str).str.strip()
df['date_added'] = pd.to_datetime(date_text, errors='coerce')

# Values that still cannot be parsed (e.g. the 'Unknown' placeholder) are NaT,
# so the derived year/month are missing for those rows.
df['year_added'] = df['date_added'].dt.year
df['month_added'] = df['date_added'].dt.month

## Step 5: Basic Analysis - Movies vs TV Shows

In [None]:
# Bar chart with one bar per value of the 'type' column, showing how many
# titles fall under each
ax = sns.countplot(x='type', data=df)
ax.set_title('Movies vs TV Shows on Netflix')
plt.show()