# Netflix Data Cleaning Task

This notebook cleans and preprocesses the Netflix Movies and TV Shows dataset.

In [None]:
import pandas as pd

# Read the raw Netflix titles CSV from the working directory into a DataFrame,
# then show its first five rows as the cell output.
df = pd.read_csv("netflix_titles.csv")
df.head(n=5)

In [None]:
# Per-column count of missing entries (isna is the pandas alias of isnull).
df.isna().sum()

In [None]:
# Discard rows that repeat an earlier row in every column; the first
# occurrence is kept and the surviving rows keep their original index labels.
df = df.drop_duplicates(keep="first")

In [None]:
# Standardize text format.
# Surrounding whitespace is trimmed on every column before case-folding so
# that padded values (e.g. "TV-MA ") do not survive as separate categories.
# Missing values stay missing: the .str accessor propagates NaN.
# NOTE(review): this cell indexes columns by their lowercase names before the
# header-normalizing cell runs - confirm the raw header already uses exactly
# these names.
df['country'] = df['country'].str.strip().str.title()
df['rating'] = df['rating'].str.strip().str.upper()
df['type'] = df['type'].str.strip().str.title()

In [None]:
# Convert date_added to datetime.
# Whitespace is trimmed first: pandas (2.0+) infers one format from the first
# value and, with errors='coerce', silently turns every value that does not
# match it - including an otherwise valid date with a stray leading space such
# as " August 4, 2017" - into NaT.
# Going through the 'string' dtype keeps the .str accessor usable even if the
# column is empty or this cell is re-run after the column is already datetime.
date_text = df['date_added'].astype('string').str.strip()
# Values that still cannot be parsed become NaT instead of raising.
df['date_added'] = pd.to_datetime(date_text, errors='coerce')

In [None]:
# Normalize the header to snake_case in three steps:
# trim surrounding whitespace, lowercase, then turn spaces into underscores.
trimmed_names = df.columns.str.strip()
lowered_names = trimmed_names.str.lower()
df.columns = lowered_names.str.replace(' ', '_')

In [None]:
# Cast release_year to pandas' nullable integer dtype so that missing years
# can be represented as <NA> without falling back to floats.
df = df.astype({'release_year': 'Int64'})

In [None]:
# Write the cleaned frame next to the notebook (without the index column)
# and report the output filename.
cleaned_csv = 'netflix_titles_cleaned.csv'
df.to_csv(cleaned_csv, index=False)
print(f"Cleaned dataset saved as '{cleaned_csv}'")