# Netflix Data Cleaning Task
This notebook demonstrates how to clean the Netflix dataset step by step.

In [None]:
import pandas as pd

In [None]:
# Read the raw CSV export into a DataFrame, then preview its first five rows
df = pd.read_csv(filepath_or_buffer='netflix_titles.csv')
df.head(n=5)

In [None]:
# Basic info about the dataset
# Only the final expression of a cell is echoed, so the shape has to be
# printed explicitly; as a bare expression its value was silently discarded.
print(df.shape)
# info() writes its report (columns, non-null counts, dtypes) itself.
df.info()
# Summary statistics; as the last expression, this is what the cell displays.
df.describe()

In [None]:
# Count the missing entries in every column
# (isna() is the canonical spelling of isnull(); the two are aliases)
df.isna().sum()

In [None]:
# Handle missing values
# Rows lacking a director or a cast are removed outright.
df.dropna(subset=['director', 'cast'], inplace=True)
# A missing country is kept and labelled 'Unknown'. The result is assigned
# back instead of calling fillna(inplace=True) on df['country']: that chained
# form operates on an intermediate object, is deprecated in pandas 2.x, and
# leaves df unchanged when Copy-on-Write is enabled.
df['country'] = df['country'].fillna('Unknown')

In [None]:
# Drop rows that are exact repeats of an earlier row, keeping the first
# occurrence; df is modified in place
df.drop_duplicates(keep='first', inplace=True)

In [None]:
# Normalize text columns
# 'type': lower-case first, then trim surrounding whitespace
type_lowered = df['type'].str.lower()
df['type'] = type_lowered.str.strip()
# 'country': trim surrounding whitespace only (case is left untouched)
df['country'] = df['country'].str.strip()

In [None]:
# Convert 'date_added' to datetime
date_added = df['date_added']
# Trim surrounding whitespace before parsing. When pandas parses against a
# single inferred format, a value with a stray leading/trailing space does not
# match, and errors='coerce' would then silently turn that valid date into NaT.
# The dtype guard keeps the cell re-runnable: once the column is already
# datetime, the .str accessor is unavailable and stripping is unnecessary.
if pd.api.types.is_string_dtype(date_added):
    date_added = date_added.str.strip()
# Values that still cannot be parsed become NaT rather than raising.
df['date_added'] = pd.to_datetime(date_added, errors='coerce')

In [None]:
# Bring column labels to snake_case, one transformation at a time
column_labels = df.columns.str.strip()              # trim surrounding whitespace
column_labels = column_labels.str.lower()           # lower-case
df.columns = column_labels.str.replace(' ', '_')    # spaces -> underscores

In [None]:
# Check data types
# Shows the dtype pandas currently holds for each column of df, e.g. to
# confirm that 'date_added' is now a datetime column after the conversion.
df.dtypes

In [None]:
# Write the cleaned DataFrame to a new CSV file; index=False leaves the row
# index out of the output
df.to_csv(path_or_buf='netflix_cleaned.csv', index=False)