# 🧹 IPL Data Cleaning Notebook

This notebook loads and cleans the `matches.csv` and `deliveries.csv` datasets for IPL Data Analytics.

In [None]:
# 📦 Import required libraries
import pandas as pd
import numpy as np

# Show every column when a DataFrame is rendered (None removes the column cap)
pd.options.display.max_columns = None

In [None]:
# 📂 Load datasets
# Both paths are relative ('../data/...'), so they resolve against the
# notebook's current working directory.
matches = pd.read_csv('../data/matches.csv')
deliveries = pd.read_csv('../data/deliveries.csv')

## 🔍 Inspect Matches Dataset

In [None]:
# Preview the first few rows of the matches data as a quick sanity check
matches.head()

In [None]:
# Print a per-column summary (dtypes and non-null counts) to spot missing data
matches.info()

## 🧼 Clean Matches Dataset

In [None]:
# Drop the umpire columns, which are not needed for basic analysis.
# errors='ignore' makes this cell safe to re-run: without it, a second run
# raises KeyError because the columns have already been removed, and the
# same happens for any input file that lacks one of these columns.
matches.drop(
    columns=['umpire1', 'umpire2', 'umpire3'],
    inplace=True,
    errors='ignore',
)

# Count the remaining nulls per column
matches.isnull().sum()

## 🔍 Inspect Deliveries Dataset

In [None]:
# Preview the first few rows of the deliveries data as a quick sanity check
deliveries.head()

In [None]:
# Print a per-column summary (dtypes and non-null counts) to spot missing data
deliveries.info()

## 🧼 Clean Deliveries Dataset

In [None]:
# Replace missing batsman names with the placeholder 'Unknown'.
# The result is assigned back to the column rather than calling
# fillna(inplace=True) on deliveries['batsman']: that chained in-place call
# operates on an intermediate object, triggers a FutureWarning on pandas 2.x,
# and leaves `deliveries` unchanged when Copy-on-Write is enabled.
deliveries['batsman'] = deliveries['batsman'].fillna('Unknown')

# Count the remaining nulls per column
deliveries.isnull().sum()

## 💾 Save Cleaned Data

In [None]:
# Write both cleaned frames to the same '../data' directory the raw files
# were read from; index=False keeps the DataFrame row index out of the CSV.
matches.to_csv('../data/matches_cleaned.csv', index=False)
deliveries.to_csv('../data/deliveries_cleaned.csv', index=False)
print("✅ Cleaned files saved!")