Loading & Inspecting Data

In [None]:
import pandas as pd

# Read the raw auction CSV into `df`, the working DataFrame the later cells use.
print("Loading IPL Auction Dataset...")
df = pd.read_csv("IPLPlayerAuctionData.csv")

print(f"Dataset loaded with {df.shape[0]} rows and {df.shape[1]} columns.\n")

print("Column names:")
print(df.columns)

print("\nPreview of the data:")
print(df.head())

print("\nDataset info:")
# DataFrame.info() writes its summary straight to stdout and returns None,
# so wrapping it in print() would emit a stray "None" line after the summary.
df.info()


Data Cleaning

In [None]:
# Normalise the headers: trim surrounding whitespace, then swap spaces for underscores.
print("Cleaning column names...")
trimmed_headers = df.columns.str.strip()
df.columns = trimmed_headers.str.replace(' ', '_')

# Forward-fill gaps in 'Year' from the last preceding non-missing value,
# then cast the column to int.
print("Filling missing 'Year' values...")
year_filled = df['Year'].ffill()
df['Year'] = year_filled.astype(int)

Adding Required Columns

In [None]:
# Derive 'Amount_Cr' by scaling 'Amount' down by 1e7
# (presumably rupees -> crore; TODO confirm the units of 'Amount').
print("Creating 'Amount_Cr' column...")
df['Amount_Cr'] = df['Amount'].div(1e7)

# For every row, record how many rows share that row's 'Player' value.
print("Calculating player appearance counts...")
appearances = df.groupby('Player')['Player'].transform('count')
df['Count'] = appearances

# Flag rows whose player appears in more than one row.
print("Marking repeated players...")
df['Repeated'] = df['Count'].gt(1)

Saving the Cleaned Data

In [None]:
# Write the cleaned frame to disk, leaving the index out of the file.
print("Saving cleaned data to CSV...")
output_csv = "Cleaned_IPL_Auction_Data.csv"
df.to_csv(output_csv, index=False)
print("File saved successfully.")