# E-commerce Customer Reviews Data Cleaning 🚀

In [None]:

import pandas as pd

# Read the raw reviews export into a DataFrame
df = pd.read_csv(filepath_or_buffer="ecommerce_reviews.csv")

# Preview the first five rows (shown as the cell's output)
df.head(n=5)


## Handling Missing Values

In [None]:

# Report how many values are missing in each column before cleaning
print("Missing Values Before Cleaning:\n", df.isnull().sum())

# Placeholder to use for each text column that may contain missing values
text_defaults = {
    "Customer_Name": "Unknown",
    "Review_Text": "No review provided",
}

# Assign the filled column back to the frame. Calling
# df[col].fillna(..., inplace=True) works on a temporary Series: it triggers a
# chained-assignment FutureWarning on pandas 2.x and does not update df at all
# once Copy-on-Write is enabled (the default in pandas 3.0).
for column, placeholder in text_defaults.items():
    df[column] = df[column].fillna(placeholder)

# Report the per-column missing counts again to confirm the fill took effect
print("Missing Values After Cleaning:\n", df.isnull().sum())


## Removing Duplicate Rows

In [None]:

# Count rows that are exact repeats of an earlier row
duplicates_before = df.duplicated().sum()
print("Duplicate Rows Before:", duplicates_before)

# Drop the repeats in place, keeping the first occurrence of each row
df.drop_duplicates(keep="first", inplace=True)

# Count again to confirm no repeated rows remain
duplicates_after = df.duplicated().sum()
print("Duplicate Rows After:", duplicates_after)


## Fixing Incorrect Ratings

In [None]:

# Fixing incorrect ratings (Valid range: 1 to 5)
# Coerce to numbers first: if the CSV column was parsed as text, comparing a
# string against 1 and 5 would raise TypeError. Unparseable entries become NaN.
ratings = pd.to_numeric(df["Rating"], errors="coerce")

# between() is inclusive on both ends and evaluates to False for NaN, so
# out-of-range, missing and unparseable ratings all fall back to the default 3.
df["Rating"] = ratings.where(ratings.between(1, 5), 3)

# Checking unique ratings after cleaning
df["Rating"].unique()


## Saving Cleaned Dataset

In [None]:

# Write the cleaned frame to a new CSV, leaving out the row index
df.to_csv(path_or_buf="ecommerce_reviews_cleaned.csv", index=False)

# Confirm where the output was written
print("Cleaned dataset saved as 'ecommerce_reviews_cleaned.csv'!")
