# 📊 Sales Data Analysis Project
---
This notebook demonstrates a simple **Data Analyst project** using Python, Pandas, and visualization libraries (Matplotlib & Seaborn).

In [None]:

# Step 1: Import Libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns


In [None]:

# Step 2: Load Dataset
# Read the raw sales records; the path is relative to the notebook's working directory.
df = pd.read_csv("sales.csv")

print("🔹 First 5 rows of data:")
display(df.head())

print("\n🔹 Dataset Info:")
# DataFrame.info() prints its summary itself and returns None, so wrapping it
# in display() would emit a stray "None" after the summary.
df.info()

print("\n🔹 Missing values:")
# Per-column count of null entries.
display(df.isnull().sum())


In [None]:

# Step 3: Data Cleaning
# Parse the Date column into datetime values so the .dt accessor can be used on it.
df['Date'] = pd.to_datetime(df['Date'])

# Add a derived "Total_Sales" column: per-row Quantity multiplied by Price.
df['Total_Sales'] = df['Quantity'] * df['Price']

print("\n🔹 Data after cleaning:")
display(df.head())


In [None]:

# Step 4: Descriptive Analysis

print("\n🔹 Total Sales by Category:")
# Sum of Total_Sales within each Category.
display(df.groupby('Category')['Total_Sales'].sum())

print("\n🔹 Best Selling Product:")
# nlargest(1) selects the product with the highest summed Total_Sales directly,
# rather than sorting every product and then taking the first row.
display(df.groupby('Product')['Total_Sales'].sum().nlargest(1))


In [None]:

# Step 5: Visualizations


def plot_total_sales_bar(data, group_col, title, palette, ylabel=None, rotate_xticks=0):
    """Draw a bar chart of summed ``Total_Sales`` for each value of ``group_col``.

    Parameters
    ----------
    data : pandas.DataFrame
        Frame containing ``group_col`` and a ``Total_Sales`` column.
    group_col : str
        Column whose distinct values become the bars.
    title : str
        Figure title.
    palette : str
        Seaborn palette name used to colour the bars.
    ylabel : str, optional
        Y-axis label; when omitted, seaborn's default (the column name) is kept.
    rotate_xticks : int, optional
        Rotation in degrees applied to the x tick labels (0 leaves them as-is).
    """
    # Aggregate once up front instead of passing estimator=sum on the raw rows:
    # seaborn would otherwise also bootstrap an error bar around each total,
    # which is costly and not meaningful for a sum.
    # sort=False keeps the groups in order of first appearance in the data.
    totals = data.groupby(group_col, sort=False, as_index=False)['Total_Sales'].sum()

    fig, ax = plt.subplots(figsize=(10, 6))
    # NOTE(review): seaborn 0.13+ is believed to emit a FutureWarning when
    # `palette` is given without `hue` -- confirm the installed version before
    # switching to hue=group_col, legend=False.
    sns.barplot(x=group_col, y='Total_Sales', data=totals, palette=palette, ax=ax)
    ax.set_title(title)
    if ylabel is not None:
        ax.set_ylabel(ylabel)
    if rotate_xticks:
        ax.tick_params(axis='x', rotation=rotate_xticks)
    plt.show()


# 5.1 Total Sales by Category
plot_total_sales_bar(
    df,
    group_col='Category',
    title="Total Sales by Category",
    palette='viridis',
    ylabel="Sales Amount",
)

# 5.2 Monthly Sales Trend
# Bucket rows by calendar month of Date and sum Total_Sales within each bucket.
monthly_sales = df.groupby(df['Date'].dt.to_period('M'))['Total_Sales'].sum()

fig, ax = plt.subplots(figsize=(10, 6))
monthly_sales.plot(kind='line', marker='o', color='blue', ax=ax)
ax.set_title("Monthly Sales Trend")
ax.set_xlabel("Month")
ax.set_ylabel("Total Sales")
plt.show()

# 5.3 Product-wise Sales
plot_total_sales_bar(
    df,
    group_col='Product',
    title="Product-wise Total Sales",
    palette='coolwarm',
    rotate_xticks=45,
)
