<a href="https://colab.research.google.com/github/abinayalakshmi852-spec/sales-data-analysis-python/blob/main/Week2_Sales_Data_Analysis.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import pandas as pd
import numpy as np

# -----------------------------
# 1. Create Sales Dataset
# -----------------------------
np.random.seed(42)

orders = 50
data = {
    "Order_ID": range(1001, 1001 + orders),
    "Order_Date": pd.date_range(start="2024-01-01", periods=orders, freq="D"),
    "Product": np.random.choice(
        ["Laptop", "Mobile", "Headphones", "Keyboard", "Mouse", "Monitor"],
        orders
    ),
    "Category": np.random.choice(
        ["Electronics", "Accessories"],
        orders
    ),
    "Quantity": np.random.randint(1, 6, orders),
    "Price": np.random.randint(500, 50000, orders)
}

df = pd.DataFrame(data)

# -----------------------------
# 2. Calculate Total Sales Amount
# -----------------------------
df["Total_Sales"] = df["Quantity"] * df["Price"]

# -----------------------------
# 3. Overall Sales Summary
# -----------------------------
total_revenue = df["Total_Sales"].sum()
total_orders = df["Order_ID"].nunique()

# -----------------------------
# 4. Product-wise Sales Analysis
# -----------------------------
product_sales = df.groupby("Product")["Total_Sales"].sum().reset_index()

# -----------------------------
# 5. Category-wise Sales Analysis
# -----------------------------
category_sales = df.groupby("Category")["Total_Sales"].sum().reset_index()

# -----------------------------
# 6. Monthly Sales Analysis
# -----------------------------
df["Month"] = df["Order_Date"].dt.month
monthly_sales = df.groupby("Month")["Total_Sales"].sum().reset_index()

# -----------------------------
# 7. Business Summary
# -----------------------------
print("----- BUSINESS SUMMARY -----")
print(f"Total Revenue Generated: ₹{total_revenue}")
print(f"Total Orders Placed: {total_orders}")

top_product = product_sales.sort_values("Total_Sales", ascending=False).iloc[0]
low_product = product_sales.sort_values("Total_Sales").iloc[0]

print(f"Top Performing Product: {top_product['Product']} (₹{top_product['Total_Sales']})")
print(f"Lowest Performing Product: {low_product['Product']} (₹{low_product['Total_Sales']})")

top_category = category_sales.sort_values("Total_Sales", ascending=False).iloc[0]
print(f"Best Performing Category: {top_category['Category']}")

best_month = monthly_sales.sort_values("Total_Sales", ascending=False).iloc[0]
print(f"Highest Sales Month: Month {best_month['Month']}")

# -----------------------------
# 8. Export Final Dataset
# -----------------------------
df.to_csv("week2_sales_analysis_output.csv", index=False)

print("\nFile exported successfully: week2_sales_analysis_output.csv")

----- BUSINESS SUMMARY -----
Total Revenue Generated: ₹3651204
Total Orders Placed: 50
Top Performing Product: Mouse (₹911216)
Lowest Performing Product: Laptop (₹265625)
Best Performing Category: Accessories
Highest Sales Month: Month 1

File exported successfully: week2_sales_analysis_output.csv
