In [1]:
import pandas as pd

# Load the sales dataset from the CSV file into a DataFrame
SALES_CSV = "online_store_sales.csv"
df = pd.read_csv(SALES_CSV)

# 1. Classify orders by value by applying a helper to each Order_Amount
def _order_value_label(amount):
    """Return the value tier label for a single order amount.

    Amounts of 500 or more are "High Value", amounts of at least 200 (but
    below 500) are "Medium Value", and anything else is "Low Value".
    """
    if amount >= 500:
        return "High Value"
    if amount >= 200:
        return "Medium Value"
    return "Low Value"


df["Order_Value"] = df["Order_Amount"].apply(_order_value_label)

# 2. Per-category summary: total revenue, average order amount, total quantity
orders_by_category = df.groupby("Category")
category_summary = orders_by_category.agg(
    Total_Revenue=pd.NamedAgg(column="Order_Amount", aggfunc="sum"),
    Avg_Order_Amount=pd.NamedAgg(column="Order_Amount", aggfunc="mean"),
    Total_Quantity=pd.NamedAgg(column="Quantity", aggfunc="sum"),
)

# 3. Per-city spending summary: total and mean Order_Amount, plus the number
#    of non-null Order_ID values in each city
city_metrics = {
    "Total_Spending": ("Order_Amount", "sum"),
    "Avg_Spending": ("Order_Amount", "mean"),
    "Orders_Count": ("Order_ID", "count"),
}
city_summary = df.groupby("City").agg(**city_metrics)

# 4. Revenue comparison: one row per Category, one column per City,
#    each cell holding the summed Order_Amount
pivot_table = df.pivot_table(
    index="Category",
    columns="City",
    values="Order_Amount",
    aggfunc="sum",
    fill_value=0,  # show 0 for Category/City combinations with no data
)

# 5. Rank products by total quantity sold, largest totals first
quantity_by_product = df.groupby("Product_Name")["Quantity"].sum()
top_products = quantity_by_product.sort_values(ascending=False)

# Display results.
# Each heading and its table are passed as separate arguments joined with
# sep="\n". With print()'s default separator (" ") a space is emitted between
# the heading's newline and the table, which shifts the table's first row
# (the column headers) one character to the right of the rows below it.
print("Category Summary:", category_summary, sep="\n")
print("\nCity Summary:", city_summary, sep="\n")
print("\nPivot Table (Revenue by Category & City):", pivot_table, sep="\n")
# Only the ten products with the highest total quantity are shown.
print("\nTop-Selling Products:", top_products.head(10), sep="\n")


Category Summary:
              Total_Revenue  Avg_Order_Amount  Total_Quantity
Category                                                    
Books                 4874        487.400000              27
Electronics          24309        517.212766             135
Fashion              21745        505.697674             124

City Summary:
                Total_Spending  Avg_Spending  Orders_Count
City                                                     
Chicago                  8491    566.066667            15
Houston                 11007    647.470588            17
Los Angeles              9154    457.700000            20
Miami                    4609    512.111111             9
New York                 7390    369.500000            20
San Francisco           10277    540.894737            19

Pivot Table (Revenue by Category & City):
 City         Chicago  Houston  Los Angeles  Miami  New York  San Francisco
Category                                                                  
Bo