In [None]:
import pandas as pd
import matplotlib.pyplot as plt

### Example dataset — tiny sales log

In [None]:
# Tiny sales log: eight consecutive daily records starting 2023-01-01.
# The four-entry region, product and price patterns each repeat twice,
# so North/South rows are Widgets at 20.0 and East/West rows are Gadgets at 35.0.
data = {}
data["Date"] = pd.date_range(start="2023-01-01", periods=8, freq="D")
data["Region"] = 2 * ["North", "South", "East", "West"]
data["Product"] = 2 * ["Widget", "Widget", "Gadget", "Gadget"]
data["Units_Sold"] = [12, 8, 15, 7, 10, 14, 9, 11]
data["Unit_Price"] = 2 * [20.0, 20.0, 35.0, 35.0]

# One column per key, in insertion order.
df = pd.DataFrame(data=data)

### Calculate total revenue per row

In [None]:
# Row-level revenue: element-wise product of units sold and unit price,
# stored as a new "Revenue" column on the same frame.
df["Revenue"] = df["Units_Sold"].mul(df["Unit_Price"])

# Dump the whole frame (now including Revenue) as plain text.
print("Full dataset:\n", df)

### Filter for high-revenue rows (Revenue > 300)

In [None]:
# Keep only the individual sales rows whose revenue is strictly above 300;
# the comparison yields a boolean mask aligned with df's index.
high_perf = df.loc[df["Revenue"] > 300]
print("\nHigh revenue rows:\n", high_perf)

### Group by region, sum revenue & units sold

In [None]:
# Total units and revenue per region, ordered from highest to lowest revenue.
# Named aggregation keeps the output columns as Units_Sold, then Revenue.
summary = (
    df.groupby("Region")
    .agg(
        Units_Sold=("Units_Sold", "sum"),
        Revenue=("Revenue", "sum"),
    )
    .sort_values(by="Revenue", ascending=False)
)

print("\nRevenue by region:\n", summary)

### Plot the revenue by region

In [None]:
# Bar chart of per-region revenue; pandas returns the Axes it drew on,
# so labels and layout are applied to that object directly.
ax = summary["Revenue"].plot.bar(color="skyblue", title="Revenue by Region")
ax.set_ylabel("Revenue ($)")
ax.get_figure().tight_layout()
plt.show()