# 🧮 Descriptive Statistics with Pandas (Retail Sales Example)
This notebook introduces basic descriptive statistics techniques using a sample retail sales dataset.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Sample retail sales data, written one record per row for readability and
# then pivoted into the column-oriented dict that the DataFrame is built from.
sales_columns = ('Product', 'Category', 'Price', 'Units_Sold')
sales_rows = [
    ('Shirt', 'Clothing', 25.99, 120),
    ('Pants', 'Clothing', 35.50, 80),
    ('Shoes', 'Footwear', 60.00, 60),
    ('Shirt', 'Clothing', 22.50, 150),
    ('Shoes', 'Footwear', 65.00, 50),
    ('Pants', 'Clothing', 40.00, 90),
    ('Shirt', 'Clothing', 20.00, 130),
    ('Shoes', 'Footwear', 55.00, 65),
    ('Pants', 'Clothing', 38.00, 85),
    ('Shirt', 'Clothing', 23.99, 140),
]

# zip(*sales_rows) transposes the records into one tuple per column.
data = {
    column: list(values)
    for column, values in zip(sales_columns, zip(*sales_rows))
}

df = pd.DataFrame(data)
df.head()

## 1️⃣ Basic Summary
Use `describe()` to view summary statistics for numeric columns.

In [None]:
# Summary statistics for the numeric columns; a bare last expression
# renders the result as the cell output.
summary_stats = df.describe()
summary_stats

## 2️⃣ Category Analysis
Count how many sales records (rows) fall into each category. Note that this counts rows, not distinct products.

In [None]:
# Number of rows per category value, most frequent first.
category_counts = df['Category'].value_counts()
category_counts

## 3️⃣ Individual Stats
Compute the mean, median, and sample standard deviation (the pandas default, `ddof=1`) for specific columns.

In [None]:
# Pair each label with its statistic, then print them in the same order.
labelled_stats = [
    ("Mean Price:", df['Price'].mean()),
    ("Median Units Sold:", df['Units_Sold'].median()),
    ("Std Dev of Price:", df['Price'].std()),
]
for label, value in labelled_stats:
    print(label, value)

## 4️⃣ Grouped Summary
Average price by product category.

In [None]:
# Unweighted mean of Price over the rows in each category.
prices_by_category = df.groupby('Category')['Price']
mean_price_by_category = prices_by_category.mean()
mean_price_by_category

## 5️⃣ Visual Summary
Boxplot of price by category using seaborn.

In [None]:
# sns.boxplot draws on the current Axes and returns it, so the title can be
# set on that Axes object directly rather than through pyplot's implicit state.
ax = sns.boxplot(data=df, x='Category', y='Price')
ax.set_title("Price Distribution by Category")
plt.show()