# 🛍 MarketEdge Retail Analytics — Profitability Insights
This notebook explores store-level sales and profitability trends for a mid-market retail chain using sample data.

### Objectives
- Identify margin leakage across stores
- Highlight top-performing stores and products
- Generate visuals for Tableau dashboard integration

In [None]:
# 🧩 Import Libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
# Configure seaborn's global plot styling once for every figure below:
# 'whitegrid' style, 'muted' colour palette, and fonts scaled by 1.1.
sns.set(style='whitegrid', palette='muted', font_scale=1.1)

In [None]:
# 📥 Load Sample Dataset
# Read the sample sales CSV into `sales`. The path is relative, so it is
# resolved against the kernel's current working directory.
sales = pd.read_csv(filepath_or_buffer='../data/sample_sales_data.csv')
# Show the first five rows as a quick look at the loaded columns.
sales.head(n=5)

In [None]:
# 🧹 Data Cleaning
# Drop fully duplicated rows and parse the `date` column with pd.to_datetime,
# rebinding `sales` to the cleaned frame instead of mutating it in place.
sales = (
    sales
    .drop_duplicates()
    .assign(date=lambda frame: pd.to_datetime(frame['date']))
)
# Print the per-column summary of the cleaned frame.
sales.info()

In [None]:
# 💰 Calculate Profit Margins
# Absolute margin per row: revenue minus cost.
sales['margin'] = sales['revenue'] - sales['cost']
# Margin as a percentage of revenue.
sales['margin_pct'] = (sales['margin'] / sales['revenue']) * 100
# A row with zero revenue has no meaningful percentage margin. The division
# above yields ±inf (or NaN for 0/0) for such rows, and a single inf would
# distort the mean/std/max reported by describe(), so mark them as missing.
sales.loc[sales['revenue'] == 0, 'margin_pct'] = np.nan
# Summary statistics for the monetary columns and the derived margins.
sales.describe()[['revenue', 'cost', 'margin', 'margin_pct']]

In [None]:
# 📊 Pareto (80/20) Analysis — Stores Driving 80% of Total Margin
# Total margin per store, ranked from highest to lowest, plus the running
# share of overall margin (in percent) accumulated down that ranking.
pareto = (
    sales
    .groupby('store')['margin']
    .sum()
    .reset_index()
    .sort_values('margin', ascending=False)
    .assign(
        cum_margin_pct=lambda ranked: ranked['margin'].cumsum() / ranked['margin'].sum() * 100
    )
)
# Preview the highest-margin stores.
pareto.head()

In [None]:
# 🖼️ Visualization: Top Stores by Margin
# `pareto` is sorted by total margin (descending), so head(10) is the top ten.
top_stores = pareto.head(10)
plt.figure(figsize=(10,6))
# Pin the bar order to the margin ranking. Without `order`, seaborn sorts
# numeric category values, so if `store` holds numeric IDs (its dtype is not
# visible here) the bars would be arranged by ID rather than by margin.
sns.barplot(
    data=top_stores,
    x='store',
    y='margin',
    order=top_stores['store'].tolist(),
    palette='Spectral',
)
plt.title('Top 10 Stores by Margin', fontsize=14, weight='bold')
plt.xlabel('Store')
plt.ylabel('Total Margin ($)')
plt.tight_layout()
# Save the chart to disk before plt.show() displays the figure.
plt.savefig('../visuals/store_profitability_chart.png', bbox_inches='tight')
plt.show()

In [None]:
# 💡 Key Insights Summary
# `pareto` is ranked by margin (descending). A store belongs to the group that
# drives 80% of margin when the cumulative share *before* it is still under 80.
# This keeps the store that crosses the threshold; filtering on
# `cum_margin_pct <= 80` would drop it and could even select no stores at all
# when the top store alone exceeds 80%.
share_before_store = pareto['cum_margin_pct'].shift(fill_value=0)
top_20 = pareto[share_before_store < 80]
print(f"Number of stores driving 80% of total margin: {len(top_20)}")
print(f"Total margin from these stores: ${top_20['margin'].sum():,.2f}")