# 🛒 Retail Company Performance Analysis
Analyze sales data to extract performance insights by region, category, and time.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np
import warnings
warnings.filterwarnings('ignore')

In [None]:
# Read the raw retail CSV; the 'Date' column is parsed into datetimes on load.
df = pd.read_csv(
    'data/retail_raw.csv',
    parse_dates=['Date'],
)

# Preview the first rows (shown as the cell output when run in a notebook).
df.head()

In [None]:
# Print a concise structural summary of the DataFrame.
df.info()

# Count missing values per column (isna is the same check as isnull).
df.isna().sum()

In [None]:
# Aggregate sales per region, ordered from the largest total to the smallest.
region_sales = (
    df.groupby('Region')['Sales']
    .sum()
    .sort_values(ascending=False)
)

# Bar chart of the regional totals; title and axis labels are set on the
# Axes object that seaborn returns.
plt.figure(figsize=(8, 5))
sns.barplot(
    x=region_sales.index,
    y=region_sales.values,
    palette='Blues_d',
).set(title='Total Sales by Region', xlabel='Region', ylabel='Sales')
plt.tight_layout()
plt.show()

In [None]:
# Sum profit within each category, ordered ascending (lowest profit first).
category_profit = (
    df.groupby('Category')['Profit']
    .sum()
    .sort_values(ascending=True)
)

# Bar chart of profit per category on a fresh 8x5 figure.
plt.figure(figsize=(8, 5))
sns.barplot(
    x=category_profit.index,
    y=category_profit.values,
    palette='Greens_r',
)
# Title and axis labels are applied to the current axes in a single call.
plt.gca().set(title='Total Profit by Category', xlabel='Category', ylabel='Profit')
plt.tight_layout()
plt.show()

In [None]:
# Bucket every row into its calendar month; this adds a 'Month' column to df.
df['Month'] = df['Date'].dt.to_period(freq='M')

# Total sales per month.
monthly_sales = df.groupby('Month')['Sales'].sum()

# Line chart with a marker at each month; axis labels are set on the Axes
# returned by the pandas plotting call.
monthly_sales.plot.line(
    marker='o',
    figsize=(10, 5),
    title='Monthly Sales Trend',
).set(ylabel='Sales', xlabel='Month')
plt.grid(True)
plt.tight_layout()
plt.show()

### 💡 Key Business Insights
- Western region generated the highest total sales.
- Furniture category showed high sales but lower profit margins.
- Seasonal trends were observed in monthly sales — an opportunity to optimize inventory.
- High discounts correlated with reduced profit in some categories.