# Supermarket Sales Analysis

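This notebook is an exploratory analysis of supermarket sales data. It covers headline metrics (total sales, order count, average order value, gross income), monthly sales trends, sales by product category, the sales distribution by customer type, and the mix of payment methods.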

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Global plotting defaults for every figure in this notebook.
# `sns.set_theme` is the preferred spelling; `sns.set` is only a legacy alias
# for it. The theme call comes first because it may rewrite matplotlib
# rcParams; the figure size is applied afterwards so it is not overridden.
sns.set_theme(style='whitegrid')
plt.rcParams['figure.figsize'] = (12, 6)


In [None]:
# Read the cleaned sales CSV and convert the 'Date' column to datetimes
# in a single chained expression, then preview the first rows.
df = pd.read_csv('../data/supermarket_sales_cleaned.csv').assign(
    Date=lambda frame: pd.to_datetime(frame['Date'])
)
df.head()

## Key Metrics

In [None]:
# Headline figures computed over every row of the frame.
# The order count is simply the number of rows in `df`.
total_orders = len(df)
total_sales = df['Sales'].sum()
avg_order_value = df['Sales'].mean()
gross_income = df['gross_income'].sum()

# One print call; each metric is written on its own line.
print(
    f"Total Sales: ${total_sales:,.2f}",
    f"Total Orders: {total_orders}",
    f"Average Order Value: ${avg_order_value:.2f}",
    f"Gross Income: ${gross_income:,.2f}",
    sep="\n",
)

## Monthly Sales

In [None]:
# Total sales per month, plotted in chronological order.
#
# The month order is derived from the data instead of being hard-coded to
# January-March: each 'Month' label is taken in order of first appearance
# once the rows are sorted by 'Date'. Months outside the first quarter are
# therefore no longer silently dropped from the chart.
# NOTE(review): assumes each row's 'Month' label matches its 'Date' - confirm
# against the cleaning step that produced the CSV.
month_order = df.sort_values('Date')['Month'].dropna().unique()
monthly_sales = df.groupby('Month')['Sales'].sum().reindex(month_order)

# Draw on an explicit Axes so labels are attached to this figure only.
fig, ax = plt.subplots()
monthly_sales.plot(kind='bar', color='skyblue', title='Sales by Month', ax=ax)
ax.set_ylabel('Sales')
plt.show()

## Sales by Category

In [None]:
# Sum sales within each category and sort ascending by total before
# drawing the horizontal bar chart.
category_sales = df.groupby('Category')['Sales'].sum().sort_values()

fig, ax = plt.subplots()
category_sales.plot.barh(ax=ax, color='salmon', title='Sales by Category')
ax.set_xlabel('Sales')
plt.show()

## Customer Type Analysis

In [None]:
# Box plot of the 'Sales' values for each 'Customer type' group,
# drawn on an explicitly created Axes.
fig, ax = plt.subplots()
sns.boxplot(data=df, x='Customer type', y='Sales', ax=ax)
ax.set_title('Sales Distribution by Customer Type')
plt.show()

## Payment Methods

In [None]:
# Share of rows per payment method, shown as a pie chart with
# percentage labels on each wedge.
payment_counts = df['Payment'].value_counts()

fig, ax = plt.subplots()
payment_counts.plot.pie(ax=ax, autopct='%1.1f%%', startangle=140)
ax.set_title('Payment Method Distribution')
ax.set_ylabel('')  # blank out the y-axis label that the pie plot adds by default
plt.show()