# E-commerce Data Analysis (Python)

This notebook demonstrates cleaning, exploration, and visualization of the synthetic e-commerce dataset.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Load the order records. OrderDate is parsed to datetime while reading,
# which is what the sales-trend cell groups on.
df = pd.read_csv(
    '../data/ecommerce_sales_data.csv',
    parse_dates=['OrderDate'],
)

## Data Cleaning: Inspecting Column Types and Missing Values

In [None]:
# DataFrame.info() writes its report straight to stdout and returns None,
# so it is called bare; wrapping it in print() would append a stray "None".
df.info()

# Missing-value count for every column.
print(df.isnull().sum())

## Sales Trend Over Time

In [None]:
# Total OrderAmount per distinct OrderDate value.
# NOTE(review): this is a *daily* series only if OrderDate carries no
# time-of-day component — confirm against the CSV.
daily_sales = df.groupby('OrderDate')['OrderAmount'].sum()

fig, ax = plt.subplots(figsize=(12, 5))
daily_sales.plot(ax=ax)
ax.set_title('Daily Sales Trend')
ax.set_xlabel('Date')
ax.set_ylabel('Total Sales ($)')
fig.tight_layout()

# Persist the chart before showing it.
fig.savefig('../visualizations/sales_trends.png')
plt.show()

## Average Order Amount by Region

In [None]:
# Bar height is the mean OrderAmount per Region (barplot's default estimator).
# errorbar=None switches the error bars off; it replaces ci=None, which
# seaborn deprecated in v0.12 and which triggers a FutureWarning there.
fig, ax = plt.subplots(figsize=(8, 5))
sns.barplot(data=df, x='Region', y='OrderAmount', errorbar=None, ax=ax)
ax.set_title('Average Order Amount by Region')
# Label the axis as an average; the default would be the raw column name.
ax.set_ylabel('Average Order Amount ($)')
fig.tight_layout()
fig.savefig('../visualizations/region_avg_order.png')
plt.show()

## Product Category vs Payment Method (Heatmap)

In [None]:
# Cross-tabulate summed OrderAmount: one row per ProductCategory,
# one column per PaymentMethod.
pivot = df.pivot_table(
    values='OrderAmount',
    index='ProductCategory',
    columns='PaymentMethod',
    aggfunc='sum',
)

fig, ax = plt.subplots(figsize=(8, 5))
# annot + fmt='.0f' prints each cell's total without decimals.
sns.heatmap(pivot, annot=True, fmt='.0f', cmap='Blues', ax=ax)
ax.set_title('Sales by Product Category and Payment Method')
fig.tight_layout()
fig.savefig('../visualizations/category_heatmap.png')
plt.show()

## Customer Age vs. Order Amount

In [None]:
# One point per row of df: Age on x, OrderAmount on y, coloured by Gender.
# alpha=0.7 makes the markers partly transparent.
fig, ax = plt.subplots(figsize=(8, 5))
sns.scatterplot(
    data=df,
    x='Age',
    y='OrderAmount',
    hue='Gender',
    alpha=0.7,
    ax=ax,
)
ax.set_title('Customer Age vs. Order Amount')
fig.tight_layout()
fig.savefig('../visualizations/age_vs_order.png')
plt.show()