# 📦 Amazon Sales Data Analysis & Visualization
This notebook analyzes Amazon sales data to identify key trends, top-performing products, and customer behavior.

In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the sales CSV and convert its 'Date' column to datetimes in one chained step.
df = pd.read_csv('amazon_sales_data.csv').assign(
    Date=lambda frame: pd.to_datetime(frame['Date'])
)
# Preview the first rows as the cell output.
df.head()


FileNotFoundError: [Errno 2] No such file or directory: 'amazon_sales_data.csv'

In [None]:
# Overview of the loaded frame.
# df.info() prints its report directly, but df.describe() only *returns* a
# frame: a notebook renders just the last expression of a cell, so the summary
# is captured here (before the derived columns exist) and emitted at the end.
df.info()
summary_stats = df.describe()

# Add Month and Year columns derived from 'Date'.
df['Month'] = df['Date'].dt.to_period('M')  # monthly Period values
df['Year'] = df['Date'].dt.year

# Last expression of the cell -> rendered as the cell's rich output.
summary_stats


In [None]:
# Total revenue per calendar month, flattened back to a two-column frame.
monthly_revenue = df.groupby('Month')['Revenue'].sum().reset_index()

# 'Month' holds pandas Period values. seaborn/matplotlib do not reliably know
# how to place Period objects on an axis (typically a TypeError unless pandas'
# unit converters happen to be registered), so plot month-start timestamps.
monthly_revenue['Month'] = monthly_revenue['Month'].dt.to_timestamp()

# Line chart of the monthly totals, one marker per month.
plt.figure(figsize=(10, 5))
sns.lineplot(data=monthly_revenue, x='Month', y='Revenue', marker='o')
plt.title("Monthly Revenue Trend")
plt.ylabel("Revenue ($)")
plt.xticks(rotation=45)
plt.grid(True)
plt.tight_layout()
plt.show()


In [None]:
# Units sold summed per product; keep the ten largest totals, highest first.
top_products = (
    df.groupby('Product')['Units Sold']
    .sum()
    .sort_values(ascending=False)
    .head(10)
)

# Draw the bar chart and decorate it through the Axes that pandas returns.
ax = top_products.plot.bar(figsize=(10, 5), color='skyblue')
ax.set_title("Top 10 Best-Selling Products")
ax.set_ylabel("Units Sold")
plt.xticks(rotation=45)
ax.grid(axis='y')  # horizontal guide lines only
ax.figure.tight_layout()
plt.show()


In [None]:
# Revenue summed per category, drawn as each category's share of the total.
category_sales = df.groupby('Category')['Revenue'].sum()

ax = category_sales.plot.pie(autopct='%1.1f%%', figsize=(7, 7))
ax.set_title("Sales Distribution by Category")
ax.set_ylabel("")  # blank out the y-axis label on the pie
plt.show()


In [None]:
# Revenue summed per country, ordered from highest to lowest.
country_sales = (
    df.groupby('Country')['Revenue']
    .sum()
    .sort_values(ascending=False)
)

# Bar chart decorated through the Axes that pandas returns.
ax = country_sales.plot.bar(color='coral', figsize=(8, 5))
ax.set_title("Sales by Country")
ax.set_ylabel("Revenue ($)")
plt.xticks(rotation=45)
ax.figure.tight_layout()
plt.show()


In [1]:
# Histogram of the 'Rating' column (5 bins) with a KDE curve overlaid.
ax = sns.histplot(data=df, x='Rating', bins=5, kde=True, color='green')
ax.set_title("Distribution of Product Ratings")
ax.set_xlabel("Rating")
ax.set_ylabel("Frequency")
ax.grid(True)
plt.show()


NameError: name 'sns' is not defined

## ✅ Key Insights
- Revenue peaked in certain months, which suggests seasonal demand patterns.
- The Electronics and Home categories were the top contributors to revenue.
- The USA led in revenue generation.
- Customer ratings are mostly between 3 and 5 stars.

## Tools Used
- Python, Pandas, Matplotlib, Seaborn

Prepared by: **Ada Akuma**
