# Project 1: Simple Data Analytics – Sales Data Analysis

## 📌 Objective:
Analyze a fictional sales dataset using basic statistics and visualizations to understand product-wise and region-wise performance.

## 📦 Step 1: Import Libraries

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Apply seaborn's "whitegrid" theme to every plot drawn after this point.
# set_theme() is the preferred interface; sns.set() is only an alias for it
# and may be removed in a future seaborn release.
sns.set_theme(style="whitegrid")

## 🔄 Step 2: Load Dataset

In [None]:
# Read the sales records from the CSV file into a DataFrame
sales_df = pd.read_csv(filepath_or_buffer="sales_data.csv")

# Preview the first five rows of the loaded data
sales_df.head(n=5)

## 📊 Step 3: Descriptive Statistics

In [None]:
# Summary statistics for the loaded sales data. With pandas' defaults,
# describe() reports count, mean, std, min, quartiles and max for the
# numeric columns (presumably including 'Total Sales' -- confirm dtypes).
sales_df.describe()

## 📈 Step 4: Total Sales by Product

In [None]:
# Aggregate revenue per product: one row per 'Product' holding the sum of
# its 'Total Sales' values.
product_sales = sales_df.groupby('Product')['Total Sales'].sum().reset_index()

plt.figure(figsize=(8, 5))
# Colour each bar by product. seaborn >= 0.13 deprecates passing `palette`
# without `hue`, so 'Product' is mapped to hue as well; dodge=False keeps a
# single full-width bar per product on older seaborn versions too.
ax = sns.barplot(
    data=product_sales,
    x='Product',
    y='Total Sales',
    hue='Product',
    palette='viridis',
    dodge=False,
)
# A hue legend would only repeat the x-axis labels; drop it if seaborn added one.
legend = ax.get_legend()
if legend is not None:
    legend.remove()
plt.title('Total Sales by Product')
plt.tight_layout()
# Write the chart to disk, then display it.
plt.savefig("bar_chart_product_sales.png")
plt.show()

## 🧭 Step 5: Sales Distribution by Region

In [None]:
# Sum 'Total Sales' within each region; reset_index() turns 'Region' back
# into an ordinary column so it can be used for the slice labels.
region_sales = (
    sales_df
    .groupby('Region')['Total Sales']
    .sum()
    .reset_index()
)

# One square figure holding a single pie: each slice is a region's share of
# the summed sales, annotated with its percentage to one decimal place.
fig, ax = plt.subplots(figsize=(6, 6))
ax.pie(
    region_sales['Total Sales'],
    labels=region_sales['Region'],
    autopct='%1.1f%%',
    colors=sns.color_palette('pastel'),
)
ax.set_title('Sales Distribution by Region')
fig.tight_layout()
# Write the chart to disk, then display it.
fig.savefig("pie_chart_region_sales.png")
plt.show()

## ✅ Insights:
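- Highest-revenue product: Product X (the tallest bar in the Step 4 bar chart)
- Top sales contributor by region: Region Y (the largest slice in the Step 5 pie chart)
- Overall performance trend: summarize what the two charts show together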