# 📊 Sales Data Analysis

This notebook demonstrates loading, exploring, analyzing, and visualizing a dataset using **pandas** and **matplotlib**.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the sales records from the CSV file into the working DataFrame.
df = pd.read_csv(filepath_or_buffer='data/sales.csv')
print("✅ Dataset Loaded Successfully")

# Preview the first five rows (rendered as this cell's output).
df.head(n=5)

In [None]:
# Explore dataset
# Column names, dtypes and non-null counts; info() prints its report directly.
df.info()

# A notebook cell only renders its LAST bare expression, so the summary
# statistics have to be displayed explicitly or they are silently discarded.
display(df.describe())

# Check missing values: per-column count of nulls (rendered as the cell output).
df.isnull().sum()

In [None]:
# Fill missing values, restricted to numeric columns.
# A blanket fillna(0) would also write 0 into text/date columns (e.g. 'Region'
# or 'Date'), which then shows up as a spurious "0" group in group-bys and as a
# bogus value when the column is parsed with pd.to_datetime.
numeric_cols = df.select_dtypes(include='number').columns
df = df.fillna(dict.fromkeys(numeric_cols, 0))

# Preview the frame after filling.
df.head()

In [None]:
# Basic analysis: average 'Sales' per 'Region'.
# The grouping is only attempted when the frame has a 'Region' column.
if 'Region' not in df.columns:
    print("No 'Region' column found. Skipping grouping.")
else:
    print(
        df.groupby('Region')['Sales'].mean()
    )

In [None]:
# 1️⃣ Line Chart: Sales over Time
# Drawn only when the frame has a 'Date' column.
if 'Date' in df.columns:
    # Parse the column to datetimes before grouping on it.
    df['Date'] = pd.to_datetime(df['Date'])

    # Total sales per date, plotted as a line.
    ax = (
        df.groupby('Date')['Sales']
        .sum()
        .plot.line(figsize=(8, 5), title='Sales Over Time')
    )
    ax.set_ylabel('Sales')
    plt.show()

In [None]:
# 2️⃣ Bar Chart: Average Sales by Region
# Drawn only when the frame has a 'Region' column.
if 'Region' in df.columns:
    # One bar per region, bar height = mean of 'Sales' in that region.
    ax = (
        df.groupby('Region')['Sales']
        .mean()
        .plot.bar(figsize=(8, 5), title='Average Sales by Region')
    )
    ax.set_ylabel('Average Sales')
    plt.show()

In [None]:
# 3️⃣ Histogram: Distribution of Sales
# Ten equal-width bins over the 'Sales' column.
ax = df['Sales'].plot.hist(bins=10, figsize=(8, 5), title='Sales Distribution')
ax.set_xlabel('Sales')
plt.show()

In [None]:
# 4️⃣ Scatter Plot: Sales vs Profit
# Drawn only when the frame has a 'Profit' column ('Sales' is not checked here).
if 'Profit' in df.columns:
    df.plot.scatter(
        x='Sales',
        y='Profit',
        title='Sales vs Profit',
        figsize=(8, 5),
    )
    plt.show()