# Sales Data Analysis Assignment
**Objective:**
- Load and analyze a dataset using the pandas library in Python.
- Create simple plots and charts with matplotlib and seaborn for visualizing the data.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np

In [None]:
# Simulate a sales dataset
# A fixed seed makes the random draws reproducible, so the tables and charts
# produced from `df` are the same on every run of the notebook.
RANDOM_SEED = 42
rng = np.random.default_rng(RANDOM_SEED)
n_days = 30  # one row per calendar day

data = {
    'Date': pd.date_range(start='2025-01-01', periods=n_days, freq='D'),
    'Region': rng.choice(['North', 'South', 'East', 'West'], size=n_days),
    # rng.integers excludes the upper bound: Sales in 1000..4999, Profit in 100..999
    'Sales': rng.integers(1000, 5000, size=n_days),
    'Profit': rng.integers(100, 1000, size=n_days),
}
df = pd.DataFrame(data)

# Display first 5 rows
df.head()

In [None]:
# Print the column names, dtypes and non-null counts of the DataFrame
df.info()
# Count missing values per column (isna is the same method as isnull)
df.isna().sum()

In [None]:
# Summary statistics per column; the quartiles listed are pandas' defaults,
# written out so the reported percentiles are explicit.
df.describe(percentiles=[0.25, 0.5, 0.75])

In [None]:
# Mean Sales and Profit for each region (one row per region, indexed by Region)
metric_columns = ['Sales', 'Profit']
region_summary = df.groupby('Region')[metric_columns].agg('mean')
region_summary

In [None]:
# Line chart of the Sales column against Date, one marker per day
fig, ax = plt.subplots(figsize=(10, 5))
ax.plot(df['Date'], df['Sales'], label='Sales', color='blue', marker='o')
ax.set_title('Daily Sales Trend')
ax.set_xlabel('Date')
ax.set_ylabel('Sales')
plt.xticks(rotation=45)  # slant the date labels for readability
ax.legend()
fig.tight_layout()
plt.show()

In [None]:
# Bar chart of average sales per region.
# seaborn 0.13 deprecates passing `palette` without `hue`, so `hue` mirrors the
# x variable: each region still gets its own viridis colour, with no warning.
ax = sns.barplot(
    x=region_summary.index,
    y=region_summary['Sales'],
    hue=region_summary.index,
    palette='viridis',
    dodge=False,  # keep one full-width bar per region even though hue is set
)
# Some seaborn releases draw a legend for the redundant hue; remove it if present.
legend = ax.get_legend()
if legend is not None:
    legend.remove()
plt.title('Average Sales by Region')
plt.xlabel('Region')
plt.ylabel('Average Sales')
plt.show()

In [None]:
# Histogram of the Profit column split into 8 equal-width bins
fig, ax = plt.subplots()
ax.hist(df['Profit'], bins=8, edgecolor='black', color='orange')
ax.set_title('Profit Distribution')
ax.set_xlabel('Profit')
ax.set_ylabel('Frequency')
plt.show()

In [None]:
# Scatter of Profit against Sales, with points coloured by Region
ax = sns.scatterplot(
    data=df,
    x='Sales',
    y='Profit',
    hue='Region',
    palette='deep',
    s=80,
)
ax.set(title='Sales vs Profit by Region', xlabel='Sales', ylabel='Profit')
plt.show()

### Observations:
- Sales fluctuate daily but some regions have higher average sales.
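- Profit distribution: the simulated profits are drawn uniformly between 100 and 999, so the histogram is roughly flat; with only 30 values, any apparent mid-range peak or scarcity of extremes is sampling noise.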
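- In real sales data, higher sales tend to generate higher profits. In this simulation, however, Sales and Profit are drawn independently, so any positive relationship seen in the scatter plot is due to chance.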