# Sales Data Analysis
This notebook explores a sales dataset to identify trends and patterns over time and to draw insights into profitability and cost structures.

In [None]:
# Import necessary libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

## Load and Explore Dataset

In [None]:
# Read the raw sales records from CSV.
# NOTE: 'sales_data.csv' is a placeholder path; swap in the actual dataset file.
sales_csv = 'sales_data.csv'
df = pd.read_csv(sales_csv)

# Preview the first five rows as the cell's output.
df.head(n=5)

## Data Cleaning & Preprocessing

In [None]:
# Count the missing entries in each column; the resulting Series is the cell's output.
missing_per_column = df.isna().sum()
missing_per_column

## Exploratory Data Analysis (EDA)

In [None]:
# Descriptive statistics for the frame (pandas summarizes the numeric columns by default).
summary_stats = df.describe()
summary_stats

### Visualization: Sales Trends Over Time

In [None]:
# Parse the 'Date' column to datetime and make it the index.
# The guard keeps this cell idempotent: after the first run 'Date' lives in the
# index rather than the columns, so an unguarded re-run would raise KeyError.
if 'Date' in df.columns:
    df = df.assign(Date=pd.to_datetime(df['Date'])).set_index('Date')

# Plot sales against the date index on an explicit Axes so the labels and title
# are attached to this figure rather than to pyplot's implicit "current" one.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(data=df, x=df.index, y='Sales', color='blue', ax=ax)
ax.set_title('Sales Trends Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Sales')
plt.show()

## Research Question
- How do manufacturing and freight costs impact overall profitability?

In [None]:
# Pairwise correlation between profit and the two cost columns
# (DataFrame.corr uses Pearson correlation by default).
cost_profit_cols = ['Profit', 'Manufacturing_Cost', 'Freight_Cost']
correlation = df[cost_profit_cols].corr()

# Pin the colour scale to the full correlation range [-1, 1], centred on 0, so
# the diverging 'coolwarm' palette maps its neutral colour to "no correlation"
# instead of to the midpoint of whatever values happen to be present.
fig, ax = plt.subplots()
sns.heatmap(
    correlation,
    annot=True,
    cmap='coolwarm',
    vmin=-1,
    vmax=1,
    center=0,
    ax=ax,
)
ax.set_title('Correlation Between Costs and Profit')
plt.show()

## Conclusion
Summarize here the insights drawn from the analysis above: sales trends over time, the impact of manufacturing and freight costs, and overall profitability patterns.