# Exploratory Data Analysis of Supply Chain Data

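This notebook performs exploratory data analysis on our supply chain data to identify patterns, trends, and potential areas for optimization. It covers a basic data overview (summary statistics and missing values), a time series view of daily order volumes, and a per-supplier performance summary.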

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

%matplotlib inline
plt.style.use('seaborn')

In [None]:
# Read the supply chain records from the CSV file into a DataFrame.
# The path is relative to the notebook's working directory.
df = pd.read_csv('../data/supply_chain_data.csv')

# Report the (rows, columns) dimensions of the loaded frame
print(f"Dataset shape: {df.shape}")

# Preview the first five rows as the cell's rendered output
df.head(5)

## Data Overview and Basic Statistics

In [None]:
# Summary statistics of the dataset (describe() defaults).
# Only a cell's final expression is rendered automatically, so this
# intermediate result must be passed to display() explicitly; otherwise the
# "Basic Statistics:" heading is printed with no table beneath it.
# display() is available without an import inside an IPython/Jupyter kernel.
print("\nBasic Statistics:")
display(df.describe())

# Number of missing values per column; as the last expression of the cell it
# is rendered automatically.
print("\nMissing Values:")
df.isnull().sum()

## Time Series Analysis

In [None]:
# Parse the 'date' column into pandas datetime values (stored back on df)
df['date'] = pd.to_datetime(df['date'])

# Total order volume for each distinct 'date' value
daily_volume = df.groupby('date')['order_volume'].sum()

# Draw the totals as a line chart on an explicitly created figure/axes pair
fig, ax = plt.subplots(figsize=(15, 6))
daily_volume.plot(ax=ax)
ax.set_title('Daily Order Volumes')
ax.set_xlabel('Date')
ax.set_ylabel('Order Volume')
plt.show()

## Supplier Analysis

In [None]:
# Build one row per supplier_id: mean delivery time, total order volume and
# mean quality score, each rounded to two decimal places.
supplier_metrics = (
    df.groupby('supplier_id')
    .agg(
        delivery_time=('delivery_time', 'mean'),
        order_volume=('order_volume', 'sum'),
        quality_score=('quality_score', 'mean'),
    )
    .round(2)
)

print("Supplier Performance Metrics:")
# Show the ten suppliers with the highest mean quality score
supplier_metrics.sort_values(by='quality_score', ascending=False).head(10)