# Warehouse Data Analysis (Basic)
This notebook demonstrates basic data cleaning and descriptive analysis on the simulated warehouse dataset.

**Tools used:** Python (pandas, matplotlib)


In [None]:
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline
# Read the warehouse workbook, then convert both date columns to datetime.
df = pd.read_excel('warehouse_data.xlsx')
for date_col in ('Date_Received', 'Date_Issued'):
    df[date_col] = pd.to_datetime(df[date_col])

# Preview the first rows to confirm the load and the parsed dates.
df.head()

In [None]:
# Basic metrics
# Sum each stock column once so the ratios below share the same totals.
total_in = df['Stock_In'].sum()
total_out = df['Stock_Out'].sum()
current_total = df['Current_Stock'].sum()
abs_discrepancy_total = df['Discrepancy'].abs().sum()

# Both figures are percentages of total Stock_In.
# NOTE(review): "utilization" here is total Current_Stock over total Stock_In,
# not a per-row mean -- confirm this is the intended definition.
avg_utilization = current_total / total_in * 100
discrepancy_rate = abs_discrepancy_total / total_in * 100

print(
    f"Total In: {total_in}",
    f"Total Out: {total_out}",
    f"Average Utilization (approx): {avg_utilization:.1f}%",
    f"Approx Discrepancy Rate: {discrepancy_rate:.2f}%",
    sep="\n",
)

In [None]:
# Simple visualization: total current stock per zone, largest zone first
zone_summary = (
    df.groupby('Zone')['Current_Stock']
    .sum()
    .sort_values(ascending=False)
)

# Draw the bar chart and label it so the figure stands on its own.
ax = zone_summary.plot.bar()
ax.set(title='Current Stock by Zone', xlabel='Zone', ylabel='Current Stock')
plt.tight_layout()

## Findings & Recommendations (example)
- Identify zones with high utilization for rebalancing.
- Schedule weekly stock audits for items with a non-zero discrepancy.
- Consider relocating fast-moving items to reduce picking time.
