# 📊 Enhanced Commodity Price Analysis (Jan - Jun 2025)

This notebook explores trends in **commodity prices in Tamil Nadu** using `pandas`, `matplotlib`, and `seaborn`.

It complements the Power BI dashboard by offering a code-level analysis.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Apply seaborn's 'whitegrid' style to the figures drawn in the cells below.
sns.set(style='whitegrid')
# IPython magic: render matplotlib figures inline in the notebook output.
%matplotlib inline

In [None]:
# Read the price records (adjust the path as needed) and derive the calendar
# fields in one chained step, so re-running this cell always rebuilds `df`
# from the file.
df = (
    pd.read_csv('Data/commodity_prices.csv')
    .assign(Arrival_Date=lambda frame: pd.to_datetime(frame['Arrival_Date']))
    .assign(
        # Full month name (e.g. 'January') and the four-digit year.
        Month=lambda frame: frame['Arrival_Date'].dt.strftime('%B'),
        Year=lambda frame: frame['Arrival_Date'].dt.year,
    )
)

# Preview the first rows as the cell output.
df.head()

In [None]:
# Print the column dtypes and non-null counts, then show summary statistics
# as the cell's displayed output.
df.info()
df.describe()

In [None]:
# Count missing values in each column.
df.isna().sum()

In [None]:
# Average modal price per calendar month.
#
# The months are ordered by their calendar number taken from the data itself
# rather than by a hard-coded list of names, so only months that actually
# occur are plotted (a fixed list that names a month with no records yields a
# NaN row and an empty bar). groupby sorts by its keys, which puts the rows in
# calendar order; rows with an unparsed date are dropped by groupby.
monthly_avg = (
    df.assign(Month_Num=df['Arrival_Date'].dt.month)
    .groupby(['Month_Num', 'Month'], as_index=False)['Modal_Price']
    .mean()
    .drop(columns='Month_Num')
)

fig, ax = plt.subplots(figsize=(10, 6))
# Colour each bar through `hue` (passing `palette` without `hue` is deprecated
# in recent seaborn); dodge=False keeps the bars full-width and centred.
sns.barplot(
    x='Month',
    y='Modal_Price',
    hue='Month',
    data=monthly_avg,
    palette='viridis',
    dodge=False,
    ax=ax,
)
# Some seaborn versions add a legend that merely repeats the x-axis labels.
redundant_legend = ax.get_legend()
if redundant_legend is not None:
    redundant_legend.remove()

ax.set_title('Average Modal Price by Month')
ax.set_ylabel('Avg Modal Price')
ax.tick_params(axis='x', rotation=45)
fig.tight_layout()
plt.show()

In [None]:
# Mean modal price per commodity, keeping the ten highest averages.
commodity_avg = (
    df.groupby('Commodity')['Modal_Price']
    .mean()
    .sort_values(ascending=False)
    .head(10)
)

# Draw on an explicit Axes instead of the implicit pyplot state.
fig, ax = plt.subplots(figsize=(10, 6))
commodity_avg.plot.bar(ax=ax, color='coral')
ax.set_title('Top 10 Commodities by Avg Modal Price')
ax.set_ylabel('Modal Price')
fig.tight_layout()
plt.show()

In [None]:
# Sum of modal prices per market, keeping the ten largest totals.
# NOTE(review): a sum grows with the number of records a market has, so this
# ranking presumably mixes price level with reporting volume - confirm that
# a total (rather than a mean) is the intended metric.
market_sum = (
    df.groupby('Market')['Modal_Price']
    .sum()
    .sort_values(ascending=False)
    .head(10)
)

fig, ax = plt.subplots(figsize=(10, 6))
market_sum.plot(kind='barh', color='skyblue', ax=ax)
# A horizontal bar chart draws the first row at the bottom; flip the axis so
# the largest total sits at the top, matching the descending sort.
ax.invert_yaxis()
ax.set_title('Top Markets by Total Modal Price')
ax.set_xlabel('Total Modal Price')
fig.tight_layout()
plt.show()

In [None]:
# Modal price over time, one line per commodity.
#
# Aggregate to one mean price per (commodity, date) in pandas first. Handing
# the raw rows to seaborn makes it average every repeated date itself and
# bootstrap a confidence band for each point, which is slow and clutters the
# chart when many commodities are drawn together.
daily_avg = (
    df.groupby(['Commodity', 'Arrival_Date'], as_index=False)['Modal_Price']
    .mean()
)

fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(
    data=daily_avg,
    x='Arrival_Date',
    y='Modal_Price',
    hue='Commodity',
    estimator=None,  # data is already aggregated; plot the values as given
    ax=ax,
)
ax.set_title('Modal Price Over Time by Commodity')
ax.set_ylabel('Modal Price')
ax.set_xlabel('Date')
# Place the legend outside the plotting area so it does not cover the lines.
ax.legend(bbox_to_anchor=(1.05, 1), loc='upper left')
fig.tight_layout()
plt.show()