In [12]:
import pandas as pd
import plotly.express as px
import plotly.io as pio


In [10]:
# Read the pre-cleaned agriculture CSV (path is relative to the working directory) into `df`.
df = pd.read_csv(filepath_or_buffer="agri_cleaned.csv")

In [17]:
# Make "browser" the default Plotly renderer used by every later .show() call.
# NOTE(review): per the Plotly renderer docs this opens each figure in a web
# browser tab instead of rendering inline in the notebook — confirm intended.
pio.renderers.default = 'browser'

In [19]:
# 1. Top 7 rice-producing states: Rice_Prod_1000t summed per state, largest first.
rice_top = (
    df.groupby(by="State")["Rice_Prod_1000t"]
    .sum()
    .sort_values(ascending=False)
    .head(7)
    .reset_index()
)
fig = px.bar(
    data_frame=rice_top,
    x="State",
    y="Rice_Prod_1000t",
    title="Top 7 States by Rice Production",
)
fig.show()

In [20]:
# 2. Top 5 wheat-producing states (pie): Wheat_Prod_1000t summed per state,
# keeping the five largest totals. `wheat_top` remains a State-indexed Series.
wheat_top = (
    df.groupby("State")["Wheat_Prod_1000t"]
    .sum()
    .sort_values(ascending=False)
    .head(5)
)
# Plot from a frame with named columns (as the other charts do) rather than
# passing a Series plus a raw index/ndarray, so the slices are bound to the
# "State" and "Wheat_Prod_1000t" columns by name.
px.pie(
    wheat_top.reset_index(),
    names="State",
    values="Wheat_Prod_1000t",
    title="Top 5 Wheat Producing States",
).show()

In [None]:
# 3. Sugarcane production trend: Sugarcane_Prod_1000t summed per Year, drawn as a line.
sugarcane_trend = (
    df.groupby(by="Year")["Sugarcane_Prod_1000t"]
    .sum()
    .reset_index()
)
px.line(
    data_frame=sugarcane_trend,
    x="Year",
    y="Sugarcane_Prod_1000t",
    title="India’s Sugarcane Production (50 Years)",
).show()

# 4. Rice vs wheat trend: both production columns summed per Year, one line each.
prod_trend = (
    df.groupby(by="Year")[["Rice_Prod_1000t", "Wheat_Prod_1000t"]]
    .sum()
    .reset_index()
)
px.line(
    data_frame=prod_trend,
    x="Year",
    y=["Rice_Prod_1000t", "Wheat_Prod_1000t"],
    title="Rice vs Wheat Production (Last 50 Years)",
).show()

# 5. Top 7 groundnut-producing states: Groundnut_Prod_1000t summed per state, largest first.
groundnut_top = (
    df.groupby(by="State")["Groundnut_Prod_1000t"]
    .sum()
    .sort_values(ascending=False)
    .head(7)
    .reset_index()
)
px.bar(
    data_frame=groundnut_top,
    x="State",
    y="Groundnut_Prod_1000t",
    title="Top 7 Groundnut Producing States",
).show()

# 6. Top 7 sunflower-producing states: Sunflower_Prod_1000t summed per state, largest first.
sunflower_top = (
    df.groupby(by="State")["Sunflower_Prod_1000t"]
    .sum()
    .sort_values(ascending=False)
    .head(7)
    .reset_index()
)
px.bar(
    data_frame=sunflower_top,
    x="State",
    y="Sunflower_Prod_1000t",
    title="Top 7 Sunflower Producing States",
).show()

# 7. Soybean production & yield: the five states with the highest mean
# Soybean_Prod_1000t. Bars are coloured by each state's mean Soybean_Yield so
# the chart actually shows the yield its title refers to (previously the yield
# column was aggregated but never plotted).
# NOTE(review): this ranking uses the per-state mean, whereas the other top-N
# charts in this notebook rank by the sum — confirm that is intended.
soybean_top = (
    df.groupby("State")[["Soybean_Prod_1000t", "Soybean_Yield"]]
    .mean()
    .sort_values("Soybean_Prod_1000t", ascending=False)
    .head(5)
    .reset_index()
)
px.bar(
    soybean_top,
    x="State",
    y="Soybean_Prod_1000t",
    color="Soybean_Yield",  # continuous colour scale encodes mean yield per state
    title="Top 5 Soybean Producing States and Yield Efficiency",
).show()

# 8. Oilseed production by state: Oilseed_Prod_1000t summed per state, largest
# first. No head() cutoff is applied, so every state in `df` gets a bar.
oilseed_top = (
    df.groupby(by="State")["Oilseed_Prod_1000t"]
    .sum()
    .sort_values(ascending=False)
    .reset_index()
)
px.bar(
    data_frame=oilseed_top,
    x="State",
    y="Oilseed_Prod_1000t",
    title="Oilseed Production in Major States",
).show()

# 9. Area vs. production: per-Year means of rice area, wheat area and maize
# yield, drawn as three lines on one shared y-axis.
# NOTE(review): the title mentions production, but no *_Prod_* column is
# plotted, and Maize_Yield shares an axis with two area series — confirm the
# intended columns.
area_effect = (
    df.groupby(by="Year")[["Rice_Area_1000ha", "Wheat_Area_1000ha", "Maize_Yield"]]
    .mean()
    .reset_index()
)
px.line(
    data_frame=area_effect,
    x="Year",
    y=["Rice_Area_1000ha", "Wheat_Area_1000ha", "Maize_Yield"],
    title="Impact of Area Cultivated on Production",
).show()

# 10. Yield comparison: one point per state, mean Rice_Yield (x) against mean
# Wheat_Yield (y); the state name appears on hover.
yield_states = (
    df.groupby(by="State")[["Rice_Yield", "Wheat_Yield"]]
    .mean()
    .reset_index()
)
px.scatter(
    data_frame=yield_states,
    x="Rice_Yield",
    y="Wheat_Yield",
    hover_name="State",
    title="Rice vs. Wheat Yield Across States",
).show()