# 📈 Sustainable Energy Trend Analysis
This notebook analyzes renewable energy trends across Canadian provinces using synthetic data.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the province-level renewable energy dataset (path is relative to this notebook)
csv_path = '../data/renewable_energy_by_province.csv'
data = pd.read_csv(csv_path)
data.head()

## 🔍 Installed Capacity Over Time

In [None]:
# Total installed capacity by year and energy type.
# `estimator='sum'` makes seaborn add up Installed_Capacity_MW over every row that
# shares an x value (Year) within each hue level (Energy_Type).
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(
    data=data,
    x='Year',
    y='Installed_Capacity_MW',
    hue='Energy_Type',
    estimator='sum',
    # `ci=None` is deprecated since seaborn 0.12 and emits a FutureWarning;
    # `errorbar=None` is the supported way to disable the error band.
    errorbar=None,
    ax=ax,
)
# NOTE(review): the year range in the title is hard-coded — confirm it matches the dataset.
ax.set_title('Total Installed Renewable Energy Capacity in Canada (2018–2023)')
ax.set_ylabel('Capacity (MW)')
ax.grid(True)
plt.show()

## 🌍 Provincial Comparison (Latest Year)

In [None]:
# Restrict the comparison to the most recent year present in the dataset.
latest_year = data['Year'].max()
is_latest = data['Year'] == latest_year
latest_data = data[is_latest]

# One bar per province, split by energy type.
fig, ax = plt.subplots(figsize=(12, 6))
sns.barplot(
    data=latest_data,
    x='Province',
    y='Installed_Capacity_MW',
    hue='Energy_Type',
    ax=ax,
)
ax.set_title(f'Renewable Energy Capacity by Province in {latest_year}')
ax.set_ylabel('Capacity (MW)')
plt.xticks(rotation=45)  # tilt the province labels
plt.show()

## 📊 Growth Rate Analysis

In [None]:
# Calculate CAGR (compound annual growth rate, in percent) per province/energy type:
#     CAGR = ((end_capacity / start_capacity) ** (1 / n_years) - 1) * 100
#
# The 'first'/'last' aggregations pick rows by position within each group, so the
# frame is sorted by Year first; otherwise start/end capacity would depend on the
# CSV row order rather than on the earliest/latest year. A stable sort keeps the
# original order among rows that share a Year.
data_by_year = data.sort_values('Year', kind='stable')

growth_data = (
    data_by_year
    .groupby(['Province', 'Energy_Type'])
    .agg(
        first_year=('Year', 'min'),
        last_year=('Year', 'max'),
        start_capacity=('Installed_Capacity_MW', 'first'),
        end_capacity=('Installed_Capacity_MW', 'last'),
    )
    .reset_index()
)

n_years = growth_data['last_year'] - growth_data['first_year']
capacity_ratio = growth_data['end_capacity'] / growth_data['start_capacity']

# CAGR is undefined when a group spans a single year (exponent 1/0) or starts from
# zero capacity (division by zero). Mask those rows to NaN instead of letting
# inf or spurious values float to the top of the ranking.
cagr_defined = (n_years > 0) & (growth_data['start_capacity'] > 0)
growth_data['CAGR'] = (
    capacity_ratio.where(cagr_defined) ** (1 / n_years.where(cagr_defined)) - 1
) * 100

# Fastest-growing combinations first; rows with undefined CAGR (NaN) sort last.
growth_data = growth_data.sort_values(by='CAGR', ascending=False)
growth_data.head()