In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy import stats
import os

# Notebook-wide setup: make sure the output folder exists, then apply the
# plotting defaults used by every figure below.
os.makedirs('outputs', exist_ok=True)  # exist_ok: re-running the cell is harmless
plt.rcParams['figure.dpi'] = 120
sns.set(style='whitegrid')


In [None]:
# Cell 2: read one CSV per country into `dfs`, keyed by country name.
files = dict(
    Benin='data/benin_clean.csv',
    SierraLeone='data/sierra_leone_clean.csv',
    Togo='data/togo_clean.csv',
)

dfs = {}
for country, path in files.items():
    frame = pd.read_csv(path)
    dfs[country] = frame
    # Report each file right after it is read, so a failure on a later file
    # still shows which ones loaded.
    print(country, 'loaded, shape=', frame.shape)


In [None]:
# Print a trimmed describe() table (count, mean, median, std) for the three
# metric columns of every loaded country frame.
summary_columns = ['GHI','DNI','DHI']
summary_rows = ['count','mean','50%','std']  # '50%' is describe()'s median row

for c, df in dfs.items():
    print(f"--- {c} ---")
    overview = df[summary_columns].describe().loc[summary_rows]
    # The extra newline leaves a blank line between consecutive countries.
    print(overview, end="\n\n")

In [None]:
# Cell 4: stack the three metric columns of every country into one long frame,
# tagging each row with the country it came from.
combined = pd.concat(
    [
        # assign() returns a new frame, so the per-country originals in `dfs`
        # are left untouched.
        frame[['GHI','DNI','DHI']].assign(country=country_name)
        for country_name, frame in dfs.items()
    ],
    ignore_index=True,  # discard per-file row labels; number rows 0..n-1
)
combined.head()


In [None]:
# Per-country mean / median / standard deviation of each metric, flattened to
# single-level column names and written to outputs/summary_table.csv.
metrics = ['GHI','DNI','DHI']
grouped_stats = combined.groupby('country')[metrics].agg(['mean','median','std'])

# agg() with a list of functions yields two-level (metric, statistic) column
# labels; collapse each pair into one name such as 'GHI_mean'.
grouped_stats.columns = [
    f"{metric}_{stat_name}".strip()
    for metric, stat_name in grouped_stats.columns
]

# reset_index() turns the 'country' group key back into an ordinary column so
# it is kept in the CSV even though index=False.
summary = grouped_stats.reset_index()
summary.to_csv('outputs/summary_table.csv', index=False)
summary