In [2]:
import pandas as pd

# Cleaned per-country CSV exports, keyed by the country's display name.
csv_by_country = {
    "Benin": "data/benin_clean.csv",
    "Sierra Leone": "data/sierraleone_clean.csv",  # NOTE: filename may differ locally
    "Togo": "data/togo_clean.csv",
}

# Read every file in one pass; dict order (Benin, Sierra Leone, Togo) is kept.
datasets = {name: pd.read_csv(path) for name, path in csv_by_country.items()}

# Sanity check: report the (rows, columns) shape of each loaded frame.
for country, df in datasets.items():
    print(f"{country} dataset loaded. Shape: {df.shape}")
from scipy.stats import f_oneway, kruskal

# Extract GHI values
# Missing readings are dropped per country before testing: neither f_oneway
# nor kruskal skips NaN by default, so a single missing value would silently
# turn the statistic and p-value into NaN.
ghi_benin = datasets['Benin']['GHI'].dropna()
ghi_sierra = datasets['Sierra Leone']['GHI'].dropna()
ghi_togo = datasets['Togo']['GHI'].dropna()

# One-way ANOVA
# Parametric test of the null hypothesis that all three groups share the
# same population mean.
anova_result = f_oneway(ghi_benin, ghi_sierra, ghi_togo)
print("One-way ANOVA result:")
print(f"F-statistic = {anova_result.statistic:.4f}, p-value = {anova_result.pvalue:.4e}")

# Kruskal-Wallis test
# Rank-based (non-parametric) counterpart; it does not rely on normality,
# so it serves as a cross-check on the ANOVA conclusion.
kruskal_result = kruskal(ghi_benin, ghi_sierra, ghi_togo)
print("\nKruskal-Wallis test result:")
print(f"H-statistic = {kruskal_result.statistic:.4f}, p-value = {kruskal_result.pvalue:.4e}")

# NOTE: a p-value printed as 0.0000e+00 has underflowed float precision; read
# it as "smaller than can be represented", not as exactly zero.



Benin dataset loaded. Shape: (525600, 19)
Sierra Leone dataset loaded. Shape: (525600, 19)
Togo dataset loaded. Shape: (525600, 19)
One-way ANOVA result:
F-statistic = 2090.0929, p-value = 0.0000e+00

Kruskal-Wallis test result:
H-statistic = 4524.8835, p-value = 0.0000e+00
