# Exploratory Data Analysis (EDA) - Benin (Malanville) Solar Data
#
# **Objective:** Profile, clean, and explore the solar dataset for Malanville, Benin, to understand its characteristics, identify trends, and extract insights for potential solar investments.
#
# **Business Objective Context:** MoonLight Energy Solutions aims to enhance operational efficiency and sustainability through targeted solar investments. This EDA will help identify high-potential regions by analyzing environmental measurement data.

## 1. Setup and Data Loading

In [3]:
#  1. Setup and Data Loading
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy.stats import zscore
import os # For creating directory if it doesn't exist

# Global plot appearance. Order matters: the style sheet is applied first,
# then the colour palette is set on top of it.
plt.style.use("seaborn-v0_8-whitegrid")
sns.set_palette(palette="viridis")


In [4]:
# Location of the raw input CSV.
DATA_DIR = '../data/'
FILE_NAME = 'benin-malanville.csv'
data_path = os.path.join(DATA_DIR, FILE_NAME)

# Target location for the cleaned CSV (currently the same directory as the raw data).
CLEANED_DATA_DIR = '../data/'
# exist_ok=True creates the directory only when it is missing, without a
# separate existence check that could race with another process.
os.makedirs(CLEANED_DATA_DIR, exist_ok=True)
cleaned_file_path = os.path.join(CLEANED_DATA_DIR, 'benin-malanville_clean.csv')

In [5]:
# Load the raw CSV into df_benin. Loading is best-effort: on any failure a
# message is printed and df_benin is set to None instead of raising.
try:
    df_benin = pd.read_csv(data_path)
except FileNotFoundError:
    # Missing input file: point the user at the expected directory.
    df_benin = None
    print(f"Error: {data_path} not found. Ensure the file is in the '{DATA_DIR}' directory.")
except Exception as load_error:
    # Any other read/parse problem: report it and continue without data.
    df_benin = None
    print(f"An error occurred while loading the file: {load_error}")
else:
    # Reached only when read_csv completed without raising.
    print(f"Successfully loaded {data_path}")

Successfully loaded ../data/benin-malanville.csv


 ## 2. Initial Data Inspection