# Exploratory Data Analysis for Solar Farm Data
This notebook explores the solar farm dataset to identify high-potential regions for solar installations in Benin, Sierra Leone, and Togo.


In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Load the dataset (the path is resolved relative to the notebook's working directory)
data = pd.read_csv('../data/solar_farm_data.csv')

# Display the first few rows.
# A bare `data.head()` is only rendered when it is the LAST expression of a
# cell; more statements follow here, so the preview has to be printed
# explicitly or it is silently discarded.
print(data.head())

# Dataset overview: info() writes its report (columns, dtypes, non-null counts)
# straight to stdout, so it needs no print() wrapper.
print("Dataset Info:")
data.info()

# Check for missing values: per-column count of null entries
print("\nMissing Values:")
print(data.isnull().sum())

# Summary statistics (describe() covers the numeric columns by default)
print("\nSummary Statistics:")
print(data.describe())


# Histogram grid: one panel per numeric column of `data`.
# Options are gathered in one place so the bin count / figure size are easy to tune.
hist_options = {"bins": 20, "figsize": (10, 8)}
data.hist(**hist_options)
plt.tight_layout()  # keep neighbouring panels' titles and tick labels from overlapping
plt.show()


# Correlation heatmap
# Correlation is only defined for numeric data. Calling `data.corr()` on the
# whole frame raises in pandas >= 2.0 as soon as one column is non-numeric
# (the frame has a 'Country' column that the bar plot treats as a category,
# presumably string-valued), so restrict the frame to numeric columns first.
# select_dtypes works on every pandas version, unlike the `numeric_only` keyword.
numeric_data = data.select_dtypes(include="number")
correlations = numeric_data.corr()

plt.figure(figsize=(8, 6))
# annot/fmt print each coefficient in its cell, rounded to two decimals
sns.heatmap(correlations, annot=True, cmap='coolwarm', fmt='.2f')
plt.title("Correlation Heatmap")
plt.show()


# Bar chart of the 'SolarPotential' column grouped by 'Country'
# (seaborn aggregates each group with its default estimator).
bar_axes = sns.barplot(data=data, x='Country', y='SolarPotential')
bar_axes.set_title("Solar Potential by Country")
plt.show()


