# GeoRelief-AI Data Exploration

This notebook is for exploring and analyzing the geospatial data used in GeoRelief-AI.


In [None]:
import sys
from pathlib import Path
import geopandas as gpd
import pandas as pd
import matplotlib.pyplot as plt

# Put the parent of the current working directory at the front of the
# import path (presumably the project root that holds the `core` package
# imported below - confirm against the repo layout).
# The membership check keeps the cell idempotent: re-running it in the same
# kernel must not stack duplicate entries on sys.path.
_project_root = str(Path().resolve().parent)
if _project_root not in sys.path:
    sys.path.insert(0, _project_root)

from core import config


In [None]:
# Load the master dataset
# Reads the file at config.MASTER_DATASET_PATH into `gdf` and prints a short
# summary (row count, column names, first rows). When the file is absent,
# only a hint is printed and `gdf` is not assigned.
if not config.MASTER_DATASET_PATH.exists():
    print(
        f"Dataset not found at {config.MASTER_DATASET_PATH}",
        "Please run data processing first.",
        sep="\n",
    )
else:
    gdf = gpd.read_file(config.MASTER_DATASET_PATH)
    print(f"Loaded {len(gdf)} regions")
    print(f"Columns: {list(gdf.columns)}")
    print("\nFirst few rows:")
    print(gdf.head())


In [None]:
# Visualize the data
# Draws a choropleth of the 'population_density' column, one polygon per
# region. The guards below check the loaded frame, not just the file on disk:
# the file existing does not guarantee that the loading cell has been run in
# this kernel, and the column name is hard-coded, so a dataset without it
# would otherwise fail with an opaque KeyError from inside the plot call.
if not config.MASTER_DATASET_PATH.exists() or "gdf" not in globals():
    print("No dataset loaded; run the loading cell (and data processing, if needed) first.")
elif "population_density" not in gdf.columns:
    print(
        "Column 'population_density' not found; "
        f"available columns: {list(gdf.columns)}"
    )
else:
    fig, ax = plt.subplots(1, 1, figsize=(12, 8))
    gdf.plot(ax=ax, column='population_density', legend=True, cmap='YlOrRd')
    ax.set_title('Population Density by Region')
    plt.tight_layout()
    plt.show()
