# Exploratory Data Analysis

This notebook demonstrates data generation and exploratory analysis of synthetic solar asset data.


In [None]:
import sys
from pathlib import Path

# Make the project importable from this notebook.
# The imports below use the ``src.`` package prefix, so the directory that
# *contains* ``src`` (the project root) has to be on sys.path. The ``src``
# directory itself is also kept on the path, as before, so any flat imports
# relying on it keep working.
# NOTE(review): assumes the notebook's working directory sits one level below
# the project root (e.g. ``<root>/notebooks``) — confirm.
_project_root = Path.cwd().parent
for _entry in (str(_project_root / "src"), str(_project_root)):
    # Skip entries already present so re-running this cell does not keep
    # growing sys.path with duplicates.
    if _entry not in sys.path:
        sys.path.insert(0, _entry)

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

from src.config.settings import Config, DEFAULT_CONFIG
from src.data_generation.simulate_digital_twin import simulate_digital_twin

# Plot defaults applied to every figure created later in the notebook.
sns.set_style("whitegrid")
plt.rcParams["figure.figsize"] = (12, 6)


## Generate Synthetic Data


In [None]:
import copy

# Configure for quick demo (smaller dataset).
# Work on a deep copy: assigning DEFAULT_CONFIG directly would only alias the
# shared module-level object, so the overrides below would leak into every
# other piece of code that imports DEFAULT_CONFIG in this kernel session.
config = copy.deepcopy(DEFAULT_CONFIG)
config.simulation.days = 90  # 3 months
config.simulation.num_sites = 3
config.simulation.inverters_per_site = 5
config.simulation.strings_per_inverter = 4

print(f"Generating data for {config.simulation.days} days...")
# simulate_digital_twin returns a pair, unpacked here as (telemetry, labels).
# A fixed seed is passed — presumably so repeated runs produce the same data.
telemetry, labels = simulate_digital_twin(config, seed=42)

# Quick sanity summary: record count and the span of the 'timestamp' column.
print(f"Generated {len(telemetry):,} telemetry records")
print(f"Time range: {telemetry['timestamp'].min()} to {telemetry['timestamp'].max()}")
