# Weather Data Processing - Regression Example

This notebook demonstrates how to use `WeatherDataProcessor` for a regression task: predicting 3-day precipitation (the `precip_3day_next` target) from Sydney weather data.


In [None]:
# Standard library
import os
import sys

# Third-party
import numpy as np
import pandas as pd

# Put the local ../src directory (resolved against the current working
# directory) at the front of sys.path so the import below picks up the
# development copy rather than an installed copy of the package.
sys.path.insert(0, os.path.abspath('../src'))

# Local development version of the processor
from brayam_pineda_ml.weather_data_processor import WeatherDataProcessor


## 1. Initialize the Weather Data Processor


In [None]:
# Location settings for Sydney, handed to the processor as keyword arguments.
sydney_location = {
    "lat": -33.8678,   # Sydney latitude
    "lon": 151.2073,   # Sydney longitude
    "timezone": "Australia/Sydney",
}

# Build the processor instance that the following cells operate on.
processor = WeatherDataProcessor(**sydney_location)


## 2. Run Complete Pipeline for Regression


In [None]:
# Arguments for the regression run: start/end dates, task type, and target name.
pipeline_kwargs = {
    "start_date": "2016-01-01",
    "end_date": "2024-12-31",
    "task_type": "regression",
    "target_name": "precip_3day_next",
}

# Execute the complete pipeline. The result is indexed by string keys below
# ('X_train', 'X_val', 'X_test', 'feature_names', 'target_name').
data = processor.process_full_pipeline(**pipeline_kwargs)

# Report the shape of each split plus the feature count and target name,
# one item per line.
print(
    f"Training set shape: {data['X_train'].shape}",
    f"Validation set shape: {data['X_val'].shape}",
    f"Test set shape: {data['X_test'].shape}",
    f"Number of features: {len(data['feature_names'])}",
    f"Target variable: {data['target_name']}",
    sep="\n",
)
