In [7]:
from pathlib import Path

import pandas as pd

In [8]:
# Location slugs; each one is used as the base name of a CSV file
# (read from the raw weather directory, written to the aggregated one).
locations = ["kum", "lovrenska-jezera", "osp", "storzic", "vrsic"]

In [11]:
# Aggregate each location's raw weather CSV into one row per calendar day:
# mean temperature and total rainfall, tagged with the location slug.

# Make sure the output directory exists so the notebook also runs on a fresh
# checkout (to_csv does not create missing parent directories).
output_dir = Path("../data/weather/aggregated")
output_dir.mkdir(parents=True, exist_ok=True)

for location in locations:
    filename = f"../data/weather/raw/{location}.csv"
    print("PROCESSING", filename)

    # Read the raw CSV, keep only the three columns of interest under English
    # names, parse the timestamps and index the frame by them.
    # NOTE: the source header " valid" really does start with a space.
    df = (
        pd.read_csv(filename, header=0)
        .rename(columns={" valid": "datetime", "povp. T [°C]": "temperature", "količina padavin [mm]": "rain"})
        .filter(["datetime", "temperature", "rain"])
        .assign(datetime=lambda frame: pd.to_datetime(frame["datetime"]))
        .set_index("datetime")
    )

    # Aggregate per day ("D"): temperature is averaged, rain is summed.
    # Days without any observations get NaN temperature and 0 rain, which is
    # the default behaviour of mean/sum on an empty bin.
    resampled = (
        df.resample("D")
        .agg({"temperature": "mean", "rain": "sum"})
        .reset_index()
    )

    # Tag every row with the location it belongs to.
    resampled["location"] = location

    # Save the daily data with a fixed column order and no index column.
    resampled.to_csv(
        output_dir / f"{location}.csv",
        columns=["location", "datetime", "temperature", "rain"],
        index=False,
    )

PROCESSING ../data/weather/raw/kum.csv
PROCESSING ../data/weather/raw/lovrenska-jezera.csv
PROCESSING ../data/weather/raw/osp.csv
PROCESSING ../data/weather/raw/storzic.csv
PROCESSING ../data/weather/raw/vrsic.csv
