In [53]:
import numpy as np
import pandas as pd

# Read the historical observations and tag every row with its ordinal day of
# the year; that ordinal is the grouping key for the reference statistics.
historical_data = pd.read_csv('Data_set.csv')
historical_data['Date'] = pd.to_datetime(historical_data['Date'])
historical_data['DayOfYear'] = historical_data['Date'].dt.dayofyear

# Per-day mean and standard deviation of the 'Rain' and 'Evap' columns.
# Named aggregation produces the final flat column names directly, so no
# positional rename of a two-level header is needed afterwards.
daily_stats = (
    historical_data
    .groupby('DayOfYear')
    .agg(
        Precip_Mean=('Rain', 'mean'),
        Precip_Std=('Rain', 'std'),
        Evap_Mean=('Evap', 'mean'),
        Evap_Std=('Evap', 'std'),
    )
    .reset_index()
)
# Add month and date columns
def day_of_year_to_date(day_of_year, year=2024):
    """Return the 'MM-DD' label of the given ordinal day within ``year``.

    Args:
        day_of_year: 1-based day number (1 is January 1st).
        year: Calendar year used to resolve the date. The default, 2024,
            is a leap year, so day 366 maps to '12-31'.

    Returns:
        The zero-padded month and day joined by a hyphen, e.g. '02-29'.
        A day number past the end of ``year`` rolls over into the
        following year rather than raising.
    """
    first_of_january = pd.Timestamp(year=year, month=1, day=1)
    elapsed = pd.DateOffset(days=day_of_year - 1)
    return f"{first_of_january + elapsed:%m-%d}"

# Every possible ordinal day of a (leap) year and its 'MM-DD' label.
day_numbers = list(range(1, 367))

# Convert the list to a pandas Series by applying the function to each element
day_series = pd.Series(day_numbers).apply(day_of_year_to_date)

# Attach the label by looking up each row's own DayOfYear value. Assigning
# day_series directly would align on the positional index instead, which
# silently mislabels every row after a gap whenever the historical data does
# not contain all 366 day numbers (e.g. no leap year, so no day 366).
month_day_by_day = dict(zip(day_numbers, day_series))
daily_stats['Month-Day'] = daily_stats['DayOfYear'].map(month_day_by_day)

# NOTE(review): the labels follow a leap-year calendar (the helper's default
# year is 2024). Ordinal days after Feb 28 fall one calendar day later in
# non-leap years, so for those years the label is off by one day -- confirm
# this approximation is acceptable for the reference statistics.

# Reorder columns for better readability
daily_stats = daily_stats[['DayOfYear', 'Month-Day', 'Precip_Mean', 'Precip_Std', 'Evap_Mean', 'Evap_Std']]

# Save daily statistics to a CSV file
daily_stats.to_csv('daily_statistics.csv', index=False)

print("Daily statistics with month and date have been calculated and saved to 'daily_statistics.csv'")


Daily statistics with month and date have been calculated and saved to 'daily_statistics.csv'
