In [6]:
import pandas as pd
import matplotlib.pyplot as plt

# Load the weather observations. The code below relies on the columns
# 'Time', 'ParameterName' and 'ParameterValue' being present.
CSV_NAME = 'weather_2020-11.csv'
data = pd.read_csv(CSV_NAME)

# Parameter codes to report, mapped to the label printed for each one.
# The dict order defines the order of the output lines.
PARAM_LABELS = {
    'RH_PT1H_AVG': 'Relative Humidity',
    'TA_PT1H_AVG': 'Temperature Average',
    'WS_PT1H_AVG': 'Wind Speed',
    'PRA_PT1H_ACC': 'Precipitation Amount',
    'PA_PT1H_AVG': 'Pressure Average',
}

# Filter and extract relevant data (copy so the conversion below does not
# write into a view of `data`).
relevant_params = list(PARAM_LABELS)
relevant_data = data[data['ParameterName'].isin(relevant_params)].copy()

# Convert ParameterValue to numeric; unparseable entries become NaN.
relevant_data['ParameterValue'] = pd.to_numeric(relevant_data['ParameterValue'], errors='coerce')

# Pivot to one column per parameter, indexed by Time. pivot_table aggregates
# duplicate (Time, ParameterName) pairs with the mean by default.
# NOTE(review): with the default dropna=True a parameter whose values are all
# NaN (or that never occurs in the file) has no column in the result --
# presumably why precipitation is reported as NaN; confirm against the CSV.
pivot_table = relevant_data.pivot_table(values='ParameterValue', index='Time', columns='ParameterName')

# Calculate summary statistics (kept at top level for use outside this block).
summary_stats = pivot_table.describe()

# Calculate average values over the entire timespan
avg_values = pivot_table.mean()

# Output calculated values. Every parameter is looked up with Series.get so a
# column missing from the pivot prints "NaN" instead of raising KeyError;
# previously only the precipitation column was guarded this way.
print("\nCalculated Values:")
for param, label in PARAM_LABELS.items():
    mean_value = avg_values.get(param)
    if mean_value is None:
        print(f"{label} (avg): NaN")
    else:
        print(f"{label} (avg): {mean_value:.2f}")



Calculated Values:
Relative Humidity (avg): 87.90
Temperature Average (avg): 2.74
Wind Speed (avg): 3.90
Precipitation Amount (avg): NaN
Pressure Average (avg): 1012.63
