In [1]:
import os
import pandas as pd

In [2]:
# Start with an empty DataFrame as the placeholder for the combined records;
# the per-year loading cell that follows fills in `combined_data`.
combined_data = pd.DataFrame()

In [3]:
def load_spot_sst(years, spot="Arugam Bay", base_dir="."):
    """Collect the daily SST rows of one surf spot from the yearly CSV files.

    For every ``year`` in ``years`` the file
    ``{base_dir}/{year}/SurfSpot_SST(Daily Mean {year}).csv`` is read, rows whose
    'Surf Spot' column equals ``spot`` are kept, and only the 'Date' and
    'SST (°C)' columns are retained (the latter renamed to 'SST').

    Parameters
    ----------
    years : iterable of int
        Years to load; each year lives in its own sub-folder of ``base_dir``.
    spot : str, default "Arugam Bay"
        Value of the 'Surf Spot' column to keep.
    base_dir : str, default "."
        Directory that contains the per-year folders.

    Returns
    -------
    pandas.DataFrame
        Columns ['Date', 'SST'] with a fresh 0..n-1 index, in the order the
        years were given. Empty (but with both columns) if nothing was loaded.

    Raises
    ------
    KeyError
        If a file that exists lacks one of the required columns.

    Notes
    -----
    A missing yearly file is reported on stdout and skipped, not raised.
    """
    required_columns = ['Surf Spot', 'Date', 'SST (°C)']
    yearly_frames = []

    for year in years:
        folder_path = f"{base_dir}/{year}/"  # Path to year folder
        csv_file = f"SurfSpot_SST(Daily Mean {year}).csv"  # Expected filename

        try:
            df = pd.read_csv(os.path.join(folder_path, csv_file))
        except FileNotFoundError:
            print(f"⚠️ File not found: {folder_path}{csv_file} (Skipping)")
            continue

        # Fail with the same exception type as a plain column lookup would, but
        # say which file is malformed.
        missing = [col for col in required_columns if col not in df.columns]
        if missing:
            raise KeyError(f"{folder_path}{csv_file} is missing column(s): {missing}")

        spot_rows = df.loc[df['Surf Spot'] == spot, ['Date', 'SST (°C)']]
        yearly_frames.append(spot_rows.rename(columns={'SST (°C)': 'SST'}))

    if not yearly_frames:
        return pd.DataFrame(columns=['Date', 'SST'])

    # One concat at the end instead of growing a frame inside the loop;
    # ignore_index avoids repeated row labels across the yearly files.
    return pd.concat(yearly_frames, ignore_index=True)


# Build the combined frame from scratch (2020 to 2024) so that re-running this
# cell never appends duplicate rows to an earlier result.
combined_data = load_spot_sst(range(2020, 2025))

In [4]:
# Save the combined records to a new CSV and show a short preview.
output_filename = "Arugam Bay Mean Daily SST(2020-24).csv"

if combined_data.empty:
    # Missing yearly files are skipped while loading, so the combined frame can
    # end up empty; do not write a blank CSV and report it as a success.
    print(f"⚠️ No data collected; nothing written to {output_filename}")
else:
    # index=False: the row labels carry no information, keep them out of the file.
    combined_data.to_csv(output_filename, index=False)

    print(f"✅ Successfully saved: {output_filename}")
    print("\nPreview:")
    # NOTE(review): the recorded preview shows SST values near 2814 although the
    # source column is labelled 'SST (°C)' — confirm the units/scaling upstream.
    print(combined_data.head())  # Show first 5 rows

✅ Successfully saved: Arugam Bay Mean Daily SST(2020-24).csv

Preview:
         Date          SST
0  2020-01-01  2814.193548
1  2020-01-02  2814.717894
2  2020-01-03  2815.242240
3  2020-01-04  2815.766587
4  2020-01-05  2816.290933
