Set Folders

In [21]:
from google.colab import drive
import os

temp_humidity_folder = "/content/drive/MyDrive/weatherdata"
voltage_folder = "/content/drive/MyDrive/voltagedata"


Read Voltage and Weather Data

In [28]:
import pandas as pd
import glob

#load temp and humidity data
temp_humidity_files = glob.glob(temp_humidity_folder + "/*.csv")
dfs_temp_humidity = []

for file in temp_humidity_files:
    try:
        df = pd.read_csv(file, skiprows=2)  #first 2 rows removed because they mess up the columns
        df = df[['Year', 'Month', 'Day', 'Hour', 'Minute', 'Temperature', 'Relative Humidity']]  # Keep only relevant columns
        df['timestamp'] = pd.to_datetime(df[['Year', 'Month', 'Day', 'Hour', 'Minute']])  #combine into timestamp
        df = df.drop(columns=['Year', 'Month', 'Day', 'Hour', 'Minute'])
        dfs_temp_humidity.append(df)
    except Exception as e:
        print(f"Error processing {file}: {e}")

if dfs_temp_humidity:
    df_temp_humidity = pd.concat(dfs_temp_humidity, ignore_index=True)
    print(df_temp_humidity.head())
else:
    print("No valid weather data found.")

voltage_files = glob.glob(os.path.join(voltage_folder, "*.xls"))
#print("Voltage files found:", voltage_files) #used for debug

dfs_voltage = []
for file in voltage_files:
    try:
        df = pd.read_excel(file)
        dfs_voltage.append(df)
    except Exception as e:
        print(f"Error reading {file}: {e}")

#Concatenate voltage
if dfs_voltage:
    df_voltage = pd.concat(dfs_voltage, ignore_index=True)
    df_voltage = df_voltage[['Hour_End', 'WEST']]  #keep relevant columns
    df_voltage['Hour_End'] = pd.to_datetime(df_voltage['Hour_End'])
else:
    print("No valid voltage data found.")
    df_voltage = pd.DataFrame(columns=['Hour_End', 'WEST']) #put data into dataframe


print(df_temp_humidity.head())
print(df_voltage.head())

   Temperature  Relative Humidity           timestamp
0          9.2              46.99 2012-01-01 00:30:00
1          8.2              48.76 2012-01-01 01:30:00
2          7.4              50.02 2012-01-01 02:30:00
3          6.4              51.82 2012-01-01 03:30:00
4          5.3              53.63 2012-01-01 04:30:00
Voltage files found: ['/content/drive/MyDrive/voltagedata/native_load_2015.xls', '/content/drive/MyDrive/voltagedata/2014_ercot_hourly_load_data.xls', '/content/drive/MyDrive/voltagedata/2013_ercot_hourly_load_data.xls', '/content/drive/MyDrive/voltagedata/2012_ercot_hourly_load_data (3).xls']
   Temperature  Relative Humidity           timestamp
0          9.2              46.99 2012-01-01 00:30:00
1          8.2              48.76 2012-01-01 01:30:00
2          7.4              50.02 2012-01-01 02:30:00
3          6.4              51.82 2012-01-01 03:30:00
4          5.3              53.63 2012-01-01 04:30:00
                 Hour_End         WEST
0 2015-01-01 01:00