In [1]:
import pandas as pd
from google.colab import drive

# Mount Google Drive so the combined CSV can be written to it
drive.mount('/content/drive')

# Define file paths
github_emissions_url = "https://raw.githubusercontent.com/apownukepcc/datathon-spring-2025/main/emissions_data_updated.csv"
github_weather_url = "https://raw.githubusercontent.com/apownukepcc/datathon-spring-2025/main/weather.csv"
output_file = "/content/drive/My Drive/combined_data.csv"


def load_csv_from_github(url: str, label: str) -> pd.DataFrame:
    """Read a CSV from ``url`` into a DataFrame and report the outcome.

    Args:
        url: Location of the CSV file, passed straight to ``pd.read_csv``.
        label: Lowercase dataset name used in the printed status messages
            (e.g. ``"emissions"``).

    Returns:
        The DataFrame produced by ``pd.read_csv``.

    Raises:
        Exception: Whatever ``pd.read_csv`` raised, re-raised unchanged after
            the error message has been printed.
    """
    try:
        frame = pd.read_csv(url)
    except Exception as e:
        print(f"Error loading {label} data from GitHub: {e}")
        # Re-raise rather than calling exit(): in a notebook kernel exit()
        # requests a kernel shutdown instead of cleanly aborting the cell,
        # and it hides the traceback needed to diagnose the failure.
        raise
    print(f"{label.capitalize()} data successfully loaded from GitHub.")
    return frame


# Load both datasets from GitHub
emissions_data = load_csv_from_github(github_emissions_url, "emissions")
weather_data = load_csv_from_github(github_weather_url, "weather")

# Standardize column names for merging
emissions_data = emissions_data.rename(columns={"TimeStamp": "date"})

# rename() silently does nothing when "TimeStamp" is absent, so verify the
# join key explicitly and fail with a message that names the offending file.
for _label, _frame in (("emissions", emissions_data), ("weather", weather_data)):
    if "date" not in _frame.columns:
        raise KeyError(
            f"The {_label} data has no 'date' column; "
            f"available columns: {list(_frame.columns)}"
        )

# Merge the datasets on the 'date' column (inner join keeps only matching dates)
combined_data = pd.merge(emissions_data, weather_data, on="date", how="inner")

# An inner join with no matching keys yields an empty frame without any error;
# surface that instead of quietly writing an empty file.
if combined_data.empty:
    print(
        "Warning: the merge produced no rows; check that the 'date' values "
        "in both files use the same format."
    )

# Save the combined data to Google Drive (best-effort: report but do not raise,
# the merged frame is still available in memory as `combined_data`)
try:
    combined_data.to_csv(output_file, index=False)
    print(f"Combined data saved to: {output_file}")
except Exception as e:
    print(f"Error saving combined data to Google Drive: {e}")


Mounted at /content/drive
Emissions data successfully loaded from GitHub.
Weather data successfully loaded from GitHub.
Combined data saved to: /content/drive/My Drive/combined_data.csv
