In [1]:
import pandas as pd
import os
from google.colab import drive

# Where the raw CSV is read from (GitHub raw URL) and where the cleaned copy
# is written (a path under the Drive mount point used below).
github_url = "https://raw.githubusercontent.com/apownukepcc/datathon-spring-2025/main/emissions_data.csv"
output_file = "/content/drive/My Drive/emissions_data_updated.csv"

# Attach Google Drive at /content/drive so output_file is writable.
drive.mount('/content/drive')

# Load the emissions data from GitHub into a DataFrame.
# On failure, report the problem and re-raise: the exception stops this cell
# (and any "Run All") with a full traceback. Calling exit() here would instead
# ask the notebook kernel to shut down, discarding all state.
try:
    emissions_data = pd.read_csv(github_url)
    print("File successfully loaded from GitHub.")
except Exception as e:
    print(f"Error loading file from GitHub: {e}")
    raise

# Remove the trailing time part (" 0:00") from the 'TimeStamp' column.
# Guard first: without the column there is nothing to clean, so fail loudly
# with an exception rather than exit(), which would tear down the kernel.
if 'TimeStamp' not in emissions_data.columns:
    print("The column 'TimeStamp' was not found in the file.")
    raise KeyError("TimeStamp")

# The pattern is anchored with `$` so only a value that *ends* in
# "<whitespace>0:00" is trimmed; an unanchored match would also eat the
# middle of a value such as "... 0:00:00" and leave a corrupted ":00" tail.
# NOTE(review): assumes the column holds strings (the .str accessor requires it).
emissions_data['TimeStamp'] = emissions_data['TimeStamp'].str.replace(r"\s0:00$", "", regex=True)
print("'TimeStamp' column cleaned.")

# Write the cleaned frame to Google Drive as CSV, without the index column.
# A failed write is reported but not re-raised (best-effort save).
try:
    emissions_data.to_csv(output_file, index=False)
except Exception as e:
    print(f"Error saving file to Google Drive: {e}")
else:
    # Only reached when to_csv completed without raising.
    print(f"Updated emissions data saved to: {output_file}")


Mounted at /content/drive
File successfully loaded from GitHub.
'TimeStamp' column cleaned.
Updated emissions data saved to: /content/drive/My Drive/emissions_data_updated.csv
