In [1]:
import pandas as pd
import json
import os

# CSV files to process; each name is resolved against input_directory.
file_names = [
    "Cupertino.csv",
    "District Office.csv",
    "Fremont.csv",
    "Homestead.csv",
    "Lynbrook.csv",
    "Monta Vista.csv",
]

# Directory paths. The trailing slashes are kept so the values also work
# when a file name is appended by plain string concatenation.
input_directory = '/mnt/data/'
output_directory = '/mnt/data/processed/'

# Create the output directory (and any missing parents). exist_ok=True makes
# the cell safe to re-run and avoids the check-then-create race of a separate
# os.path.exists() test.
os.makedirs(output_directory, exist_ok=True)

# Function to process CSV files
def process_csv(file_name, input_dir=None, output_dir=None):
    """Extract the date and CO2 columns of one CSV and save them as CSV and JSON.

    The file is read from the input directory, two columns are selected and
    renamed to ``Date`` and ``CO2``, and the result is written to the output
    directory as ``<stem>_co2.csv`` and ``<stem>_co2.json`` (JSON written with
    ``orient='records'``), where ``<stem>`` is ``file_name`` without its
    extension.

    Column selection:
      * CO2 column: ``'Total'`` when ``file_name`` is ``"District Office.csv"``;
        otherwise the first column whose name contains ``'CO2'`` or ``'Carbon'``.
      * Date column: ``' Date'`` (with the leading space) when present;
        otherwise the first column whose name equals ``'Date'`` once
        surrounding whitespace is stripped.

    Parameters
    ----------
    file_name : str
        Name of the CSV file, relative to the input directory.
    input_dir : str, optional
        Directory to read from. Defaults to the module-level
        ``input_directory``.
    output_dir : str, optional
        Directory to write to; it is created if it does not exist. Defaults
        to the module-level ``output_directory``.

    Returns
    -------
    None
        Progress and problems are reported with ``print``. Every exception is
        caught and printed instead of being raised, so a failing file does
        not interrupt a loop over several files.
    """
    try:
        # Resolve the directories lazily: the notebook-level defaults are only
        # looked up when the caller did not pass an explicit directory.
        source_dir = input_directory if input_dir is None else input_dir
        target_dir = output_directory if output_dir is None else output_dir

        # os.path.join works whether or not the directory ends with a slash.
        df = pd.read_csv(os.path.join(source_dir, file_name))

        # Print columns for debugging
        print(f"Processing {file_name}")
        print(f"Columns: {df.columns.tolist()}")

        # Pick the CO2 column
        if file_name == "District Office.csv":
            co2_column = 'Total'
        else:
            co2_candidates = [col for col in df.columns if 'CO2' in col or 'Carbon' in col]
            if not co2_candidates:
                print(f"No CO2/Carbon column found in {file_name}")
                return
            co2_column = co2_candidates[0]

        # Pick the date column. ' Date' (leading space) is tried first; if it
        # is absent, accept a header that differs only by surrounding
        # whitespace. When nothing matches, ' Date' is kept so the selection
        # below fails with a KeyError that is reported by the handler.
        date_column = ' Date'
        if date_column not in df.columns:
            date_column = next(
                (col for col in df.columns if str(col).strip() == 'Date'),
                date_column,
            )

        df_co2 = df[[date_column, co2_column]].copy()

        # Rename columns
        df_co2.columns = ['Date', 'CO2']

        # Derive both output names from the extension-less stem. Replacing
        # '.csv' textually would leave the name unchanged for other
        # extensions, making the JSON file overwrite the CSV file.
        os.makedirs(target_dir, exist_ok=True)
        stem = os.path.splitext(file_name)[0]

        # Save to new CSV
        output_csv_file = os.path.join(target_dir, stem + '_co2.csv')
        df_co2.to_csv(output_csv_file, index=False)

        # Convert to JSON
        output_json_file = os.path.join(target_dir, stem + '_co2.json')
        with open(output_json_file, 'w') as json_file:
            json_file.write(df_co2.to_json(orient='records'))

        print(f"Processed {file_name} successfully.")

    except Exception as e:
        # Deliberate best-effort: report the failure and let the caller go on.
        print(f"Error processing {file_name}: {e}")

# Run the extraction once per configured file, in list order.
for csv_name in file_names:
    process_csv(csv_name)


Error processing Cupertino.csv: [Errno 2] No such file or directory: '/mnt/data/Cupertino.csv'
Error processing District Office.csv: [Errno 2] No such file or directory: '/mnt/data/District Office.csv'
Error processing Fremont.csv: [Errno 2] No such file or directory: '/mnt/data/Fremont.csv'
Error processing Homestead.csv: [Errno 2] No such file or directory: '/mnt/data/Homestead.csv'
Error processing Lynbrook.csv: [Errno 2] No such file or directory: '/mnt/data/Lynbrook.csv'
Error processing Monta Vista.csv: [Errno 2] No such file or directory: '/mnt/data/Monta Vista.csv'


In [4]:
import pandas as pd
import json

# Load the EV data CSV and take a first look at it.
ev_data = pd.read_csv('./fuhsd_ev_data_22_23.csv')

# First rows, then the column index.
ev_preview = ev_data.head()
print(ev_preview)
print(ev_data.columns)

# Double brackets keep the selection a one-column DataFrame, so the sum is
# printed as a Series labelled with the column name.
ghg_avoided_total = ev_data[['GHGs avoided (lbs)']].sum()
print(ghg_avoided_total)

          Day  Energy delivered (kWh)  AVG kWh delivered per session (kWh)  \
0  2023-08-01                     0.0                                  0.0   
1  2023-08-02                     0.0                                  0.0   
2  2023-08-03                     0.0                                  0.0   
3  2023-08-04                     0.0                                  0.0   
4  2023-08-05                     0.0                                  0.0   

   Max kWh delivered per session (kWh) Max kW hour (kW)  GHGs avoided (lbs)  \
0                                  0.0                -                 0.0   
1                                  0.0                -                 0.0   
2                                  0.0                -                 0.0   
3                                  0.0              7pm                 0.0   
4                                  0.0                -                 0.0   

   Gasoline avoided (Gal)  Electric miles provided (mi) 

In [15]:
# Sum the CO2 column of each processed school file and accumulate the total.
# NOTE(review): the files are read from './data_processed/', not from the
# '/mnt/data/processed/' directory used earlier in this notebook - confirm
# that the processed files actually live here.
schools = ['Cupertino', 'Fremont', 'Lynbrook', 'District Office']
total = 0
for school in schools:
    df = pd.read_csv(f'./data_processed/{school}_co2.csv')
    # Force a float dtype before summing.
    df[['CO2']] = df[['CO2']].astype(float)
    print(df.dtypes)
    # Summing the one-column frame gives a Series indexed by 'CO2', so
    # `total` becomes a Series as well after the first addition.
    school_co2 = df[['CO2']].sum()
    print(school_co2)
    total = total + school_co2

print("TOTAL IS", total)

Date     object
CO2     float64
dtype: object
CO2    2224278.99
dtype: float64
Date     object
CO2     float64
dtype: object
CO2    3651025.68
dtype: float64
Date     object
CO2     float64
dtype: object
CO2    2212113.15
dtype: float64
Date     object
CO2     float64
dtype: object
CO2    650868.99
dtype: float64
TOTAL IS CO2    8738286.81
dtype: float64
