# Importing Modules

In [54]:
import pandas as pd
import numpy as np

# Data Preprocessing

## Importing Dataset

In [57]:
# Load the "Figure 5" sheet of the emissions projections workbook.
# The first column supplies the row labels; the first two rows and the last
# two rows of the sheet are skipped (presumably title/notes rows - TODO confirm).
emissions = pd.read_excel(
    "Data/australias-emissions-projections-2024-chart-data.xlsx",
    sheet_name="Figure 5",
    index_col=0,
    skiprows=2,
    skipfooter=2,
)

emissions

Unnamed: 0,1990,1991,1992,1993,1994,1995,1996,1997,1998,1999,...,2031,2032,2033,2034,2035,2036,2037,2038,2039,2040
Electricity,129.53,131.68,134.54,135.46,137.03,142.65,147.68,152.71,165.34,171.99,...,58.98,52.84,49.09,50.34,36.81,35.03,33.56,33.02,33.39,29.23
Stationary energy,66.17,66.95,67.47,69.37,69.35,71.24,71.25,73.21,73.35,74.46,...,93.53,90.77,87.81,83.75,80.08,75.78,72.87,70.76,69.28,67.71
Transport,61.37,60.8,61.81,63.38,64.87,68.22,70.09,71.39,71.6,72.43,...,93.42,91.67,90.12,88.53,86.99,85.46,84.01,82.62,81.28,80.06
Fugitives,40.31,39.66,41.6,40.43,38.25,39.93,39.48,42.49,43.73,40.55,...,44.83,43.0,41.31,39.1,38.01,36.61,34.15,33.62,32.53,31.6
Agriculture,94.96,94.38,91.51,88.87,88.78,85.39,87.27,88.43,88.49,88.28,...,83.33,83.45,83.55,83.64,83.71,83.79,83.87,83.95,84.03,84.12
Industrial processes,25.11,24.31,24.89,24.64,24.89,24.65,24.34,24.42,25.47,25.91,...,26.59,25.78,25.29,24.69,23.97,23.02,22.31,21.52,20.87,20.11
Waste,23.46,23.38,23.12,22.93,22.16,22.09,20.22,19.91,19.09,19.21,...,12.94,12.84,12.8,12.75,12.71,12.67,12.63,12.59,12.56,12.53
LULUCF,178.27,157.77,113.48,92.16,81.79,60.7,55.73,41.82,44.98,59.47,...,-64.28,-63.96,-63.67,-62.25,-60.84,-59.43,-58.05,-56.68,-55.38,-54.08


In [58]:
# Swap rows and columns so that each row is a year and each column a sector.
# NOTE: this rebinds `emissions`, so running the cell a second time flips the
# frame back to its original orientation.

emissions = emissions.transpose()

In [59]:
# Name the row index "Year" (after the transpose the row labels are the years).

emissions = emissions.rename_axis("Year", axis="index")

In [60]:
# Make the column names consistent by capitalising the first letter of each word.
# Only the two sector names that are not already in that form need a mapping.

column_name_dict = {
    "Stationary energy": "Stationary Energy",
    "Industrial processes": "Industrial Processes",
}
emissions = emissions.rename(columns=column_name_dict)

emissions

Unnamed: 0_level_0,Electricity,Stationary Energy,Transport,Fugitives,Agriculture,Industrial Processes,Waste,LULUCF
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
1990,129.53,66.17,61.37,40.31,94.96,25.11,23.46,178.27
1991,131.68,66.95,60.8,39.66,94.38,24.31,23.38,157.77
1992,134.54,67.47,61.81,41.6,91.51,24.89,23.12,113.48
1993,135.46,69.37,63.38,40.43,88.87,24.64,22.93,92.16
1994,137.03,69.35,64.87,38.25,88.78,24.89,22.16,81.79
1995,142.65,71.24,68.22,39.93,85.39,24.65,22.09,60.7
1996,147.68,71.25,70.09,39.48,87.27,24.34,20.22,55.73
1997,152.71,73.21,71.39,42.49,88.43,24.42,19.91,41.82
1998,165.34,73.35,71.6,43.73,88.49,25.47,19.09,44.98
1999,171.99,74.46,72.43,40.55,88.28,25.91,19.21,59.47


In [61]:
# Create a Total Emissions column: the row-wise sum of every sector column
# (LULUCF included).
# Any existing "Total Emissions" column is left out of the sum, so re-running
# this cell does not add the previous total into the new one.

sector_emissions = emissions.drop(columns="Total Emissions", errors="ignore")
emissions["Total Emissions"] = sector_emissions.sum(axis=1)

emissions

Unnamed: 0_level_0,Electricity,Stationary Energy,Transport,Fugitives,Agriculture,Industrial Processes,Waste,LULUCF,Total Emissions
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1990,129.53,66.17,61.37,40.31,94.96,25.11,23.46,178.27,619.18
1991,131.68,66.95,60.8,39.66,94.38,24.31,23.38,157.77,598.93
1992,134.54,67.47,61.81,41.6,91.51,24.89,23.12,113.48,558.42
1993,135.46,69.37,63.38,40.43,88.87,24.64,22.93,92.16,537.24
1994,137.03,69.35,64.87,38.25,88.78,24.89,22.16,81.79,527.12
1995,142.65,71.24,68.22,39.93,85.39,24.65,22.09,60.7,514.87
1996,147.68,71.25,70.09,39.48,87.27,24.34,20.22,55.73,516.06
1997,152.71,73.21,71.39,42.49,88.43,24.42,19.91,41.82,514.38
1998,165.34,73.35,71.6,43.73,88.49,25.47,19.09,44.98,532.05
1999,171.99,74.46,72.43,40.55,88.28,25.91,19.21,59.47,552.3


In [62]:
# Keep only the years used for the analysis.
# .loc slices by label, so both end points (1990 and 2023) are included.

emissions_1990_2023 = emissions.loc[1990:2023, :]

emissions_1990_2023

Unnamed: 0_level_0,Electricity,Stationary Energy,Transport,Fugitives,Agriculture,Industrial Processes,Waste,LULUCF,Total Emissions
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1990,129.53,66.17,61.37,40.31,94.96,25.11,23.46,178.27,619.18
1991,131.68,66.95,60.8,39.66,94.38,24.31,23.38,157.77,598.93
1992,134.54,67.47,61.81,41.6,91.51,24.89,23.12,113.48,558.42
1993,135.46,69.37,63.38,40.43,88.87,24.64,22.93,92.16,537.24
1994,137.03,69.35,64.87,38.25,88.78,24.89,22.16,81.79,527.12
1995,142.65,71.24,68.22,39.93,85.39,24.65,22.09,60.7,514.87
1996,147.68,71.25,70.09,39.48,87.27,24.34,20.22,55.73,516.06
1997,152.71,73.21,71.39,42.49,88.43,24.42,19.91,41.82,514.38
1998,165.34,73.35,71.6,43.73,88.49,25.47,19.09,44.98,532.05
1999,171.99,74.46,72.43,40.55,88.28,25.91,19.21,59.47,552.3


In [63]:
# Put the columns into the order wanted for the exported table
emissions_1990_2023 = emissions_1990_2023.loc[
    :,
    [
        "Electricity",
        "Agriculture",
        "Stationary Energy",
        "Transport",
        "Fugitives",
        "Industrial Processes",
        "Waste",
        "LULUCF",
        "Total Emissions",
    ],
]

emissions_1990_2023

Unnamed: 0_level_0,Electricity,Agriculture,Stationary Energy,Transport,Fugitives,Industrial Processes,Waste,LULUCF,Total Emissions
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1990,129.53,94.96,66.17,61.37,40.31,25.11,23.46,178.27,619.18
1991,131.68,94.38,66.95,60.8,39.66,24.31,23.38,157.77,598.93
1992,134.54,91.51,67.47,61.81,41.6,24.89,23.12,113.48,558.42
1993,135.46,88.87,69.37,63.38,40.43,24.64,22.93,92.16,537.24
1994,137.03,88.78,69.35,64.87,38.25,24.89,22.16,81.79,527.12
1995,142.65,85.39,71.24,68.22,39.93,24.65,22.09,60.7,514.87
1996,147.68,87.27,71.25,70.09,39.48,24.34,20.22,55.73,516.06
1997,152.71,88.43,73.21,71.39,42.49,24.42,19.91,41.82,514.38
1998,165.34,88.49,73.35,71.6,43.73,25.47,19.09,44.98,532.05
1999,171.99,88.28,74.46,72.43,40.55,25.91,19.21,59.47,552.3


In [64]:
# Save the 1990-2023 table as a CSV file; the Year index is written as the
# first column (to_csv includes the index by default).
# NOTE(review): the workbook is read from "Data/" (capital D) while this writes
# to "data/"; on a case-sensitive filesystem these are different directories -
# confirm which one is intended.

emissions_1990_2023.to_csv(path_or_buf="data/emissions_1990_2023.csv")