Checking out candidate data sets, most of which are annual, country-level data (a few are global, regional, or monthly):

In [2]:
import pandas as pd

In [14]:
# Annual CO2 emissions per entity; per the original note the series reaches back as far as 1750.
# Older values are estimates -- the more recent years under consideration are treated as more accurate.
# Columns in the preview: Entity, Code, Year, Annual CO2 emissions.

co2 = pd.read_csv("./data/annual_country_co2.csv")
co2.head(5)

Unnamed: 0,Entity,Code,Year,Annual CO2 emissions
0,Afghanistan,AFG,1949,14656
1,Afghanistan,AFG,1950,84272
2,Afghanistan,AFG,1951,91600
3,Afghanistan,AFG,1952,91600
4,Afghanistan,AFG,1953,106256


In [35]:
# View only entity, year and emissions (the Code column is left out of this view).
co2.loc[:, ["Entity", "Year", "Annual CO2 emissions"]]

Unnamed: 0,Entity,Year,Annual CO2 emissions
0,Afghanistan,1949,14656
1,Afghanistan,1950,84272
2,Afghanistan,1951,91600
3,Afghanistan,1952,91600
4,Afghanistan,1953,106256
...,...,...,...
23944,Zimbabwe,2016,10737567
23945,Zimbabwe,2017,9581633
23946,Zimbabwe,2018,11854367
23947,Zimbabwe,2019,10949084


In [36]:
# Earliest year on record for each entity, sorted so the latest starters come first (top five).
(
    co2.groupby("Entity")[["Year"]]
    .min()
    .sort_values("Year", ascending=False)
    .head(5)
)

Unnamed: 0_level_0,Year
Entity,Unnamed: 1_level_1
Kosovo,2008
Timor,2002
Wallis and Futuna,2001
Marshall Islands,1992
Micronesia (country),1992


In [38]:
# Each entity's share of global annual CO2 emissions; same layout as `co2` (Entity, Code, Year, value).
# Values are percentages of world emissions, so they are effectively already scaled.

share_co2 = pd.read_csv("./data/annual-share-of-co2-emissions.csv")
share_co2.head(5)

Unnamed: 0,Entity,Code,Year,Share of global annual CO2 emissions
0,Afghanistan,AFG,1949,0.0
1,Afghanistan,AFG,1950,0.0
2,Afghanistan,AFG,1951,0.0
3,Afghanistan,AFG,1952,0.0
4,Afghanistan,AFG,1953,0.0


In [105]:
# Temperature anomaly series. Not country level: the previewed Entity is "Northern Hemisphere".
# Per the original note, the anomaly is the deviation from the 1950-1980 average temperature
# (baseline period is not verifiable from the file itself -- confirm against the data source).
# Observations are monthly; the Day values in the preview fall on the 15th of each month.
temp_anom = pd.read_csv("./data/climate-change.csv")
temp_anom.head(5)

Unnamed: 0,Entity,Code,Day,temperature_anomaly
0,Northern Hemisphere,,1880-01-15,-0.35
1,Northern Hemisphere,,1880-02-15,-0.51
2,Northern Hemisphere,,1880-03-15,-0.23
3,Northern Hemisphere,,1880-04-15,-0.3
4,Northern Hemisphere,,1880-05-15,-0.06


In [106]:
# (rows, columns) of the temperature-anomaly frame
temp_anom.shape

(5112, 4)

In [45]:
# Annual, country-level CO2 emissions per capita.
# Similar to, but not the same shape as, the first two frames (`co2` and `share_co2`).

co2_percap = pd.read_csv("./data/co-emissions-per-capita.csv")
co2_percap.head(5)

Unnamed: 0,Entity,Code,Year,Annual CO2 emissions (per capita)
0,Afghanistan,AFG,1949,0.0019
1,Afghanistan,AFG,1950,0.0109
2,Afghanistan,AFG,1951,0.0117
3,Afghanistan,AFG,1952,0.0115
4,Afghanistan,AFG,1953,0.0132


In [47]:
# Annual CO2 emissions alongside consumption-based emissions and GDP (PPP, constant 2017 international $).
# The consumption-based and GDP columns are empty (NaN) in the first rows previewed.

co2_gdp = pd.read_csv("./data/co2-emissions-and-gdp.csv")
co2_gdp.head(5)

Unnamed: 0,Entity,Code,Year,Annual CO2 emissions,Annual consumption-based CO2 emissions,"GDP, PPP (constant 2017 international $)"
0,Afghanistan,AFG,1990,2603238.0,,
1,Afghanistan,AFG,1991,2427366.0,,
2,Afghanistan,AFG,1992,1379462.0,,
3,Afghanistan,AFG,1993,1333055.0,,
4,Afghanistan,AFG,1994,1281602.0,,


In [50]:
# Annual CO2 emissions from transportation (tons of CO2, per the original note).

transport = pd.read_csv("./data/co2-emissions-transport.csv")
transport.head(5)

Unnamed: 0,Entity,Code,Year,"Transport (CAIT, 2020)"
0,Albania,ALB,1990,700000.0
1,Albania,ALB,1991,500000.0
2,Albania,ALB,1992,400000.0
3,Albania,ALB,1993,500000.0
4,Albania,ALB,1994,600000.0


In [80]:
# Annual per-capita emissions from domestic transportation, by country.
# NOTE(review): the earlier note described this as "in 2020 $'s", but the column is an emissions
# quantity; the "(CAIT, 2020)" in the column name looks like a data-source label -- confirm.

transport_percap = pd.read_csv("./data/per-capita-co2-transport.csv")
transport_percap.head(5)

Unnamed: 0,Entity,Code,Year,"Transport (per capita) (CAIT, 2020)"
0,Albania,ALB,1990,0.213025
1,Albania,ALB,1991,0.152439
2,Albania,ALB,1992,0.123229
3,Albania,ALB,1993,0.156495
4,Albania,ALB,1994,0.190658


In [53]:
# Consumption of ozone-depleting substances (ODS), in tons weighted by depleting potential.
# Years are not contiguous for every entity (the preview jumps 1989 -> 1991 -> 1995).

ozone = pd.read_csv("./data/consumption-of-ozone-depleting-substances.csv")
ozone.head(5)

Unnamed: 0,Entity,Code,Year,Consumption of Ozone-Depleting Substances - All
0,Afghanistan,AFG,1989,0.9
1,Afghanistan,AFG,1991,0.0
2,Afghanistan,AFG,1995,381.9
3,Afghanistan,AFG,1996,381.9
4,Afghanistan,AFG,1997,381.9


In [57]:
# Emissions from food by country, in CO2e (CO2 plus other substances weighted as CO2 equivalents).

food_co2e = pd.read_csv("./data/emissions-from-food.csv")
food_co2e.head(5)

Unnamed: 0,Entity,Code,Year,Food emissions by country
0,Afghanistan,AFG,1990,10442724.8
1,Afghanistan,AFG,1991,10665824.8
2,Afghanistan,AFG,1992,10805724.8
3,Afghanistan,AFG,1993,11003824.8
4,Afghanistan,AFG,1994,11286224.8


In [59]:
# Global energy consumption by source, in TWh (terawatt-hours).
# The earliest rows are spaced ten years apart (1800, 1810, ...), so at least the early part
# of the series is not annual.

energy_global = pd.read_csv("./data/global-primary-energy.csv")
energy_global.head(5)

Unnamed: 0,Entity,Code,Year,Coal (TWh; direct energy),Solar (TWh; direct energy),Oil (TWh; direct energy),Gas (TWh; direct energy),Traditional biomass (TWh; direct energy),Other renewables (TWh; direct energy),Hydropower (TWh; direct energy),Nuclear (TWh; direct energy),Wind (TWh; direct energy),Biofuels (TWh; direct energy)
0,World,OWID_WRL,1800,97,0,0,0,5556,0,0,0,0,0
1,World,OWID_WRL,1810,128,0,0,0,5833,0,0,0,0,0
2,World,OWID_WRL,1820,153,0,0,0,6111,0,0,0,0,0
3,World,OWID_WRL,1830,264,0,0,0,6389,0,0,0,0,0
4,World,OWID_WRL,1840,356,0,0,0,6944,0,0,0,0,0


In [62]:
# Annual energy consumption by source (TWh), per entity.
# The file was originally named primary-energy-source-bar.
# Entity also holds regional aggregates (e.g. "Africa", which has no Code), not only countries.

energy_country = pd.read_csv("./data/country-primary-energy.csv")
energy_country.head(5)

Unnamed: 0,Entity,Code,Year,Coal Consumption - TWh,Oil Consumption - TWh,Gas Consumption - TWh,Nuclear Consumption - TWh,Hydro Consumption - TWh,Wind Consumption - TWh,Solar Consumption - TWh,Geo Biomass Other - TWh
0,Africa,,1965,323.496138,327.333164,9.543754,0.0,38.626764,0.0,0.0,0.0
1,Africa,,1966,323.122193,358.132674,10.669916,0.0,43.083345,0.0,0.0,0.0
2,Africa,,1967,330.291585,355.281459,10.54567,0.0,44.97399,0.0,0.0,0.0
3,Africa,,1968,343.512911,374.852131,10.68897,0.0,52.606502,0.0,0.0,0.0
4,Africa,,1969,346.642922,379.973086,12.492,0.0,61.39136,0.0,0.0,0.0


In [64]:
# Only 94 distinct Entity values -- and these include regional aggregates such as "Africa",
# so the number of actual countries is lower than that.
len(pd.unique(energy_country["Entity"]))

94

In [66]:
# Summary statistics for Year: the data spans 1965 (min) through 2020 (max).
energy_country["Year"].describe()

count    5003.000000
mean     1993.409954
std        16.003587
min      1965.000000
25%      1980.000000
50%      1994.000000
75%      2007.000000
max      2020.000000
Name: Year, dtype: float64

In [75]:
# Countries with a net-zero target: the target year plus a yes/no flag.
# The file only includes countries where the answer is "Yes".

net_zero_binary = pd.read_csv("./data/net-zero-target-set.csv")
net_zero_binary.head(5)

Unnamed: 0,Entity,Code,Year,Is there a net-zero target?
0,Antigua and Barbuda,ATG,2040,Yes
1,Australia,AUS,2050,Yes
2,Austria,AUT,2040,Yes
3,Bahrain,BHR,2060,Yes
4,Barbados,BRB,2030,Yes


In [76]:
# Tally the flag column to confirm which answers are present.
net_zero_binary.loc[:, "Is there a net-zero target?"].value_counts()

Yes    66
Name: Is there a net-zero target?, dtype: int64

In [70]:
# Countries, the year of their net-zero target, and the status of that target.

net_zero_targets = pd.read_csv("./data/net-zero-targets.csv")
net_zero_targets.head(5)

Unnamed: 0,Entity,Code,Year,Status of net-zero target
0,Antigua and Barbuda,ATG,2040,In policy document
1,Australia,AUS,2050,Pledge
2,Austria,AUT,2040,In policy document
3,Bahrain,BHR,2060,Pledge
4,Barbados,BRB,2030,In policy document


In [71]:
# Number of targets under each status category.
net_zero_targets.loc[:, "Status of net-zero target"].value_counts()

In policy document    32
Pledge                14
In law                13
Achieved               7
Name: Status of net-zero target, dtype: int64

In [82]:
# Mean annual exposure to fine particulate matter (PM2.5) air pollution by country, 1990 to 2017.
# The first rows previewed are five years apart (1990, 1995, 2000, ...).

airpol = pd.read_csv("./data/PM25-air-pollution.csv")
airpol.head(5)

Unnamed: 0,Entity,Code,Year,"PM2.5 air pollution, mean annual exposure (micrograms per cubic meter)"
0,Afghanistan,AFG,1990,65.486792
1,Afghanistan,AFG,1995,65.179513
2,Afghanistan,AFG,2000,64.922462
3,Afghanistan,AFG,2005,64.522683
4,Afghanistan,AFG,2010,65.245592


In [96]:
# Annual share of deaths (age-standardized, percent) attributed to air pollution, by country, 1990-2017.

airpol_death_share = pd.read_csv("./data/share-deaths-air-pollution.csv")
airpol_death_share.head(5)

Unnamed: 0,Entity,Code,Year,Deaths - Cause: All causes - Risk: Air pollution - Sex: Both - Age: Age-standardized (Percent)
0,Afghanistan,AFG,1990,21.328446
1,Afghanistan,AFG,1991,21.01177
2,Afghanistan,AFG,1992,21.19281
3,Afghanistan,AFG,1993,21.367169
4,Afghanistan,AFG,1994,21.094811


In [99]:
# Annual age-standardized death rate attributed to outdoor air pollution, by country.

airpol_death_rate = pd.read_csv("./data/outdoor-pollution-death-rate.csv")
airpol_death_rate.head(5)

Unnamed: 0,Entity,Code,Year,Deaths - Cause: All causes - Risk: Outdoor air pollution - OWID - Sex: Both - Age: Age-standardized (Rate)
0,Afghanistan,AFG,1990,37.403786
1,Afghanistan,AFG,1991,36.093797
2,Afghanistan,AFG,1992,35.128474
3,Afghanistan,AFG,1993,35.290047
4,Afghanistan,AFG,1994,35.878601


In [100]:
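#scratch template for inspecting a single entity; `df` is a placeholder for one of the loaded frames
#df.loc[df['Entity']=='United States']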

In [104]:
#temp anomaly by region (the load below is commented out, so this file is not read here)

#pd.read_csv('./data/temperature-anomaly.csv')

In [103]:
# Annual total greenhouse-gas (GHG) emissions by country, including LUCF (per the column name).

ghg = pd.read_csv("./data/total-ghg-emissions.csv")
ghg.head(5)

Unnamed: 0,Entity,Code,Year,Total GHG emissions including LUCF (CAIT)
0,Afghanistan,AFG,1990,15140000.0
1,Afghanistan,AFG,1991,15060000.0
2,Afghanistan,AFG,1992,13600000.0
3,Afghanistan,AFG,1993,13430000.0
4,Afghanistan,AFG,1994,13240000.0
