In [1]:
# Import dependencies
import pandas as pd
# from pyxlsb import open_workbook

# from config import postgres_password
# from sqlalchemy import create_engine


# Extract Data Into DataFrames For Temperature

### NASA Climate Dataset

In [2]:
# Import data file
# This graph illustrates the change in global surface temperature relative to 1951-1980 average temperatures
nasa_file = "raw_data/nasa_land_ocean_temp.csv"

nasa_temp = pd.read_csv(nasa_file)
display(nasa_temp.head(5))
display(nasa_temp.tail(5))

Unnamed: 0,Year,No_Smoothing,Lowess(5)
0,1880,-0.16,-0.08
1,1881,-0.07,-0.12
2,1882,-0.1,-0.16
3,1883,-0.16,-0.19
4,1884,-0.27,-0.23


Unnamed: 0,Year,No_Smoothing,Lowess(5)
136,2016,1.02,0.88
137,2017,0.93,0.91
138,2018,0.85,0.95
139,2019,0.98,0.98
140,2020,1.02,1.01


# Transform Data for Energy and Emission

### NASA Climate Dataset

In [3]:
# Extract the wanted columns
list(nasa_temp.columns)

['Year', 'No_Smoothing', 'Lowess(5)']

In [4]:
# Lowess smooths the data, no_smoothing 
nasa_temp_df = nasa_temp[["Year", "No_Smoothing", "Lowess(5)"]]
nasa_temp_df.head()

Unnamed: 0,Year,No_Smoothing,Lowess(5)
0,1880,-0.16,-0.08
1,1881,-0.07,-0.12
2,1882,-0.1,-0.16
3,1883,-0.16,-0.19
4,1884,-0.27,-0.23


In [5]:
# Extract year from 1965 to the most recent
nasa_temp_new_df = nasa_temp_df[nasa_temp_df["Year"]>1964]
nasa_temp_new_df.head()

Unnamed: 0,Year,No_Smoothing,Lowess(5)
85,1965,-0.11,-0.05
86,1966,-0.06,-0.06
87,1967,-0.02,-0.05
88,1968,-0.08,-0.03
89,1969,0.05,-0.02


In [6]:
nasa_temp_new_df.reset_index(drop=True).head()

Unnamed: 0,Year,No_Smoothing,Lowess(5)
0,1965,-0.11,-0.05
1,1966,-0.06,-0.06
2,1967,-0.02,-0.05
3,1968,-0.08,-0.03
4,1969,0.05,-0.02


### Kaggle Temperature Change Dataset

In [7]:
# Import kaggle data
kaggle_temp = "raw_data/Environment_Temperature_change_E_All_Data_NOFLAG.csv"
kaggle_temp = pd.read_csv(kaggle_temp, encoding="ISO-8859-1")
kaggle_temp.head(5)

Unnamed: 0,Area Code,Area,Months Code,Months,Element Code,Element,Unit,Y1961,Y1962,Y1963,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
0,2,Afghanistan,7001,January,7271,Temperature change,°C,0.777,0.062,2.744,...,3.601,1.179,-0.583,1.233,1.755,1.943,3.416,1.201,1.996,2.951
1,2,Afghanistan,7001,January,6078,Standard Deviation,°C,1.95,1.95,1.95,...,1.95,1.95,1.95,1.95,1.95,1.95,1.95,1.95,1.95,1.95
2,2,Afghanistan,7002,February,7271,Temperature change,°C,-1.743,2.465,3.919,...,1.212,0.321,-3.201,1.494,-3.187,2.699,2.251,-0.323,2.705,0.086
3,2,Afghanistan,7002,February,6078,Standard Deviation,°C,2.597,2.597,2.597,...,2.597,2.597,2.597,2.597,2.597,2.597,2.597,2.597,2.597,2.597
4,2,Afghanistan,7003,March,7271,Temperature change,°C,0.516,1.336,0.403,...,3.39,0.748,-0.527,2.246,-0.076,-0.497,2.296,0.834,4.418,0.234


In [8]:
cleaned_temp = kaggle_temp.drop(columns=['Area Code', 'Months Code', 'Element Code', 'Y1961', 'Y1962','Y1963', 'Y1964'])
cleaned_temp.head(5)

Unnamed: 0,Area,Months,Element,Unit,Y1965,Y1966,Y1967,Y1968,Y1969,Y1970,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
0,Afghanistan,January,Temperature change,°C,1.868,3.629,-1.432,0.389,-2.298,0.804,...,3.601,1.179,-0.583,1.233,1.755,1.943,3.416,1.201,1.996,2.951
1,Afghanistan,January,Standard Deviation,°C,1.95,1.95,1.95,1.95,1.95,1.95,...,1.95,1.95,1.95,1.95,1.95,1.95,1.95,1.95,1.95,1.95
2,Afghanistan,February,Temperature change,°C,-0.096,3.397,0.296,-2.055,-3.167,1.809,...,1.212,0.321,-3.201,1.494,-3.187,2.699,2.251,-0.323,2.705,0.086
3,Afghanistan,February,Standard Deviation,°C,2.597,2.597,2.597,2.597,2.597,2.597,...,2.597,2.597,2.597,2.597,2.597,2.597,2.597,2.597,2.597,2.597
4,Afghanistan,March,Temperature change,°C,-0.909,-0.069,-0.759,0.496,2.481,-0.915,...,3.39,0.748,-0.527,2.246,-0.076,-0.497,2.296,0.834,4.418,0.234


In [9]:
# Extract only temperature change data
new_kaggle = cleaned_temp[cleaned_temp["Element"]=="Temperature change"]
new_kaggle

Unnamed: 0,Area,Months,Element,Unit,Y1965,Y1966,Y1967,Y1968,Y1969,Y1970,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
0,Afghanistan,January,Temperature change,°C,1.868,3.629,-1.432,0.389,-2.298,0.804,...,3.601,1.179,-0.583,1.233,1.755,1.943,3.416,1.201,1.996,2.951
2,Afghanistan,February,Temperature change,°C,-0.096,3.397,0.296,-2.055,-3.167,1.809,...,1.212,0.321,-3.201,1.494,-3.187,2.699,2.251,-0.323,2.705,0.086
4,Afghanistan,March,Temperature change,°C,-0.909,-0.069,-0.759,0.496,2.481,-0.915,...,3.390,0.748,-0.527,2.246,-0.076,-0.497,2.296,0.834,4.418,0.234
6,Afghanistan,April,Temperature change,°C,-1.816,-1.192,-1.496,-0.590,-0.770,1.439,...,2.591,1.712,1.417,-0.052,0.585,1.589,0.980,1.252,1.442,0.899
8,Afghanistan,May,Temperature change,°C,-0.190,-0.192,-1.307,-1.841,-0.977,1.864,...,1.419,3.643,0.909,1.201,0.959,1.862,3.246,3.280,0.855,0.647
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9646,OECD,DecJanFeb,Temperature change,°C,-0.732,-0.274,-0.165,-0.018,-0.188,0.400,...,1.272,0.770,1.709,1.327,0.686,1.307,2.636,1.884,1.453,1.527
9648,OECD,MarAprMay,Temperature change,°C,-0.110,-0.078,-0.334,0.285,-0.080,-0.249,...,1.742,0.390,1.442,0.475,0.778,1.191,1.928,1.237,1.241,1.352
9650,OECD,JunJulAug,Temperature change,°C,-0.495,-0.015,-0.184,-0.437,0.022,0.240,...,1.012,0.954,1.061,1.119,0.779,0.958,1.303,1.081,1.078,1.078
9652,OECD,SepOctNov,Temperature change,°C,-0.203,-0.295,0.321,0.220,-0.027,-0.146,...,0.958,1.106,0.885,1.041,0.999,1.670,1.535,1.194,0.581,1.233


In [10]:
new_kaggle.reset_index(drop=True)

Unnamed: 0,Area,Months,Element,Unit,Y1965,Y1966,Y1967,Y1968,Y1969,Y1970,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
0,Afghanistan,January,Temperature change,°C,1.868,3.629,-1.432,0.389,-2.298,0.804,...,3.601,1.179,-0.583,1.233,1.755,1.943,3.416,1.201,1.996,2.951
1,Afghanistan,February,Temperature change,°C,-0.096,3.397,0.296,-2.055,-3.167,1.809,...,1.212,0.321,-3.201,1.494,-3.187,2.699,2.251,-0.323,2.705,0.086
2,Afghanistan,March,Temperature change,°C,-0.909,-0.069,-0.759,0.496,2.481,-0.915,...,3.390,0.748,-0.527,2.246,-0.076,-0.497,2.296,0.834,4.418,0.234
3,Afghanistan,April,Temperature change,°C,-1.816,-1.192,-1.496,-0.590,-0.770,1.439,...,2.591,1.712,1.417,-0.052,0.585,1.589,0.980,1.252,1.442,0.899
4,Afghanistan,May,Temperature change,°C,-0.190,-0.192,-1.307,-1.841,-0.977,1.864,...,1.419,3.643,0.909,1.201,0.959,1.862,3.246,3.280,0.855,0.647
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4823,OECD,DecJanFeb,Temperature change,°C,-0.732,-0.274,-0.165,-0.018,-0.188,0.400,...,1.272,0.770,1.709,1.327,0.686,1.307,2.636,1.884,1.453,1.527
4824,OECD,MarAprMay,Temperature change,°C,-0.110,-0.078,-0.334,0.285,-0.080,-0.249,...,1.742,0.390,1.442,0.475,0.778,1.191,1.928,1.237,1.241,1.352
4825,OECD,JunJulAug,Temperature change,°C,-0.495,-0.015,-0.184,-0.437,0.022,0.240,...,1.012,0.954,1.061,1.119,0.779,0.958,1.303,1.081,1.078,1.078
4826,OECD,SepOctNov,Temperature change,°C,-0.203,-0.295,0.321,0.220,-0.027,-0.146,...,0.958,1.106,0.885,1.041,0.999,1.670,1.535,1.194,0.581,1.233


In [11]:
# Drop quarters and Meteorological year
# A typical meteorological year (TMY) is a set of meteorological data with data values for every hour 
# in a year for a given geographical location. The data are selected from hourly data in a longer time period 
# (normally 10 years or more). For each month in the year the data have been selected from the year that was considered most 
# "typical" for that month. For instance, January might be from 2007, February from 2012 and so on.
delete_me = new_kaggle[new_kaggle['Months'] == "MarAprMay"].index
new_kaggle.drop(delete_me , inplace=True)
delete_me1 = new_kaggle[new_kaggle['Months'] == "JunJulAug"].index
new_kaggle.drop(delete_me1 , inplace=True)
delete_me2 = new_kaggle[new_kaggle['Months'] == "SepOctNov"].index
new_kaggle.drop(delete_me2 , inplace=True)
delete_me2 = new_kaggle[new_kaggle['Months'] == "DecJanFeb"].index
new_kaggle.drop(delete_me2 , inplace=True)
delete_me3 = new_kaggle[new_kaggle['Months'] == "Meteorological year"].index
new_kaggle.drop(delete_me3 , inplace=True)

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  return super().drop(


In [12]:
# Find average change for one country for 1 year
# areas = new_kaggle['Area']
# years = new_kaggle['']

# unique_countries = new_kaggle['Area'].unique()
# unique_countries

In [13]:
# countries

In [14]:
test_kaggle  = new_kaggle.drop(columns=['Months', 'Element', 'Unit'])
test_kaggle.head()

Unnamed: 0,Area,Y1965,Y1966,Y1967,Y1968,Y1969,Y1970,Y1971,Y1972,Y1973,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
0,Afghanistan,1.868,3.629,-1.432,0.389,-2.298,0.804,-1.487,-1.305,-2.951,...,3.601,1.179,-0.583,1.233,1.755,1.943,3.416,1.201,1.996,2.951
2,Afghanistan,-0.096,3.397,0.296,-2.055,-3.167,1.809,0.816,-7.722,1.838,...,1.212,0.321,-3.201,1.494,-3.187,2.699,2.251,-0.323,2.705,0.086
4,Afghanistan,-0.909,-0.069,-0.759,0.496,2.481,-0.915,1.658,-1.784,-0.473,...,3.39,0.748,-0.527,2.246,-0.076,-0.497,2.296,0.834,4.418,0.234
6,Afghanistan,-1.816,-1.192,-1.496,-0.59,-0.77,1.439,1.534,-0.602,1.106,...,2.591,1.712,1.417,-0.052,0.585,1.589,0.98,1.252,1.442,0.899
8,Afghanistan,-0.19,-0.192,-1.307,-1.841,-0.977,1.864,2.045,-1.051,0.724,...,1.419,3.643,0.909,1.201,0.959,1.862,3.246,3.28,0.855,0.647


In [15]:
# Mean of all countries/regions for each year
mean_data = test_kaggle.mean(axis=0)
all_mean_df = pd.DataFrame(mean_data)
all_mean_df.columns = ['mean_temp_change']
all_mean_df.head()

Unnamed: 0,mean_temp_change
Y1965,-0.21136
Y1966,0.093431
Y1967,-0.142026
Y1968,-0.154508
Y1969,0.101002


In [16]:
all_mean_df.reset_index(drop=False)

Unnamed: 0,index,mean_temp_change
0,Y1965,-0.21136
1,Y1966,0.093431
2,Y1967,-0.142026
3,Y1968,-0.154508
4,Y1969,0.101002
5,Y1970,0.068726
6,Y1971,-0.171902
7,Y1972,-0.044497
8,Y1973,0.182226
9,Y1974,-0.12071


In [17]:
all_mean_df.index.names = ['Year']

In [18]:
all_mean_df.head()

Unnamed: 0_level_0,mean_temp_change
Year,Unnamed: 1_level_1
Y1965,-0.21136
Y1966,0.093431
Y1967,-0.142026
Y1968,-0.154508
Y1969,0.101002


In [19]:
new_mean = all_mean_df.reset_index(drop=False)

In [20]:
original = "Y1965"
original1 = new_mean['Year']
# newstr = original.replace("Y", "")

years = []
x = 0
for year in original1:
    newyear = year.replace("Y", "")
    years.append(newyear)
    x = x+1


In [21]:
years
temp_change = new_mean['mean_temp_change']

In [22]:
annual_mean = pd.DataFrame(years, temp_change)
annual_mean.head()

Unnamed: 0_level_0,0
mean_temp_change,Unnamed: 1_level_1
-0.21136,1965
0.093431,1966
-0.142026,1967
-0.154508,1968
0.101002,1969


In [23]:
annual_mean.reset_index(drop=False)

Unnamed: 0,mean_temp_change,0
0,-0.21136,1965
1,0.093431,1966
2,-0.142026,1967
3,-0.154508,1968
4,0.101002,1969
5,0.068726,1970
6,-0.171902,1971
7,-0.044497,1972
8,0.182226,1973
9,-0.12071,1974


In [24]:
annual_mean['Year'] = annual_mean[0]

In [25]:
cleaned_mean = annual_mean.drop(columns=[0])

In [26]:
cleaned_mean.reset_index(drop=False)

Unnamed: 0,mean_temp_change,Year
0,-0.21136,1965
1,0.093431,1966
2,-0.142026,1967
3,-0.154508,1968
4,0.101002,1969
5,0.068726,1970
6,-0.171902,1971
7,-0.044497,1972
8,0.182226,1973
9,-0.12071,1974


In [27]:
cleaned_mean['Year']=cleaned_mean['Year'].astype(int)

In [28]:
# test_mean = cleaned_mean.drop(columns='year')

In [29]:
test_mean = cleaned_mean.rename(columns = {'index':'mean_temp_change'})
test_mean.head()

Unnamed: 0_level_0,Year
mean_temp_change,Unnamed: 1_level_1
-0.21136,1965
0.093431,1966
-0.142026,1967
-0.154508,1968
0.101002,1969


In [30]:
test_mean.reset_index(drop=False, inplace=True)

In [31]:
# nasa_temp_new_df.dtypes
test_mean.dtypes

mean_temp_change    float64
Year                  int32
dtype: object

In [32]:
# Merge temperatures and NASA data
merged_df = nasa_temp_new_df.merge(test_mean, on='Year', how='right')
merged_df.head()

Unnamed: 0,Year,No_Smoothing,Lowess(5),mean_temp_change
0,1965,-0.11,-0.05,-0.21136
1,1966,-0.06,-0.06,0.093431
2,1967,-0.02,-0.05,-0.142026
3,1968,-0.08,-0.03,-0.154508
4,1969,0.05,-0.02,0.101002


In [33]:
output = merged_df.to_csv("nasa_kaggle_temp_merged")

In [34]:
afg = new_kaggle[new_kaggle['Area']== "Afghanistan"]
afg.head()

Unnamed: 0,Area,Months,Element,Unit,Y1965,Y1966,Y1967,Y1968,Y1969,Y1970,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
0,Afghanistan,January,Temperature change,°C,1.868,3.629,-1.432,0.389,-2.298,0.804,...,3.601,1.179,-0.583,1.233,1.755,1.943,3.416,1.201,1.996,2.951
2,Afghanistan,February,Temperature change,°C,-0.096,3.397,0.296,-2.055,-3.167,1.809,...,1.212,0.321,-3.201,1.494,-3.187,2.699,2.251,-0.323,2.705,0.086
4,Afghanistan,March,Temperature change,°C,-0.909,-0.069,-0.759,0.496,2.481,-0.915,...,3.39,0.748,-0.527,2.246,-0.076,-0.497,2.296,0.834,4.418,0.234
6,Afghanistan,April,Temperature change,°C,-1.816,-1.192,-1.496,-0.59,-0.77,1.439,...,2.591,1.712,1.417,-0.052,0.585,1.589,0.98,1.252,1.442,0.899
8,Afghanistan,May,Temperature change,°C,-0.19,-0.192,-1.307,-1.841,-0.977,1.864,...,1.419,3.643,0.909,1.201,0.959,1.862,3.246,3.28,0.855,0.647


In [35]:
len(afg)

12

In [36]:
(afg['Y1965']).mean()

0.010000000000000009

In [37]:
# Get temperatures for 
grouped_df = new_kaggle.groupby(new_kaggle['Area']).mean()

In [38]:
grouped_df.head()

Unnamed: 0_level_0,Y1965,Y1966,Y1967,Y1968,Y1969,Y1970,Y1971,Y1972,Y1973,Y1974,...,Y2010,Y2011,Y2012,Y2013,Y2014,Y2015,Y2016,Y2017,Y2018,Y2019
Area,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Afghanistan,0.01,0.241417,-0.362667,-0.339417,-0.330667,0.676667,0.837417,-1.505417,0.329417,-0.554917,...,1.472167,1.206083,0.212167,1.257833,0.492417,1.099333,1.75475,1.233417,1.596,0.902417
Africa,-0.194667,0.15025,-0.228167,-0.166583,0.348833,0.168667,-0.219833,0.065083,0.32725,-0.268917,...,1.508667,0.8695,0.828917,0.9975,1.05475,1.207833,1.50125,1.174,1.242,1.433417
Albania,-0.348833,0.422583,-0.076083,0.056417,-0.043417,-0.05425,-0.264583,-0.139167,-0.24325,-0.187583,...,1.173167,1.143917,1.475667,1.56125,1.4945,1.67475,1.582167,1.449583,2.195667,2.078333
Algeria,-0.031917,0.28575,-0.093,0.08675,0.150083,0.167,-0.4085,-0.453167,-0.007167,-0.48175,...,2.323667,1.296833,1.267417,1.206583,1.772,1.31075,1.929333,1.472167,1.437083,1.31675
American Samoa,-0.3885,0.115,-0.360083,-0.137583,0.08625,-0.13825,-0.372333,0.115833,0.267583,-0.16125,...,1.013833,0.8868,0.9576,1.1708,1.084444,0.822222,1.527778,1.272222,1.127778,1.45


In [46]:
transformed_group = grouped_df.T

In [47]:
transformed_group = transformed_group.reset_index(drop=False)

In [48]:
transformed_group = transformed_group.rename(columns = {'index':'Year'})
transformed_group

Area,Year,Afghanistan,Africa,Albania,Algeria,American Samoa,Americas,Andorra,Angola,Anguilla,...,Wallis and Futuna Islands,Western Africa,Western Asia,Western Europe,Western Sahara,World,Yemen,Yugoslav SFR,Zambia,Zimbabwe
0,Y1965,0.01,-0.194667,-0.348833,-0.031917,-0.3885,-0.167583,-0.26925,-0.139833,-0.235833,...,-0.344833,-0.331667,-0.026833,-0.52875,-0.281417,-0.148167,-0.554583,-0.444583,-0.345833,-0.244083
1,Y1966,0.241417,0.15025,0.422583,0.28575,0.115,-0.13975,0.355833,0.20675,-0.009333,...,0.006667,0.1115,0.744,0.378167,0.267917,0.159,0.062,0.55675,0.290833,0.165333
2,Y1967,-0.362667,-0.228167,-0.076083,-0.093,-0.360083,-0.056,0.357333,-0.114667,-0.29475,...,-0.230167,-0.281,-0.734417,0.47625,-0.079917,-0.1135,-0.235083,0.1715,-0.081917,-0.121333
3,Y1968,-0.339417,-0.166583,0.056417,0.08675,-0.137583,-0.09025,0.198083,-0.160333,-0.1875,...,-0.095333,-0.063667,-0.198083,-0.011083,-0.141417,-0.10875,-0.151167,0.144667,-0.128417,0.08925
4,Y1969,-0.330667,0.348833,-0.043417,0.150083,0.08625,0.27825,-0.363667,0.2075,0.27025,...,-0.233833,0.540917,0.345,-0.21675,0.250917,-0.0445,0.18325,-0.28875,0.240583,0.101917
5,Y1970,0.676667,0.168667,-0.05425,0.167,-0.13825,-0.010417,0.120583,0.209167,-0.011667,...,0.039167,0.24125,0.3425,-0.18225,0.5565,0.081833,0.3455,-0.100417,0.334583,0.577333
6,Y1971,0.837417,-0.219833,-0.264583,-0.4085,-0.372333,-0.24175,-0.095167,-0.180333,-0.361667,...,-0.062667,-0.083333,-0.308583,0.13875,-0.63625,-0.048833,-0.25525,-0.109417,-0.243917,-0.110333
7,Y1972,-1.505417,0.065083,-0.139167,-0.453167,0.115833,-0.48025,-0.510083,0.035667,-0.195583,...,-0.02825,0.173,-0.558583,-0.276833,-1.145667,-0.215917,0.107333,0.033833,-0.009583,-0.213167
8,Y1973,0.329417,0.32725,-0.24325,-0.007167,0.267583,0.269,-0.090583,0.385667,-0.0225,...,0.3365,0.538333,-0.05775,0.026167,-0.007,0.277083,0.249917,-0.292333,0.177583,0.284083
9,Y1974,-0.554917,-0.268917,-0.187583,-0.48175,-0.16125,-0.283833,-0.195833,-0.207,-0.42175,...,0.09725,-0.276583,-0.22975,0.3945,-0.4535,-0.193917,-0.123667,0.130167,-0.426583,-0.497417


In [49]:
original2 = transformed_group['Year']
years1 = []
x = 0
for year in original2:
    newyear1 = year.replace("Y", "")
    years1.append(newyear1)
    x = x+1

In [50]:
transformed_group['Year'] = years1

In [55]:
transformed_group.head()

Area,Year,Afghanistan,Africa,Albania,Algeria,American Samoa,Americas,Andorra,Angola,Anguilla,...,Wallis and Futuna Islands,Western Africa,Western Asia,Western Europe,Western Sahara,World,Yemen,Yugoslav SFR,Zambia,Zimbabwe
0,1965,0.01,-0.194667,-0.348833,-0.031917,-0.3885,-0.167583,-0.26925,-0.139833,-0.235833,...,-0.344833,-0.331667,-0.026833,-0.52875,-0.281417,-0.148167,-0.554583,-0.444583,-0.345833,-0.244083
1,1966,0.241417,0.15025,0.422583,0.28575,0.115,-0.13975,0.355833,0.20675,-0.009333,...,0.006667,0.1115,0.744,0.378167,0.267917,0.159,0.062,0.55675,0.290833,0.165333
2,1967,-0.362667,-0.228167,-0.076083,-0.093,-0.360083,-0.056,0.357333,-0.114667,-0.29475,...,-0.230167,-0.281,-0.734417,0.47625,-0.079917,-0.1135,-0.235083,0.1715,-0.081917,-0.121333
3,1968,-0.339417,-0.166583,0.056417,0.08675,-0.137583,-0.09025,0.198083,-0.160333,-0.1875,...,-0.095333,-0.063667,-0.198083,-0.011083,-0.141417,-0.10875,-0.151167,0.144667,-0.128417,0.08925
4,1969,-0.330667,0.348833,-0.043417,0.150083,0.08625,0.27825,-0.363667,0.2075,0.27025,...,-0.233833,0.540917,0.345,-0.21675,0.250917,-0.0445,0.18325,-0.28875,0.240583,0.101917


In [None]:
output1 = transformed_group()