# Merging a Column Subset of the LAP, P5V, and GDP Tables

## Function Definitions

In [1]:
def read_file(file_string):
    """Read a comma-separated text file into a list of rows, skipping the header.

    The first line of the file is treated as a header and discarded. Every
    remaining line is stripped of surrounding whitespace and split on ","
    (a plain split: quoted fields containing commas are NOT handled).

    Parameters
    ----------
    file_string : str
        Path of the file to read.

    Returns
    -------
    list[list[str]]
        One list of string fields per data line, in file order. A blank
        line yields ``['']``; a file with only a header (or nothing) yields
        an empty list.
    """
    # The context manager closes the file even if reading raises.
    with open(file_string, "r") as f:
        next(f, None)  # discard the header line (no-op on an empty file)
        return [line.strip().split(",") for line in f]

## Read In the Three Tables

### LAP

In [2]:
# Load the LAP table as a list of rows (each row a list of strings).
# read_file discards the file's header line, so column names are not kept here.
lap = read_file("LAP.csv")

In [3]:
import pandas as pd
# Label every positional field of the raw LAP rows, then immediately keep
# only the columns used later; the selection list also fixes column order.
pd_lap = pd.DataFrame(
    data=lap,
    columns=[
        'title', 'type', 'geography', 'geography iso', 'frameworks',
        'responses', 'instruments', 'document types', 'natural Hazards',
        'keywords', 'sectors', 'd', 'm', 'year', 'events',
        'x1', 'x2', 'x3', 'x4', 'x5', 'x6', 'x7', 'x8',
    ],
)[['title', 'geography', 'geography iso', 'year', 'type', 'responses', 'document types', 'sectors']]

In [4]:
# Remove pandas' display limits so no columns or rows are elided in output,
# then preview the first rows of the LAP frame.
pd.options.display.max_columns = None
pd.options.display.max_rows = None
pd_lap.head()

Unnamed: 0,title,geography,geography iso,year,type,responses,document types,sectors
0,Energy Sector Strategy 1387-1391 (2007/8-2012/3),Afghanistan,AFG,2008,executive,Mitigation,Strategy,Energy
1,Rural Renewable Energy Policy (RREP),Afghanistan,AFG,2013,executive,Adaptation,Policy,Energy
2,National Forestry Management Policy (NFMP),Afghanistan,AFG,2007,executive,Adaptation; Mitigation,Policy,Economy-wide
3,Strategic National Action Plan for Disaster Ri...,Afghanistan,AFG,2011,executive,Adaptation; Disaster Risk Management,Plan,
4,The National Environmental Action Plan (NEAP),Afghanistan,AFG,2009,executive,Adaptation,Plan,


### P5V

In [5]:
# Load the P5V table as a list of rows (each row a list of strings).
# read_file discards the file's header line, so column names are not kept here.
p5v = read_file("P5V.csv")

In [6]:
import pandas as pd
# Label every positional field of the raw P5V rows, then immediately keep
# only the identifier, merge-key and polity2 columns used later.
pd_p5v = pd.DataFrame(
    data=p5v,
    columns=[
        'p5', 'cyear', 'ccode', 'geography iso', 'country', 'year', 'flag',
        'fragment', 'democ', 'autoc', 'polity', 'polity2', 'durable',
        'xrreg', 'xrcomp', 'xropen', 'xconst', 'parreg', 'parcomp', 'exrec',
        'exconst', 'polcomp', 'prior', 'emonth', 'eday', 'eyear', 'eprec',
        'interim', 'bmonth', 'bday', 'byear', 'bprec', 'post', 'change',
        'd5', 'sf', 'regtrans',
    ],
)[['p5', 'cyear', 'geography iso', 'year', 'polity2']]

In [7]:
# Remove pandas' display limits so no columns or rows are elided in output,
# then preview the first rows of the P5V frame.
pd.options.display.max_columns = None
pd.options.display.max_rows = None
pd_p5v.head()

Unnamed: 0,p5,cyear,geography iso,year,polity2
0,0,7001800,AFG,1800,-6
1,0,7001801,AFG,1801,-6
2,0,7001802,AFG,1802,-6
3,0,7001803,AFG,1803,-6
4,0,7001804,AFG,1804,-6


### GDP

In [8]:
# Load the GDP table as a list of rows (each row a list of strings).
# read_file discards the file's header line, so column names are not kept here.
gdp = read_file("GDP.csv")

In [9]:
# Reshape the GDP rows from wide form (one row per country code, one value
# column per year) into long records of [country code, year, GDP value].
# Every field is passed through str() so the records stay plain strings.
GDP_META_COLS = 4      # leading non-value columns in each wide row
GDP_FIRST_YEAR = 1960  # year assigned to the first value column

# This cell replaces `gdp` with its own output. Running it a second time
# would treat the 3-field long records as wide rows and silently produce an
# empty list, so fail loudly instead.
if gdp and all(len(wide_row) <= GDP_META_COLS for wide_row in gdp):
    raise ValueError(
        "gdp has no value columns to reshape (already in long form?); "
        "re-run the cell that reads GDP.csv first"
    )

gdp = [
    [str(wide_row[1]), str(GDP_FIRST_YEAR + offset), str(value)]
    for wide_row in gdp
    for offset, value in enumerate(wide_row[GDP_META_COLS:])
]

In [10]:
import pandas as pd
# Wrap the long-form GDP records in a DataFrame. 'geography iso' and 'year'
# are the same column names used as merge keys for the LAP and P5V frames.
pd_gdp = pd.DataFrame(gdp, columns=['geography iso', 'year', 'GDPpc'])

In [11]:
# Remove pandas' display limits so no columns or rows are elided in output,
# then preview the first 50 rows of the GDP frame.
pd.options.display.max_columns = None
pd.options.display.max_rows = None
pd_gdp.head(n=50)

Unnamed: 0,geography iso,year,GDPpc
0,ABW,1960,
1,ABW,1961,
2,ABW,1962,
3,ABW,1963,
4,ABW,1964,
5,ABW,1965,
6,ABW,1966,
7,ABW,1967,
8,ABW,1968,
9,ABW,1969,


## Merge the Data

In [13]:
# Attach the P5V columns to each LAP record by country code and year.
# how='inner' is pandas' default, spelled out here: rows without a matching
# key on the other side are left out of the result.
df_lap_p5v = pd_lap.merge(pd_p5v, how='inner', on=['geography iso', 'year'])
df_lap_p5v.head(n=10)

Unnamed: 0,title,geography,geography iso,year,type,responses,document types,sectors,p5,cyear,polity2
0,Energy Sector Strategy 1387-1391 (2007/8-2012/3),Afghanistan,AFG,2008,executive,Mitigation,Strategy,Energy,0,7002008,
1,Rural Renewable Energy Policy (RREP),Afghanistan,AFG,2013,executive,Adaptation,Policy,Energy,0,7002013,
2,National Forestry Management Policy (NFMP),Afghanistan,AFG,2007,executive,Adaptation; Mitigation,Policy,Economy-wide,0,7002007,
3,Strategic National Action Plan for Disaster Ri...,Afghanistan,AFG,2011,executive,Adaptation; Disaster Risk Management,Plan,,0,7002011,
4,The Law On Regulating Forest Affairs 2011,Afghanistan,AFG,2011,legislative,Adaptation; Mitigation,Law; Act,LULUCF,0,7002011,
5,The National Environmental Action Plan (NEAP),Afghanistan,AFG,2009,executive,Adaptation,Plan,,0,7002009,
6,National Biodiversity Strategy and Action Plan,Afghanistan,AFG,2014,executive,Adaptation,Strategy,Environment; LULUCF,0,7002014,-1.0
7,Disaster management strategy (2014-2017),Afghanistan,AFG,2014,executive,Disaster Risk Management,Plan; Strategy,Disaster Risk Management (Drm),0,7002014,-1.0
8,National Comprehensive Agriculture Development...,Afghanistan,AFG,2016,executive,Adaptation,Programme,Agriculture; Energy; Environment; Residential ...,0,7002016,-1.0
9,Law on Disaster Response; Management; and Prep...,Afghanistan,AFG,2012,legislative,Adaptation; Disaster Risk Management,Law,LULUCF; Water,0,7002012,


In [14]:
# Add the GDPpc column to the LAP+P5V table by country code and year.
# how='inner' is pandas' default, spelled out here: rows without a matching
# key on the other side are left out of the result.
lap_p5v_gdp_narrow = df_lap_p5v.merge(pd_gdp, how='inner', on=['geography iso', 'year'])
lap_p5v_gdp_narrow.head(n=10)

Unnamed: 0,title,geography,geography iso,year,type,responses,document types,sectors,p5,cyear,polity2,GDPpc
0,Energy Sector Strategy 1387-1391 (2007/8-2012/3),Afghanistan,AFG,2008,executive,Mitigation,Strategy,Energy,0,7002008,,398.9711165
1,Rural Renewable Energy Policy (RREP),Afghanistan,AFG,2013,executive,Adaptation,Policy,Energy,0,7002013,,568.9645435
2,National Forestry Management Policy (NFMP),Afghanistan,AFG,2007,executive,Adaptation; Mitigation,Policy,Economy-wide,0,7002007,,392.7104656
3,Strategic National Action Plan for Disaster Ri...,Afghanistan,AFG,2011,executive,Adaptation; Disaster Risk Management,Plan,,0,7002011,,511.9985148
4,The Law On Regulating Forest Affairs 2011,Afghanistan,AFG,2011,legislative,Adaptation; Mitigation,Law; Act,LULUCF,0,7002011,,511.9985148
5,The National Environmental Action Plan (NEAP),Afghanistan,AFG,2009,executive,Adaptation,Plan,,0,7002009,,472.8422916
6,National Biodiversity Strategy and Action Plan,Afghanistan,AFG,2014,executive,Adaptation,Strategy,Environment; LULUCF,0,7002014,-1.0,565.1792733
7,Disaster management strategy (2014-2017),Afghanistan,AFG,2014,executive,Disaster Risk Management,Plan; Strategy,Disaster Risk Management (Drm),0,7002014,-1.0,565.1792733
8,National Comprehensive Agriculture Development...,Afghanistan,AFG,2016,executive,Adaptation,Programme,Agriculture; Energy; Environment; Residential ...,0,7002016,-1.0,552.9969077
9,Law on Disaster Response; Management; and Prep...,Afghanistan,AFG,2012,legislative,Adaptation; Disaster Risk Management,Law,LULUCF; Water,0,7002012,,557.9496921


In [15]:
# Write the merged table to disk; index=False keeps the DataFrame's row index
# out of the CSV.
lap_p5v_gdp_narrow.to_csv('lap_p5v_gdp_narrow.csv', index=False)