# JSON examples and exercise
****
+ get familiar with packages for dealing with JSON
+ study examples with JSON strings and files 
+ work on exercise to be completed and submitted 
****
+ reference: http://pandas.pydata.org/pandas-docs/stable/io.html#io-json-reader
+ data source: http://jsonstudio.com/resources/
****

In [3]:
import pandas as pd

## imports for Python, Pandas

In [6]:
import json
from pandas.io.json import json_normalize

## JSON example, with string

+ demonstrates creation of normalized dataframes (tables) from nested json string
+ source: http://pandas.pydata.org/pandas-docs/stable/io.html#normalization

In [4]:
# define json string
data = [{'state': 'Florida', 
         'shortname': 'FL',
         'info': {'governor': 'Rick Scott'},
         'counties': [{'name': 'Dade', 'population': 12345},
                      {'name': 'Broward', 'population': 40000},
                      {'name': 'Palm Beach', 'population': 60000}]},
        {'state': 'Ohio',
         'shortname': 'OH',
         'info': {'governor': 'John Kasich'},
         'counties': [{'name': 'Summit', 'population': 1234},
                      {'name': 'Cuyahoga', 'population': 1337}]}]

In [7]:
# use normalization to create tables from nested element
json_normalize(data, 'counties')

Unnamed: 0,name,population
0,Dade,12345
1,Broward,40000
2,Palm Beach,60000
3,Summit,1234
4,Cuyahoga,1337


In [8]:
# further populate tables created from nested element
json_normalize(data, 'counties', ['state', 'shortname', ['info', 'governor']])

Unnamed: 0,name,population,info.governor,state,shortname
0,Dade,12345,Rick Scott,Florida,FL
1,Broward,40000,Rick Scott,Florida,FL
2,Palm Beach,60000,Rick Scott,Florida,FL
3,Summit,1234,John Kasich,Ohio,OH
4,Cuyahoga,1337,John Kasich,Ohio,OH


****
## JSON example, with file

+ demonstrates reading in a json file as a string and as a table
+ uses small sample file containing data about projects funded by the World Bank 
+ data source: http://jsonstudio.com/resources/

In [9]:
# load json as string
json.load((open('data/world_bank_projects_less.json')))

[{u'_id': {u'$oid': u'52b213b38594d8a2be17c780'},
  u'approvalfy': 1999,
  u'board_approval_month': u'November',
  u'boardapprovaldate': u'2013-11-12T00:00:00Z',
  u'borrower': u'FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA',
  u'closingdate': u'2018-07-07T00:00:00Z',
  u'country_namecode': u'Federal Democratic Republic of Ethiopia!$!ET',
  u'countrycode': u'ET',
  u'countryname': u'Federal Democratic Republic of Ethiopia',
  u'countryshortname': u'Ethiopia',
  u'docty': u'Project Information Document,Indigenous Peoples Plan,Project Information Document',
  u'envassesmentcategorycode': u'C',
  u'grantamt': 0,
  u'ibrdcommamt': 0,
  u'id': u'P129828',
  u'idacommamt': 130000000,
  u'impagency': u'MINISTRY OF EDUCATION',
  u'lendinginstr': u'Investment Project Financing',
  u'lendinginstrtype': u'IN',
  u'lendprojectcost': 550000000,
  u'majorsector_percent': [{u'Name': u'Education', u'Percent': 46},
   {u'Name': u'Education', u'Percent': 26},
   {u'Name': u'Public Administration, Law, and Ju

In [10]:
# load as Pandas dataframe
sample_json_df = pd.read_json('data/world_bank_projects_less.json')
sample_json_df

Unnamed: 0,_id,approvalfy,board_approval_month,boardapprovaldate,borrower,closingdate,country_namecode,countrycode,countryname,countryshortname,...,sectorcode,source,status,supplementprojectflg,theme1,theme_namecode,themecode,totalamt,totalcommamt,url
0,{u'$oid': u'52b213b38594d8a2be17c780'},1999,November,2013-11-12T00:00:00Z,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,2018-07-07T00:00:00Z,Federal Democratic Republic of Ethiopia!$!ET,ET,Federal Democratic Republic of Ethiopia,Ethiopia,...,"ET,BS,ES,EP",IBRD,Active,N,"{u'Percent': 100, u'Name': u'Education for all'}","[{u'code': u'65', u'name': u'Education for all'}]",65,130000000,130000000,http://www.worldbank.org/projects/P129828/ethi...
1,{u'$oid': u'52b213b38594d8a2be17c781'},2015,November,2013-11-04T00:00:00Z,GOVERNMENT OF TUNISIA,,Republic of Tunisia!$!TN,TN,Republic of Tunisia,Tunisia,...,"BZ,BS",IBRD,Active,N,"{u'Percent': 30, u'Name': u'Other economic man...","[{u'code': u'24', u'name': u'Other economic ma...",5424,0,4700000,http://www.worldbank.org/projects/P144674?lang=en


****
## JSON exercise

Using data in file 'data/world_bank_projects.json' and the techniques demonstrated above,
1. Find the 10 countries with most projects
2. Find the top 10 major project themes (using column 'mjtheme_namecode')
3. In 2. above you will notice that some entries have only the code and the name is missing. Create a dataframe with the missing names filled in.

In [126]:
import json
import pandas as pd
import collections
from pandas.io.json import json_normalize
import numpy as np
from collections import Counter
from itertools import chain

In [127]:
pd.options.display.max_columns = None
pd.options.display.max_rows = None

In [128]:
# load json as string
json.load((open('data/world_bank_projects.json')))

[{'sector': [{'Name': 'Primary education'},
   {'Name': 'Secondary education'},
   {'Name': 'Public administration- Other social services'},
   {'Name': 'Tertiary education'}],
  'supplementprojectflg': 'N',
  'projectfinancialtype': 'IDA',
  'prodline': 'PE',
  'mjtheme': ['Human development'],
  'idacommamt': 130000000,
  'impagency': 'MINISTRY OF EDUCATION',
  'project_name': 'Ethiopia General Education Quality Improvement Project II',
  'mjthemecode': '8,11',
  'closingdate': '2018-07-07T00:00:00Z',
  'totalcommamt': 130000000,
  'id': 'P129828',
  'mjsector_namecode': [{'code': 'EX', 'name': 'Education'},
   {'code': 'EX', 'name': 'Education'},
   {'code': 'BX', 'name': 'Public Administration, Law, and Justice'},
   {'code': 'EX', 'name': 'Education'}],
  'docty': 'Project Information Document,Indigenous Peoples Plan,Project Information Document',
  'sector1': {'Percent': 46, 'Name': 'Primary education'},
  'lendinginstr': 'Investment Project Financing',
  'countrycode': 'ET',
  '

In [129]:
# load as Pandas dataframe
bank_df = pd.read_json('data/world_bank_projects.json')

In [130]:
bank_df

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,mjtheme_namecode,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,"[{'code': '8', 'name': 'Human development'}, {...",2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65.0,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'}
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,"[{'code': '1', 'name': 'Economic management'},...",2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424.0,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'}
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,"[{'code': '5', 'name': 'Trade and integration'...",2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547.0,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'}
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,"[{'code': '7', 'name': 'Social dev/gender/incl...",2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957.0,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'}
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,"[{'code': '5', 'name': 'Trade and integration'...",2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145.0,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'}
5,[{'Name': 'Other social services'}],Y,IDA,PE,[Social protection and risk management],10000000,,Additional Financing for Cash Transfers for Or...,66,,10000000,P146161,"[{'code': 'JX', 'name': 'Health and other soci...","Integrated Safeguards Data Sheet,Project Infor...","{'Percent': 100, 'Name': 'Other social services'}",Investment Project Financing,KE,,10000000,"[{'code': '6', 'name': 'Social protection and ...",2013-10-31T00:00:00Z,Kenya,,IBRD/IDA,L,Africa,Active,Republic of Kenya!$!KE,C,,2014,"[{'DocDate': '16-SEP-2013', 'EntityID': '09022...",66400000,IN,"{'Percent': 100, 'Name': 'Social safety nets'}",0,54.0,REPUBLIC OF KENYA,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '54', 'name': 'Social safety nets'}]",Republic of Kenya,http://www.worldbank.org/projects/P146161?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c785'}
6,[{'Name': 'Rural and Inter-Urban Roads and Hig...,N,IBRD,PE,"[Public sector governance, Financial and priva...",0,MINISTRY OF ROAD TRANSPORT AND HIGHWAYS,National Highways Interconnectivity Improvemen...,24,2019-06-30T00:00:00Z,500000000,P121185,"[{'code': 'TX', 'name': 'Transportation'}]","Project Appraisal Document,Procurement Plan,In...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Specific Investment Loan,IN,,500000000,"[{'code': '2', 'name': 'Public sector governan...",2013-10-29T00:00:00Z,India,,IBRD/IDA,L,South Asia,Active,Republic of India!$!IN,A,{'cdata': 'The development objective of the pr...,2014,"[{'DocDate': '02-OCT-2013', 'EntityID': '00035...",1146050000,IN,"{'Percent': 20, 'Name': 'Administrative and ci...",0,3925.0,GOVERNMENT OF INDIA,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",October,"[{'code': '25', 'name': 'Administrative and ci...",Republic of India,http://www.worldbank.org/projects/P121185/firs...,IBRD,Active,500000000,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c786'}
7,[{'Name': 'Other Renewable Energy'}],N,OTHER,GE,[Environment and natural resources management],0,NATIONAL ENERGY ADMINISTRATION,China Renewable Energy Scale-Up Program Phase II,118,,27280000,P127033,"[{'code': 'LX', 'name': 'Energy and mining'}]","Project Appraisal Document,Integrated Safeguar...","{'Percent': 100, 'Name': 'Other Renewable Ener...",Investment Project Financing,CN,,0,"[{'code': '11', 'name': 'Environment and natur...",2013-10-29T00:00:00Z,China,,Global Environment Project,L,East Asia and Pacific,Active,People's Republic of China!$!CN,C,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '18-SEP-2013', 'EntityID': '00045...",27280000,IN,"{'Percent': 100, 'Name': 'Climate change'}",27280000,81.0,PEOPLE'S REPUBLIC OF CHINA,LR,,"[{'Percent': 100, 'Name': 'Energy and mining'}]",October,"[{'code': '81', 'name': 'Climate change'}]",People's Republic of China,http://www.worldbank.org/projects/P127033/chin...,IBRD,Active,0,"[{'code': 'LR', 'name': 'Other Renewable Energ...",{'$oid': '52b213b38594d8a2be17c787'}
8,[{'Name': 'Rural and Inter-Urban Roads and Hig...,N,IDA,PE,[Rural development],160000000,"PUBLIC WORKS DEPARTMANT, RAJASTHAN",Rajasthan Road Sector Modernization Project,107,2018-12-31T00:00:00Z,160000000,P130164,"[{'code': 'TX', 'name': 'Transportation'}]","Project Appraisal Document,Integrated Safeguar...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Specific Investment Loan,IN,,160000000,"[{'code': '10', 'name': 'Rural development'}, ...",2013-10-29T00:00:00Z,India,,IBRD/IDA,L,South Asia,Active,Republic of India!$!IN,B,{'cdata': 'The development objective of the Ra...,2014,"[{'DocDate': '01-OCT-2013', 'EntityID': '00044...",227000000,IN,"{'Percent': 87, 'Name': 'Other rural developme...",0,79.0,THE GOVERNMENT OF INDIA,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",October,"[{'code': '79', 'name': 'Other rural developme...",Republic of India,http://www.worldbank.org/projects/P130164/raja...,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c788'}
9,[{'Name': 'General public administration secto...,N,IBRD,PE,"[Public sector governance, Public sector gover...",0,MINISTRY OF FINANCE,MA Accountability and Transparency DPL,222,2014-12-31T00:00:00Z,200000000,P130903,"[{'code': 'BX', 'name': 'Public Administration...","Program Document,Project Information Document,...","{'Percent': 34, 'Name': 'General public admini...",Development Policy Lending,MA,"{'Percent': 33, 'Name': 'Central government ad...",200000000,"[{'code': '2', 'name': 'Public sector governan...",2013-10-29T00:00:00Z,Morocco,,IBRD/IDA,L,Middle East and North Africa,Active,Kingdom of Morocco!$!MA,,{'cdata': 'The objective of this First Transpa...,2014,"[{'DocDate': '30-SEP-2013', 'EntityID': '00033...",200000000,AD,"{'Percent': 33, 'Name': 'Other accountability/...",0,273029.0,THE KINGDOM OF MOROCCO,"BM,BC,BZ","{'Percent': 33, 'Name': 'Public administration...","[{'Percent': 34, 'Name': 'Public Administratio...",October,"[{'code': '29', 'name': 'Other accountability/...",Kingdom of Morocco,http://www.worldbank.org/projects/P130903?lang=en,IBRD,Active,200000000,"[{'code': 'BZ', 'name': 'General public admini...",{'$oid': '52b213b38594d8a2be17c789'}


In [131]:
country = bank_df.groupby('countryname').size()

In [132]:
country_df = pd.DataFrame(country).reset_index()

In [133]:
country_df.head()

Unnamed: 0,countryname,0
0,Africa,11
1,Antigua and Barbuda,1
2,Arab Republic of Egypt,2
3,Argentine Republic,2
4,Bosnia and Herzegovina,1


In [134]:
country_df.columns=['CountryName','Count']

In [135]:
country_df.head()

Unnamed: 0,CountryName,Count
0,Africa,11
1,Antigua and Barbuda,1
2,Arab Republic of Egypt,2
3,Argentine Republic,2
4,Bosnia and Herzegovina,1


In [136]:
#The 10 countries with most projects
country_df.sort_values(by='Count', ascending=False, inplace=True)
country_df.set_index('CountryName').head(10)

Unnamed: 0_level_0,Count
CountryName,Unnamed: 1_level_1
People's Republic of China,19
Republic of Indonesia,19
Socialist Republic of Vietnam,17
Republic of India,16
Republic of Yemen,13
People's Republic of Bangladesh,12
Nepal,12
Kingdom of Morocco,12
Republic of Mozambique,11
Africa,11


In [137]:
bank_df.head()

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,mjtheme_namecode,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,"[{'code': '8', 'name': 'Human development'}, {...",2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'}
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,"[{'code': '1', 'name': 'Economic management'},...",2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'}
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,"[{'code': '5', 'name': 'Trade and integration'...",2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'}
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,"[{'code': '7', 'name': 'Social dev/gender/incl...",2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'}
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,"[{'code': '5', 'name': 'Trade and integration'...",2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'}


In [138]:
theme_df = pd.DataFrame(bank_df,columns=['mjthemecode','countryshortname'])

In [139]:
theme_df.columns = ['Code','Country']

In [140]:
theme_df.head()

Unnamed: 0,Code,Country
0,811,Ethiopia
1,16,Tunisia
2,52116,Tuvalu
3,77,"Yemen, Republic of"
4,54,Lesotho


In [141]:
new_theme_df = theme_df['Code'].str.split(',', expand=True)

In [142]:
new_theme_df.fillna(value=0, inplace=True)

In [143]:
new_theme_df.columns=['list1','list2','list3','list4','list5']

In [144]:
new_theme_df.head()

Unnamed: 0,list1,list2,list3,list4,list5
0,8,11,0,0,0
1,1,6,0,0,0
2,5,2,11,6,0
3,7,7,0,0,0
4,5,4,0,0,0


In [145]:
theme_list1=new_theme_df['list1'].tolist()
theme_list2=new_theme_df['list2'].tolist()
theme_list3=new_theme_df['list3'].tolist()
theme_list4=new_theme_df['list4'].tolist()
theme_list5=new_theme_df['list5'].tolist()

In [146]:
code_list = theme_list1 + theme_list2 + theme_list3 + theme_list4 + theme_list5

In [147]:
code_count = Counter(code_list)

In [148]:
code_count

Counter({'8': 210,
         '1': 38,
         '5': 77,
         '7': 130,
         '6': 168,
         '2': 199,
         '11': 250,
         '10': 216,
         '4': 146,
         '9': 50,
         '3': 15,
         0: 1001})

In [149]:
code_count_df = pd.DataFrame.from_dict(code_count, orient='index').reset_index()

In [150]:
#Count for each MJ Theme Code
code_count_df.columns = ['code','count']
code_count_df = code_count_df.apply(pd.to_numeric).sort_values(by=['code']).set_index('code')

In [151]:
code_count_df
unique_codes = code_count_df[1:]

In [152]:
project_names_df = pd.DataFrame(bank_df['mjtheme_namecode'])

In [153]:
project_names_df

Unnamed: 0,mjtheme_namecode
0,"[{'code': '8', 'name': 'Human development'}, {..."
1,"[{'code': '1', 'name': 'Economic management'},..."
2,"[{'code': '5', 'name': 'Trade and integration'..."
3,"[{'code': '7', 'name': 'Social dev/gender/incl..."
4,"[{'code': '5', 'name': 'Trade and integration'..."
5,"[{'code': '6', 'name': 'Social protection and ..."
6,"[{'code': '2', 'name': 'Public sector governan..."
7,"[{'code': '11', 'name': 'Environment and natur..."
8,"[{'code': '10', 'name': 'Rural development'}, ..."
9,"[{'code': '2', 'name': 'Public sector governan..."


In [154]:
project_names_dict = project_names_df['mjtheme_namecode'].to_dict()

In [155]:
project_names = project_names_df['mjtheme_namecode']
project_names_dict

{0: [{'code': '8', 'name': 'Human development'}, {'code': '11', 'name': ''}],
 1: [{'code': '1', 'name': 'Economic management'},
  {'code': '6', 'name': 'Social protection and risk management'}],
 2: [{'code': '5', 'name': 'Trade and integration'},
  {'code': '2', 'name': 'Public sector governance'},
  {'code': '11', 'name': 'Environment and natural resources management'},
  {'code': '6', 'name': 'Social protection and risk management'}],
 3: [{'code': '7', 'name': 'Social dev/gender/inclusion'},
  {'code': '7', 'name': 'Social dev/gender/inclusion'}],
 4: [{'code': '5', 'name': 'Trade and integration'},
  {'code': '4', 'name': 'Financial and private sector development'}],
 5: [{'code': '6', 'name': 'Social protection and risk management'},
  {'code': '6', 'name': ''}],
 6: [{'code': '2', 'name': 'Public sector governance'},
  {'code': '4', 'name': 'Financial and private sector development'}],
 7: [{'code': '11', 'name': 'Environment and natural resources management'},
  {'code': '8', 

In [156]:
project_names=list()
for i in range(0,499):
    for j in range(0,1):
        name = project_names_dict[i][j]
        project_names.append(name)

In [157]:
project_names

[{'code': '8', 'name': 'Human development'},
 {'code': '1', 'name': 'Economic management'},
 {'code': '5', 'name': 'Trade and integration'},
 {'code': '7', 'name': 'Social dev/gender/inclusion'},
 {'code': '5', 'name': 'Trade and integration'},
 {'code': '6', 'name': 'Social protection and risk management'},
 {'code': '2', 'name': 'Public sector governance'},
 {'code': '11', 'name': 'Environment and natural resources management'},
 {'code': '10', 'name': 'Rural development'},
 {'code': '2', 'name': 'Public sector governance'},
 {'code': '10', 'name': 'Rural development'},
 {'code': '10', 'name': 'Rural development'},
 {'code': '4', 'name': ''},
 {'code': '5', 'name': 'Trade and integration'},
 {'code': '6', 'name': 'Social protection and risk management'},
 {'code': '10', 'name': 'Rural development'},
 {'code': '10', 'name': 'Rural development'},
 {'code': '8', 'name': 'Human development'},
 {'code': '8', 'name': 'Human development'},
 {'code': '2', 'name': 'Public sector governance'},

In [158]:
project_name_code_df = pd.DataFrame(project_names)

In [159]:
project_name_code_df

Unnamed: 0,code,name
0,8,Human development
1,1,Economic management
2,5,Trade and integration
3,7,Social dev/gender/inclusion
4,5,Trade and integration
5,6,Social protection and risk management
6,2,Public sector governance
7,11,Environment and natural resources management
8,10,Rural development
9,2,Public sector governance


In [160]:
Theme_Name_Code_df = project_name_code_df.drop_duplicates()

In [161]:
Theme_Name_Code_df

Unnamed: 0,code,name
0,8,Human development
1,1,Economic management
2,5,Trade and integration
3,7,Social dev/gender/inclusion
5,6,Social protection and risk management
6,2,Public sector governance
7,11,Environment and natural resources management
8,10,Rural development
12,4,
21,9,Urban development


In [162]:
unique_code_names_df = Theme_Name_Code_df.replace(r'^\s*$', np.nan, regex=True).dropna()

In [163]:
unique_code_names_df = unique_code_names_df.apply(pd.to_numeric,errors='ignore').sort_values(by=['code'])

In [164]:
unique_code_names_df = unique_code_names_df.set_index('code')

In [165]:
unique_codes

Unnamed: 0_level_0,count
code,Unnamed: 1_level_1
1,38
2,199
3,15
4,146
5,77
6,168
7,130
8,210
9,50
10,216


In [166]:
unique_code_names_df['Count'] = pd.Series(unique_codes['count'])

In [167]:
#Top 10 major project themes
unique_code_names_df.sort_values(by=['Count'],ascending=False, inplace=True)
unique_code_names_df.head(10)

Unnamed: 0_level_0,name,Count
code,Unnamed: 1_level_1,Unnamed: 2_level_1
11,Environment and natural resources management,250
10,Rural development,216
8,Human development,210
2,Public sector governance,199
6,Social protection and risk management,168
4,Financial and private sector development,146
7,Social dev/gender/inclusion,130
5,Trade and integration,77
9,Urban development,50
1,Economic management,38


In [168]:
unique_code_names_df = unique_code_names_df.reset_index()

In [169]:
unique_code_names_df

Unnamed: 0,code,name,Count
0,11,Environment and natural resources management,250
1,10,Rural development,216
2,8,Human development,210
3,2,Public sector governance,199
4,6,Social protection and risk management,168
5,4,Financial and private sector development,146
6,7,Social dev/gender/inclusion,130
7,5,Trade and integration,77
8,9,Urban development,50
9,1,Economic management,38


In [186]:
# {code:10,name:'Rural development'}

unique_code_names_df['Theme']= '{code:'+unique_code_names_df['code'].astype(str)+',name:'+unique_code_names_df['name']+'}'

unique_code_names_df

Unnamed: 0,code,name,Count,Theme
0,11,Environment and natural resources management,250,"{code:11,name:Environment and natural resource..."
1,10,Rural development,216,"{code:10,name:Rural development}"
2,8,Human development,210,"{code:8,name:Human development}"
3,2,Public sector governance,199,"{code:2,name:Public sector governance}"
4,6,Social protection and risk management,168,"{code:6,name:Social protection and risk manage..."
5,4,Financial and private sector development,146,"{code:4,name:Financial and private sector deve..."
6,7,Social dev/gender/inclusion,130,"{code:7,name:Social dev/gender/inclusion}"
7,5,Trade and integration,77,"{code:5,name:Trade and integration}"
8,9,Urban development,50,"{code:9,name:Urban development}"
9,1,Economic management,38,"{code:1,name:Economic management}"


In [187]:
unique_code_names_df.set_index('code',inplace=True)
unique_code_names_df.loc[3]

name                   Rule of law
Count                           15
Theme    {code:3,name:Rule of law}
Name: 3, dtype: object

In [174]:
bank_df.head()

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,mjtheme_namecode,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,"[{'code': '8', 'name': 'Human development'}, {...",2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'}
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,"[{'code': '1', 'name': 'Economic management'},...",2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'}
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,"[{'code': '5', 'name': 'Trade and integration'...",2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'}
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,"[{'code': '7', 'name': 'Social dev/gender/incl...",2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'}
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,"[{'code': '5', 'name': 'Trade and integration'...",2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'}


In [188]:
theme_code_df = pd.DataFrame(bank_df['mjthemecode'])

In [190]:
theme_code_df['mjthemecode']=theme_code_df['mjthemecode'].astype(str)
theme_code_df.head

<bound method NDFrame.head of         mjthemecode
0              8,11
1               1,6
2          5,2,11,6
3               7,7
4               5,4
5               6,6
6               2,4
7              11,8
8              10,7
9             2,2,2
10             10,2
11        10,6,6,11
12                4
13          5,11,10
14            6,6,6
15          10,11,5
16             10,2
17              8,7
18        8,8,2,7,8
19            2,2,2
20              7,7
21              9,7
22              7,7
23              8,8
24       10,10,10,6
25         11,11,11
26          4,5,2,8
27         11,2,5,6
28          10,10,7
29             7,11
30              8,4
31      11,11,11,11
32             11,4
33            6,1,4
34          2,8,5,5
35           7,10,4
36            10,11
37              6,7
38    11,11,6,11,11
39              2,4
40       11,6,11,11
41              4,8
42              2,2
43              2,8
44             11,7
45             8,10
46         2,10,4,4
47        

In [191]:
import nltk, re
from nltk.tokenize import word_tokenize
from nltk.tokenize import RegexpTokenizer

In [192]:
#tokenizer=RegexpTokenizer(',', gaps=True)
#x='8,11'

#l=tokenizer.tokenize(x)

def mapper(code_list,unique_code_names_df):
    temp_code_list=[]
    for i in code_list:
        temp_code_list.append(unique_code_names_df.loc[int(i)]['Theme'])
    return temp_code_list 

def splitter(x,i2):
    l=tokenizer.tokenize(x)
    theme = mapper(l,i2)
    return theme


In [193]:
theme_code_df['New_Theme']=theme_code_df['mjthemecode'].apply(splitter, args = (unique_code_names_df,))

In [194]:
theme_code_df

Unnamed: 0,mjthemecode,New_Theme
0,811,"[{code:8,name:Human development}, {code:11,nam..."
1,16,"[{code:1,name:Economic management}, {code:6,na..."
2,52116,"[{code:5,name:Trade and integration}, {code:2,..."
3,77,"[{code:7,name:Social dev/gender/inclusion}, {c..."
4,54,"[{code:5,name:Trade and integration}, {code:4,..."
5,66,"[{code:6,name:Social protection and risk manag..."
6,24,"[{code:2,name:Public sector governance}, {code..."
7,118,"[{code:11,name:Environment and natural resourc..."
8,107,"[{code:10,name:Rural development}, {code:7,nam..."
9,222,"[{code:2,name:Public sector governance}, {code..."


In [195]:
bank_df.head()

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,mjtheme_namecode,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,"[{'code': '8', 'name': 'Human development'}, {...",2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'}
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,"[{'code': '1', 'name': 'Economic management'},...",2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'}
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,"[{'code': '5', 'name': 'Trade and integration'...",2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'}
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,"[{'code': '7', 'name': 'Social dev/gender/incl...",2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'}
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,"[{'code': '5', 'name': 'Trade and integration'...",2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'}


In [196]:
Updated_Bank_df = bank_df.drop(['mjtheme_namecode'],axis=1)

In [197]:
Updated_Bank_df.head()

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'}
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'}
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'}
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'}
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'}


In [199]:
Updated_Bank_df['mjtheme_namecode']=theme_code_df['New_Theme']

In [200]:
Updated_Bank_df.head()

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id,mjtheme_namecode
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'},"[{code:8,name:Human development}, {code:11,nam..."
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'},"[{code:1,name:Economic management}, {code:6,na..."
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'},"[{code:5,name:Trade and integration}, {code:2,..."
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'},"[{code:7,name:Social dev/gender/inclusion}, {c..."
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'},"[{code:5,name:Trade and integration}, {code:4,..."


In [201]:
#The 10 countries with most projects
country_df.sort_values(by='Count', ascending=False, inplace=True)
country_df.set_index('CountryName').head(10)

Unnamed: 0_level_0,Count
CountryName,Unnamed: 1_level_1
People's Republic of China,19
Republic of Indonesia,19
Socialist Republic of Vietnam,17
Republic of India,16
Republic of Yemen,13
People's Republic of Bangladesh,12
Nepal,12
Kingdom of Morocco,12
Republic of Mozambique,11
Africa,11


In [202]:
#Top 10 major project themes
unique_code_names_df.sort_values(by=['Count'],ascending=False, inplace=True)
unique_code_names_df.head(10)

Unnamed: 0_level_0,name,Count,Theme
code,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
11,Environment and natural resources management,250,"{code:11,name:Environment and natural resource..."
10,Rural development,216,"{code:10,name:Rural development}"
8,Human development,210,"{code:8,name:Human development}"
2,Public sector governance,199,"{code:2,name:Public sector governance}"
6,Social protection and risk management,168,"{code:6,name:Social protection and risk manage..."
4,Financial and private sector development,146,"{code:4,name:Financial and private sector deve..."
7,Social dev/gender/inclusion,130,"{code:7,name:Social dev/gender/inclusion}"
5,Trade and integration,77,"{code:5,name:Trade and integration}"
9,Urban development,50,"{code:9,name:Urban development}"
1,Economic management,38,"{code:1,name:Economic management}"


In [204]:
#Create a dataframe with the missing names filled in.
Updated_Bank_df['mjtheme_namecode']

0      [{code:8,name:Human development}, {code:11,nam...
1      [{code:1,name:Economic management}, {code:6,na...
2      [{code:5,name:Trade and integration}, {code:2,...
3      [{code:7,name:Social dev/gender/inclusion}, {c...
4      [{code:5,name:Trade and integration}, {code:4,...
5      [{code:6,name:Social protection and risk manag...
6      [{code:2,name:Public sector governance}, {code...
7      [{code:11,name:Environment and natural resourc...
8      [{code:10,name:Rural development}, {code:7,nam...
9      [{code:2,name:Public sector governance}, {code...
10     [{code:10,name:Rural development}, {code:2,nam...
11     [{code:10,name:Rural development}, {code:6,nam...
12     [{code:4,name:Financial and private sector dev...
13     [{code:5,name:Trade and integration}, {code:11...
14     [{code:6,name:Social protection and risk manag...
15     [{code:10,name:Rural development}, {code:11,na...
16     [{code:10,name:Rural development}, {code:2,nam...
17     [{code:8,name:Human deve

In [205]:
Updated_Bank_df.head()

Unnamed: 0,sector,supplementprojectflg,projectfinancialtype,prodline,mjtheme,idacommamt,impagency,project_name,mjthemecode,closingdate,totalcommamt,id,mjsector_namecode,docty,sector1,lendinginstr,countrycode,sector2,totalamt,boardapprovaldate,countryshortname,sector4,prodlinetext,productlinetype,regionname,status,country_namecode,envassesmentcategorycode,project_abstract,approvalfy,projectdocs,lendprojectcost,lendinginstrtype,theme1,grantamt,themecode,borrower,sectorcode,sector3,majorsector_percent,board_approval_month,theme_namecode,countryname,url,source,projectstatusdisplay,ibrdcommamt,sector_namecode,_id,mjtheme_namecode
0,"[{'Name': 'Primary education'}, {'Name': 'Seco...",N,IDA,PE,[Human development],130000000,MINISTRY OF EDUCATION,Ethiopia General Education Quality Improvement...,811,2018-07-07T00:00:00Z,130000000,P129828,"[{'code': 'EX', 'name': 'Education'}, {'code':...","Project Information Document,Indigenous People...","{'Percent': 46, 'Name': 'Primary education'}",Investment Project Financing,ET,"{'Percent': 26, 'Name': 'Secondary education'}",130000000,2013-11-12T00:00:00Z,Ethiopia,"{'Percent': 12, 'Name': 'Tertiary education'}",IBRD/IDA,L,Africa,Active,Federal Democratic Republic of Ethiopia!$!ET,C,{'cdata': 'The development objective of the Se...,1999,"[{'DocDate': '28-AUG-2013', 'EntityID': '09022...",550000000,IN,"{'Percent': 100, 'Name': 'Education for all'}",0,65,FEDERAL DEMOCRATIC REPUBLIC OF ETHIOPIA,"ET,BS,ES,EP","{'Percent': 16, 'Name': 'Public administration...","[{'Percent': 46, 'Name': 'Education'}, {'Perce...",November,"[{'code': '65', 'name': 'Education for all'}]",Federal Democratic Republic of Ethiopia,http://www.worldbank.org/projects/P129828/ethi...,IBRD,Active,0,"[{'code': 'EP', 'name': 'Primary education'}, ...",{'$oid': '52b213b38594d8a2be17c780'},"[{code:8,name:Human development}, {code:11,nam..."
1,[{'Name': 'Public administration- Other social...,N,OTHER,RE,"[Economic management, Social protection and ri...",0,MINISTRY OF FINANCE,TN: DTF Social Protection Reforms Support,16,,4700000,P144674,"[{'code': 'BX', 'name': 'Public Administration...","Project Information Document,Integrated Safegu...","{'Percent': 70, 'Name': 'Public administration...",Specific Investment Loan,TN,"{'Percent': 30, 'Name': 'General public admini...",0,2013-11-04T00:00:00Z,Tunisia,,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Tunisia!$!TN,C,,2015,"[{'DocDate': '29-MAR-2013', 'EntityID': '00033...",5700000,IN,"{'Percent': 30, 'Name': 'Other economic manage...",4700000,5424,GOVERNMENT OF TUNISIA,"BZ,BS",,"[{'Percent': 70, 'Name': 'Public Administratio...",November,"[{'code': '24', 'name': 'Other economic manage...",Republic of Tunisia,http://www.worldbank.org/projects/P144674?lang=en,IBRD,Active,0,"[{'code': 'BS', 'name': 'Public administration...",{'$oid': '52b213b38594d8a2be17c781'},"[{code:1,name:Economic management}, {code:6,na..."
2,[{'Name': 'Rural and Inter-Urban Roads and Hig...,Y,IDA,PE,"[Trade and integration, Public sector governan...",6060000,MINISTRY OF TRANSPORT AND COMMUNICATIONS,Tuvalu Aviation Investment Project - Additiona...,52116,,6060000,P145310,"[{'code': 'TX', 'name': 'Transportation'}]","Resettlement Plan,Environmental Assessment,Int...","{'Percent': 100, 'Name': 'Rural and Inter-Urba...",Investment Project Financing,TV,,6060000,2013-11-01T00:00:00Z,Tuvalu,,IBRD/IDA,L,East Asia and Pacific,Active,Tuvalu!$!TV,B,,2014,"[{'DocDate': '21-OCT-2013', 'EntityID': '00033...",6060000,IN,"{'Percent': 46, 'Name': 'Regional integration'}",0,52812547,MINISTRY OF FINANCE AND ECONOMIC DEVEL,TI,,"[{'Percent': 100, 'Name': 'Transportation'}]",November,"[{'code': '47', 'name': 'Regional integration'...",Tuvalu,http://www.worldbank.org/projects/P145310?lang=en,IBRD,Active,0,"[{'code': 'TI', 'name': 'Rural and Inter-Urban...",{'$oid': '52b213b38594d8a2be17c782'},"[{code:5,name:Trade and integration}, {code:2,..."
3,[{'Name': 'Other social services'}],N,OTHER,RE,"[Social dev/gender/inclusion, Social dev/gende...",0,LABOR INTENSIVE PUBLIC WORKS PROJECT PMU,Gov't and Civil Society Organization Partnership,77,,1500000,P144665,"[{'code': 'JX', 'name': 'Health and other soci...","Procurement Plan,Project Information Document,...","{'Percent': 100, 'Name': 'Other social services'}",Technical Assistance Loan,RY,,0,2013-10-31T00:00:00Z,"Yemen, Republic of",,Recipient Executed Activities,L,Middle East and North Africa,Active,Republic of Yemen!$!RY,C,,2014,"[{'DocDate': '15-MAY-2013', 'EntityID': '00035...",1500000,IN,"{'Percent': 50, 'Name': 'Participation and civ...",1500000,5957,MIN. OF PLANNING AND INT'L COOPERATION,JB,,"[{'Percent': 100, 'Name': 'Health and other so...",October,"[{'code': '57', 'name': 'Participation and civ...",Republic of Yemen,http://www.worldbank.org/projects/P144665?lang=en,IBRD,Active,0,"[{'code': 'JB', 'name': 'Other social services'}]",{'$oid': '52b213b38594d8a2be17c783'},"[{code:7,name:Social dev/gender/inclusion}, {c..."
4,[{'Name': 'General industry and trade sector'}...,N,IDA,PE,"[Trade and integration, Financial and private ...",13100000,MINISTRY OF TRADE AND INDUSTRY,Second Private Sector Competitiveness and Econ...,54,2019-04-30T00:00:00Z,13100000,P144933,"[{'code': 'YX', 'name': 'Industry and trade'},...","Project Information Document,Integrated Safegu...","{'Percent': 50, 'Name': 'General industry and ...",Investment Project Financing,LS,"{'Percent': 40, 'Name': 'Other industry'}",13100000,2013-10-31T00:00:00Z,Lesotho,,IBRD/IDA,L,Africa,Active,Kingdom of Lesotho!$!LS,B,{'cdata': 'The development objective of the Se...,2014,"[{'DocDate': '06-SEP-2013', 'EntityID': '09022...",15000000,IN,"{'Percent': 30, 'Name': 'Export development an...",0,4145,MINISTRY OF FINANCE,"FH,YW,YZ","{'Percent': 10, 'Name': 'SME Finance'}","[{'Percent': 50, 'Name': 'Industry and trade'}...",October,"[{'code': '45', 'name': 'Export development an...",Kingdom of Lesotho,http://www.worldbank.org/projects/P144933/seco...,IBRD,Active,0,"[{'code': 'YZ', 'name': 'General industry and ...",{'$oid': '52b213b38594d8a2be17c784'},"[{code:5,name:Trade and integration}, {code:4,..."
