## Data Sources

World Bank DataBank, World Development Indicators: https://databank.worldbank.org/data/reports.aspx?source=world-development-indicators#

StatisticsTimes, countries by continent: http://statisticstimes.com/geography/countries-by-continents.php

## Imports

In [1]:
import pandas as pd

In [2]:
import numpy as np

## Cleaning Data

In [3]:
# First of three CSV parts that are concatenated below.
# NOTE(review): presumably an export from the World Bank source listed under
# "Data Sources" — confirm provenance and download date.
data = pd.read_csv('World_Data.csv')

In [4]:
# Second CSV part; combined with the other two parts in the concat cell below.
data2 = pd.read_csv('World_Data_2.csv')

In [5]:
# Third CSV part; combined with the other two parts in the concat cell below.
data3 = pd.read_csv('World_Data_3.csv')

In [6]:
# Stack the three partial frames row-wise into one; ignore_index replaces each
# part's own row labels with a single fresh 0..n-1 index.
# NOTE(review): this rebinds `data`, so re-running the cell appends data2 and
# data3 a second time — restart and run from the top instead.
data = pd.concat(objs=[data, data2, data3], axis=0, ignore_index=True)

In [7]:
# Preview the first rows of the combined frame (one row per country/series,
# one column per year).
data.head()

Unnamed: 0,Country Name,Country Code,Series Name,Series Code,1980 [YR1980],1981 [YR1981],1982 [YR1982],1983 [YR1983],1984 [YR1984],1985 [YR1985],...,2009 [YR2009],2010 [YR2010],2011 [YR2011],2012 [YR2012],2013 [YR2013],2014 [YR2014],2015 [YR2015],2016 [YR2016],2017 [YR2017],2018 [YR2018]
0,Afghanistan,AFG,Access to electricity (% of population),EG.ELC.ACCS.ZS,..,..,..,..,..,..,...,44.8548851013184,42.7,43.2220189082037,69.1,67.2595520019531,89.5,71.5,84.1371383666992,..,..
1,Afghanistan,AFG,"Children out of school, primary",SE.PRM.UNER,..,..,..,..,..,..,...,..,..,..,..,..,..,..,..,..,..
2,Afghanistan,AFG,"Contraceptive prevalence, modern methods (% of...",SP.DYN.CONM.ZS,..,..,..,..,..,..,...,..,19.9,20.3,13.8,..,..,19.8,..,..,..
3,Afghanistan,AFG,"Contraceptive prevalence, any methods (% of wo...",SP.DYN.CONU.ZS,..,..,..,..,..,..,...,..,21.8,21.2,..,..,..,22.5,..,..,..
4,Afghanistan,AFG,"Maternal mortality ratio (national estimate, p...",SH.STA.MMRT.NE,..,..,..,..,..,..,...,..,330,..,..,..,..,1291,..,..,..


In [8]:
# (rows, columns) of the combined frame.
data.shape

(14999, 43)

In [9]:
# Distinct values of 'Country Name', to see which entities the data covers.
data['Country Name'].unique()

array(['Afghanistan', 'Albania', 'Algeria', 'American Samoa', 'Andorra',
       'Angola', 'Antigua and Barbuda', 'Argentina', 'Armenia', 'Aruba',
       'Australia', 'Austria', 'Azerbaijan', 'Bahamas, The', 'Bahrain',
       'Bangladesh', 'Barbados', 'Belarus', 'Belgium', 'Belize', 'Benin',
       'Bermuda', 'Bhutan', 'Bolivia', 'Bosnia and Herzegovina',
       'Botswana', 'Brazil', 'British Virgin Islands',
       'Brunei Darussalam', 'Bulgaria', 'Burkina Faso', 'Burundi',
       'Cabo Verde', 'Cambodia', 'Cameroon', 'Canada', 'Cayman Islands',
       'Central African Republic', 'Chad', 'Channel Islands', 'Chile',
       'China', 'Colombia', 'Comoros', 'Congo, Dem. Rep.', 'Congo, Rep.',
       'Costa Rica', "Cote d'Ivoire", 'Croatia', 'Cuba', 'Curacao',
       'Cyprus', 'Czech Republic', 'Denmark', 'Djibouti', 'Dominica',
       'Dominican Republic', 'Ecuador', 'Egypt, Arab Rep.', 'El Salvador',
       'Equatorial Guinea', 'Eritrea', 'Estonia', 'Eswatini', 'Ethiopia',
       'Faroe Is

In [10]:
# Reshape wide -> long. The two code columns are discarded, country and series
# names stay as identifiers, and every remaining column header becomes an entry
# in 'Year' with its cell stored under melt's default 'value' column.
df = (
    data
    .drop(columns=['Series Code', 'Country Code'])
    .melt(id_vars=['Country Name', 'Series Name'], var_name='Year')
)

In [12]:
# Keep only the leading token of each melted header ("1980 [YR1980]" -> 1980)
# and store it as an integer.
# Casting to str first makes the cell safe to re-run: an already-converted 1980
# round-trips through "1980" instead of raising AttributeError on int.split.
df['Year'] = df['Year'].astype(str).str.split().str[0].astype('int64')

In [13]:
# The literal string '..' stands in for a missing observation. Blank those
# cells out (mask -> NaN) and cast everything else to float.
df['value'] = df['value'].mask(df['value'] == '..').astype(float)

In [27]:
# Preview the long-format frame: Country Name, Series Name, Year, value.
df.head()

Unnamed: 0,Country Name,Series Name,Year,value
0,Afghanistan,Access to electricity (% of population),1980,
1,Afghanistan,"Children out of school, primary",1980,
2,Afghanistan,"Contraceptive prevalence, modern methods (% of...",1980,
3,Afghanistan,"Contraceptive prevalence, any methods (% of wo...",1980,
4,Afghanistan,"Maternal mortality ratio (national estimate, p...",1980,


In [14]:
# Spread the long table back out so that each 'Series Name' becomes its own
# column, with one row per (Country Name, Year) pair.
# NOTE(review): pivot_table aggregates with its default function (mean) when a
# country/year/series combination occurs more than once — confirm there are no
# duplicate rows across the three input files.
pivoted = df.pivot_table(
    values='value',
    index=['Country Name', 'Year'],
    columns='Series Name',
)

In [15]:
# Keep only the country-years that have a modeled maternal mortality ratio (MMR);
# rows where it is missing are discarded. The copy gives an independent frame
# that later cells can modify freely.
mortality = pivoted.dropna(
    subset=['Maternal mortality ratio (modeled estimate, per 100,000 live births)']
).copy()

In [16]:
# Coverage check: per year, how many rows have a non-null value for each
# candidate feature ('Year' is an index level at this point).
mortality.groupby(level='Year').count()

Series Name,Access to electricity (% of population),"Adjusted net enrollment rate, primary (% of primary school age children)","Adjusted net enrollment rate, primary, female (% of primary school age children)","Adjusted net enrollment rate, primary, male (% of primary school age children)","Adolescent fertility rate (births per 1,000 women ages 15-19)",Adults (ages 15+) and children (ages 0-14) newly infected with HIV,Age dependency ratio (% of working-age population),"Age dependency ratio, old (% of working-age population)","Age dependency ratio, young (% of working-age population)","Automated teller machines (ATMs) (per 100,000 adults)",...,"Persistence to last grade of primary, total (% of cohort)","Physicians (per 1,000 people)",Pregnant women receiving prenatal care (%),"Prevalence of HIV, total (% of population ages 15-49)","Primary completion rate, total (% of relevant age group)",Progression to secondary school (%),"Pupil-teacher ratio, primary","Pupil-teacher ratio, secondary",Women who were first married by age 15 (% of women ages 20-24),Women who were first married by age 18 (% of women ages 20-24)
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
1990,177,64,50,50,183,128,183,183,183,0,...,53,135,9,136,73,42,105,68,5,5
1991,177,62,51,51,183,128,183,183,183,0,...,67,87,10,136,77,52,116,77,4,4
1992,177,64,53,53,183,128,182,182,182,0,...,60,87,21,136,83,47,114,70,11,11
1993,177,63,52,52,183,128,182,182,182,0,...,63,110,19,136,79,51,113,84,7,7
1994,177,76,61,61,183,128,182,182,182,0,...,61,84,11,136,87,40,120,84,5,6
1995,177,71,57,57,183,128,183,183,183,0,...,63,116,19,136,83,46,110,76,8,8
1996,178,73,59,59,183,128,183,183,183,0,...,53,100,19,136,79,40,105,67,10,10
1997,178,61,52,52,183,128,183,183,183,0,...,38,106,26,136,68,19,91,51,10,10
1998,178,66,55,55,183,128,183,183,183,0,...,66,90,26,136,65,58,111,55,10,10
1999,178,115,102,102,183,128,183,183,183,0,...,97,85,25,136,119,92,140,102,9,11


In [17]:
#checking correlation with target
# corr() returns the full pairwise matrix across all columns; the target's
# correlations are the row/column labelled
# 'Maternal mortality ratio (modeled estimate, per 100,000 live births)'.
mortality.corr()

Series Name,Access to electricity (% of population),"Adjusted net enrollment rate, primary (% of primary school age children)","Adjusted net enrollment rate, primary, female (% of primary school age children)","Adjusted net enrollment rate, primary, male (% of primary school age children)","Adolescent fertility rate (births per 1,000 women ages 15-19)",Adults (ages 15+) and children (ages 0-14) newly infected with HIV,Age dependency ratio (% of working-age population),"Age dependency ratio, old (% of working-age population)","Age dependency ratio, young (% of working-age population)","Automated teller machines (ATMs) (per 100,000 adults)",...,"Persistence to last grade of primary, total (% of cohort)","Physicians (per 1,000 people)",Pregnant women receiving prenatal care (%),"Prevalence of HIV, total (% of population ages 15-49)","Primary completion rate, total (% of relevant age group)",Progression to secondary school (%),"Pupil-teacher ratio, primary","Pupil-teacher ratio, secondary",Women who were first married by age 15 (% of women ages 20-24),Women who were first married by age 18 (% of women ages 20-24)
Series Name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Access to electricity (% of population),1.000000,0.734260,0.746298,0.738435,-0.728398,-0.212927,-0.797122,0.561715,-0.806531,0.511769,...,0.821210,0.662345,0.460341,-0.410307,0.795534,0.680855,-0.824782,-0.654061,-0.469166,-0.661178
"Adjusted net enrollment rate, primary (% of primary school age children)",0.734260,1.000000,0.991979,0.989154,-0.649855,-0.138760,-0.679545,0.433661,-0.679742,0.427251,...,0.591254,0.489749,0.550305,-0.190179,0.871612,0.551821,-0.640728,-0.525818,-0.652806,-0.631142
"Adjusted net enrollment rate, primary, female (% of primary school age children)",0.746298,0.991979,1.000000,0.962721,-0.658723,-0.125259,-0.707884,0.451006,-0.706716,0.452835,...,0.599201,0.514690,0.597424,-0.147185,0.885798,0.583327,-0.661539,-0.546107,-0.661120,-0.637094
"Adjusted net enrollment rate, primary, male (% of primary school age children)",0.738435,0.989154,0.962721,1.000000,-0.632823,-0.130227,-0.678414,0.447343,-0.682123,0.439215,...,0.575339,0.504879,0.493449,-0.207987,0.845254,0.548407,-0.619742,-0.521158,-0.607015,-0.582175
"Adolescent fertility rate (births per 1,000 women ages 15-19)",-0.728398,-0.649855,-0.658723,-0.632823,1.000000,0.210501,0.798149,-0.541482,0.802340,-0.513768,...,-0.743806,-0.575692,-0.421292,0.299345,-0.720821,-0.628592,0.737550,0.591962,0.684574,0.845927
Adults (ages 15+) and children (ages 0-14) newly infected with HIV,-0.212927,-0.138760,-0.125259,-0.130227,0.210501,1.000000,0.187959,-0.190983,0.204385,-0.089305,...,-0.271654,-0.243056,-0.041920,0.404001,-0.162017,-0.230789,0.224479,0.273708,0.033648,0.124463
Age dependency ratio (% of working-age population),-0.797122,-0.679545,-0.707884,-0.678414,0.798149,0.187959,1.000000,-0.561105,0.971871,-0.528154,...,-0.763005,-0.607551,-0.516448,0.312607,-0.739626,-0.642674,0.778625,0.612577,0.430649,0.661161
"Age dependency ratio, old (% of working-age population)",0.561715,0.433661,0.451006,0.447343,-0.541482,-0.190983,-0.561105,1.000000,-0.740267,0.646894,...,0.548018,0.727174,0.339329,-0.279779,0.429973,0.423960,-0.568129,-0.551957,-0.279280,-0.421536
"Age dependency ratio, young (% of working-age population)",-0.806531,-0.679742,-0.706716,-0.682123,0.802340,0.204385,0.971871,-0.740267,1.000000,-0.640868,...,-0.775060,-0.716129,-0.523556,0.330038,-0.725426,-0.649331,0.798724,0.658023,0.430670,0.656399
"Automated teller machines (ATMs) (per 100,000 adults)",0.511769,0.427251,0.452835,0.439215,-0.513768,-0.089305,-0.528154,0.646894,-0.640868,1.000000,...,0.497319,0.543822,0.417107,-0.209705,0.446038,0.424620,-0.520985,-0.464773,-0.388298,-0.432160


In [18]:
# Prune the candidate set: per the author's intent, these are duplicate features
# or features that were not very correlated with the target.
# NOTE(review): the list also contains
# 'Maternal mortality ratio (modeled estimate, per 100,000 live births)' — the
# column used to filter rows when `mortality` was built — so the target itself
# is absent from `mortality` after this cell. Confirm that this is intended.
mortality = mortality.drop(columns=[
    'Contraceptive prevalence, modern methods (% of women ages 15-49)',
    'Lower secondary completion rate, female (% of relevant age group)',
    'Lower secondary completion rate, male (% of relevant age group)',
    'Adjusted net enrollment rate, primary, female (% of primary school age children)',
    'Adjusted net enrollment rate, primary, male (% of primary school age children)',
    'Births attended by skilled health staff (% of total)',
    'Children out of school, primary, female',
    'Children out of school, primary, male',
    'Maternal mortality ratio (national estimate, per 100,000 live births)',
    'Persistence to grade 5, total (% of cohort)',
    "Educational attainment, at least Bachelor's or equivalent, population 25+, total (%) (cumulative)",
    'Educational attainment, at least completed lower secondary, population 25+, total (%) (cumulative)',
    'Educational attainment, at least completed post-secondary, population 25+, total (%) (cumulative)',
    'Educational attainment, at least completed primary, population 25+ years, total (%) (cumulative)',
    'Educational attainment, at least completed short-cycle tertiary, population 25+, total (%) (cumulative)',
    'Educational attainment, at least completed upper secondary, population 25+, total (%) (cumulative)',
    "Educational attainment, at least Master's or equivalent, population 25+, total (%) (cumulative)",
    'Educational attainment, Doctoral or equivalent, population 25+, total (%) (cumulative)',
    'Immunization, DPT (% of children ages 12-23 months)',
    'Immunization, HepB3 (% of one-year-old children)',
    'Lifetime risk of maternal death (%)',
    'Literacy rate, youth total (% of people ages 15-24)',
    'Age dependency ratio (% of working-age population)',
    'Age dependency ratio, old (% of working-age population)',
    'Adults (ages 15+) and children (ages 0-14) newly infected with HIV',
    'Children (0-14) living with HIV',
    'Children (ages 0-14) newly infected with HIV',
    'Children out of school, primary',
    'Community health workers (per 1,000 people)',
    'Prevalence of HIV, total (% of population ages 15-49)',
    'Access to electricity (% of population)',
    'Adolescent fertility rate (births per 1,000 women ages 15-19)',
    'Automated teller machines (ATMs) (per 100,000 adults)',
    'Compulsory education, duration (years)',
    'Consumption of iodized salt (% of households)',
    'Contraceptive prevalence, any methods (% of women ages 15-49)',
    'Exclusive breastfeeding (% of children under 6 months)',
    'GDP per capita (constant 2010 US$)',
    'Government expenditure on education, total (% of GDP)',
    'Immunization, measles (% of children ages 12-23 months)',
    'Individuals using the Internet (% of population)',
    'Literacy rate, adult total (% of people ages 15 and above)',
    'Low-birthweight babies (% of births)',
    'Maternal mortality ratio (modeled estimate, per 100,000 live births)',
    'Mobile cellular subscriptions (per 100 people)',
    'Physicians (per 1,000 people)',
    'Pupil-teacher ratio, primary',
])


In [19]:
# Re-check per-year non-null counts for the columns that remain.
mortality.groupby(level='Year').count()

Series Name,"Adjusted net enrollment rate, primary (% of primary school age children)","Age dependency ratio, young (% of working-age population)","Average working hours of children, working only, ages 7-14 (hours per week)","Children in employment, total (% of children ages 7-14)",Electric power consumption (kWh per capita),"Employment to population ratio, 15+, total (%) (modeled ILO estimate)",Female genital mutilation prevalence (%),GDP (constant 2010 US$),GDP growth (annual %),"Life expectancy at birth, total (years)",...,People using safely managed drinking water services (% of population),People using safely managed sanitation services (% of population),People with basic handwashing facilities including soap and water (% of population),"Persistence to last grade of primary, total (% of cohort)",Pregnant women receiving prenatal care (%),"Primary completion rate, total (% of relevant age group)",Progression to secondary school (%),"Pupil-teacher ratio, secondary",Women who were first married by age 15 (% of women ages 20-24),Women who were first married by age 18 (% of women ages 20-24)
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
1990,64,183,0,0,131,0,1,155,147,182,...,0,0,0,53,9,73,42,68,5,5
1991,62,183,0,0,132,180,0,156,156,183,...,0,0,0,67,10,77,52,77,4,4
1992,64,182,0,0,132,180,0,159,157,182,...,0,0,0,60,21,83,47,70,11,11
1993,63,182,0,0,132,180,0,160,160,182,...,0,0,0,63,19,79,51,84,7,7
1994,76,182,0,1,132,180,0,162,161,182,...,0,0,0,61,11,87,40,84,5,6
1995,71,183,0,0,134,180,3,170,163,182,...,0,0,0,63,19,83,46,76,8,8
1996,73,183,0,2,134,180,2,171,171,182,...,0,0,0,53,19,79,40,67,10,10
1997,61,183,0,0,134,180,1,172,172,183,...,0,0,0,38,26,68,19,51,10,10
1998,66,183,0,1,134,180,2,172,173,182,...,0,0,0,66,26,65,58,55,10,10
1999,115,183,2,10,134,180,3,173,173,182,...,0,0,0,97,25,119,92,102,9,11


In [20]:
# Remove indicators judged to have too few non-null observations to be usable.
mortality = mortality.drop(columns=[
    'Average working hours of children, working only, ages 7-14 (hours per week)',
    'Children in employment, total (% of children ages 7-14)',
    'Pregnant women receiving prenatal care (%)',
    'Women who were first married by age 15 (% of women ages 20-24)',
    'Women who were first married by age 18 (% of women ages 20-24)',
])


In [21]:
# Pairwise correlations among the remaining columns.
# NOTE(review): the modeled maternal mortality ratio was in the earlier drop
# list, so this matrix no longer includes the target.
mortality.corr()

Series Name,"Adjusted net enrollment rate, primary (% of primary school age children)","Age dependency ratio, young (% of working-age population)",Electric power consumption (kWh per capita),"Employment to population ratio, 15+, total (%) (modeled ILO estimate)",Female genital mutilation prevalence (%),GDP (constant 2010 US$),GDP growth (annual %),"Life expectancy at birth, total (years)","Lower secondary completion rate, total (% of relevant age group)","Nurses and midwives (per 1,000 people)",People using safely managed drinking water services (% of population),People using safely managed sanitation services (% of population),People with basic handwashing facilities including soap and water (% of population),"Persistence to last grade of primary, total (% of cohort)","Primary completion rate, total (% of relevant age group)",Progression to secondary school (%),"Pupil-teacher ratio, secondary"
Series Name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1
"Adjusted net enrollment rate, primary (% of primary school age children)",1.0,-0.679742,0.320707,-0.24074,-0.249797,0.153716,-0.053219,0.735921,0.721093,0.398881,0.632013,0.425389,0.652372,0.591254,0.871612,0.551821,-0.525818
"Age dependency ratio, young (% of working-age population)",-0.679742,1.0,-0.502247,0.187004,-0.216811,-0.246185,0.068791,-0.824096,-0.813774,-0.601862,-0.80235,-0.596622,-0.859747,-0.77506,-0.725426,-0.649331,0.658023
Electric power consumption (kWh per capita),0.320707,-0.502247,1.0,0.099821,0.475233,0.229847,-0.065702,0.521309,0.440282,0.631227,0.488839,0.476326,0.698462,0.392579,0.319908,0.323963,-0.44775
"Employment to population ratio, 15+, total (%) (modeled ILO estimate)",-0.24074,0.187004,0.099821,1.0,-0.386459,0.011589,0.041794,-0.257005,-0.287535,-0.036721,-0.332105,0.217176,-0.367579,-0.42273,-0.319116,-0.296319,0.297786
Female genital mutilation prevalence (%),-0.249797,-0.216811,0.475233,-0.386459,1.0,0.015224,-0.147607,0.041759,0.08317,-0.286366,-0.031471,0.81475,0.360264,0.552796,-0.225674,0.187141,0.232807
GDP (constant 2010 US$),0.153716,-0.246185,0.229847,0.011589,0.015224,1.0,-0.032406,0.233178,0.225791,0.190751,0.202528,0.208763,0.223808,0.215729,0.194479,0.169983,-0.1126
GDP growth (annual %),-0.053219,0.068791,-0.065702,0.041794,-0.147607,-0.032406,1.0,-0.046631,-0.105958,-0.198248,-0.332587,-0.081316,-0.086485,-0.105821,-0.063892,-0.062502,0.174349
"Life expectancy at birth, total (years)",0.735921,-0.824096,0.521309,-0.257005,0.041759,0.233178,-0.046631,1.0,0.77398,0.578146,0.798922,0.625385,0.839389,0.740662,0.764456,0.63544,-0.619253
"Lower secondary completion rate, total (% of relevant age group)",0.721093,-0.813774,0.440282,-0.287535,0.08317,0.225791,-0.105958,0.77398,1.0,0.567112,0.683306,0.564698,0.791798,0.800075,0.849312,0.755458,-0.617746
"Nurses and midwives (per 1,000 people)",0.398881,-0.601862,0.631227,-0.036721,-0.286366,0.190751,-0.198248,0.578146,0.567112,1.0,0.500462,0.501681,0.679637,0.554273,0.388765,0.457379,-0.566137


In [22]:
# Per-year non-null counts after the sparse columns were removed.
mortality.groupby(level='Year').count()

Series Name,"Adjusted net enrollment rate, primary (% of primary school age children)","Age dependency ratio, young (% of working-age population)",Electric power consumption (kWh per capita),"Employment to population ratio, 15+, total (%) (modeled ILO estimate)",Female genital mutilation prevalence (%),GDP (constant 2010 US$),GDP growth (annual %),"Life expectancy at birth, total (years)","Lower secondary completion rate, total (% of relevant age group)","Nurses and midwives (per 1,000 people)",People using safely managed drinking water services (% of population),People using safely managed sanitation services (% of population),People with basic handwashing facilities including soap and water (% of population),"Persistence to last grade of primary, total (% of cohort)","Primary completion rate, total (% of relevant age group)",Progression to secondary school (%),"Pupil-teacher ratio, secondary"
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1
1990,64,183,131,0,1,155,147,182,56,14,0,0,0,53,73,42,68
1991,62,183,132,180,0,156,156,183,55,13,0,0,0,67,77,52,77
1992,64,182,132,180,0,159,157,182,56,14,0,0,0,60,83,47,70
1993,63,182,132,180,0,160,160,182,59,12,0,0,0,63,79,51,84
1994,76,182,132,180,0,162,161,182,64,14,0,0,0,61,87,40,84
1995,71,183,134,180,3,170,163,182,53,20,0,0,0,63,83,46,76
1996,73,183,134,180,2,171,171,182,49,18,0,0,0,53,79,40,67
1997,61,183,134,180,1,172,172,183,46,25,0,0,0,38,68,19,51
1998,66,183,134,180,2,172,173,182,24,27,0,0,0,66,65,58,55
1999,115,183,134,180,3,173,173,182,75,31,0,0,0,97,119,92,102


In [23]:
# Swap the two row-index levels so the order becomes (Year, Country Name).
# Nothing is removed here; the levels only trade places, which decides the
# column order once the index is reset.
mortality = mortality.swaplevel(i='Country Name', j='Year', axis=0)

In [24]:
# Move the index levels ('Year' and 'Country Name') back into ordinary columns
# and replace the row index with a default integer index.
mortality = mortality.reset_index()

In [25]:
# Exclude the rows whose 'Country Name' is exactly 'World' (an aggregate, not a country).
# NOTE(review): only this exact label is filtered — check whether the data
# contains other aggregate entries that should be excluded too.
mortality = mortality.loc[mortality['Country Name'].ne('World')]

In [26]:
# Coverage check per country: number of non-null values in each column.
mortality.groupby('Country Name').count()

Series Name,Year,"Adjusted net enrollment rate, primary (% of primary school age children)","Age dependency ratio, young (% of working-age population)",Electric power consumption (kWh per capita),"Employment to population ratio, 15+, total (%) (modeled ILO estimate)",Female genital mutilation prevalence (%),GDP (constant 2010 US$),GDP growth (annual %),"Life expectancy at birth, total (years)","Lower secondary completion rate, total (% of relevant age group)","Nurses and midwives (per 1,000 people)",People using safely managed drinking water services (% of population),People using safely managed sanitation services (% of population),People with basic handwashing facilities including soap and water (% of population),"Persistence to last grade of primary, total (% of cohort)","Primary completion rate, total (% of relevant age group)",Progression to secondary school (%),"Pupil-teacher ratio, secondary"
Country Name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1
Afghanistan,26,1,26,0,25,0,14,13,26,2,6,0,0,11,0,1,0,5
Albania,26,13,26,25,25,0,26,26,26,13,3,16,16,0,13,14,12,12
Algeria,26,23,26,25,25,0,26,26,26,25,3,0,16,7,24,25,24,8
Angola,26,5,26,25,25,0,26,26,26,3,3,0,0,4,3,5,2,5
Argentina,26,18,26,25,25,0,26,26,26,17,6,16,16,0,19,21,18,11
Armenia,26,10,26,25,25,0,26,25,26,10,8,16,0,16,12,14,10,3
Australia,26,26,26,25,25,0,26,26,26,0,9,0,16,0,0,0,0,0
Austria,26,0,26,25,25,0,26,26,26,12,10,16,16,0,9,9,7,24
Azerbaijan,26,25,26,25,25,0,26,25,26,21,8,16,0,0,22,23,22,0
"Bahamas, The",26,11,26,0,25,0,26,26,26,7,3,0,0,0,5,8,4,12


In [396]:
# Write the cleaned frame to 'mortality.csv' in the working directory.
# NOTE(review): to_csv writes the row index as an extra unnamed first column by
# default; pass index=False if downstream readers do not expect it.
mortality.to_csv('mortality.csv')