In [1]:
import numpy as np
import pandas as pd
import wbdata
import random
import re
from sklearn.preprocessing import Imputer

In [2]:
columns = ['Country', 'Year', 'Status', 'Life_Expectancy', 
           'Adult_Mortality', 'Infant_Deaths', 'Alcohol', 
           'Percentage_Expenditure', 'Measles', 'BMI_5-19_years',
           'BMI_18+_years','Under-Five_Deaths', 'Polio', 
           'Total_Expenditure', 'Diphtheria', 'GDP', 
           'Population','Thinness_10-19_years', 
           'Thinness_5-9_years','Income_Composition_Of_Resources', 'Schooling']
main_data = pd.DataFrame(columns=columns)

In [3]:
len(main_data.columns)

21

## COMMON REGEX

In [4]:
# Sometimes two integers popup in the same cell
regex_double_nums = re.compile(r'^[\d]+([\d]+|.[\d]+) [\d]+([\d]+|.[\d]+)$')

## Population Data

In [5]:
#wbdata.search_indicators('Population')

In [6]:
#set up the indicator I want (just build up the dict if you want more than one)
indicators = {'SP.POP.TOTL':'Population'}

In [7]:
#grab indicators above for all countries and load into data frame
pop_df_in = wbdata.get_dataframe(indicators, convert_date=False)

In [8]:
pop_df_in.to_csv("Data/New/Population/Population_Internet.csv", encoding='utf-8')

In [9]:
pop_df_get = pd.read_csv("Data/New/Population/Population_Internet.csv")
pop_df = pop_df_get.rename(index = str, columns={'date':'Year', 'country':'Country'})
len(pop_df['Country'].unique())

264

In [10]:
# Removing continents and other trivial rows
pop_df.drop(pop_df.index[:2773], inplace=True)
len(pop_df['Country'].unique())

217

In [11]:
# Year: 2000 - 2014
pop_df = pop_df[(lambda x: x['Year'].isin(range(2000,2015)))]

In [12]:
pop_df.reset_index(drop=True, inplace=True)

In [13]:
pop_df.head()

Unnamed: 0,Country,Year,Population
0,Afghanistan,2014,32758020.0
1,Afghanistan,2013,31731688.0
2,Afghanistan,2012,30696958.0
3,Afghanistan,2011,29708599.0
4,Afghanistan,2010,28803167.0


In [14]:
# Fixing Missing Values
pop_df.at[915, 'Population'] = 5054634
pop_df.at[916, 'Population'] = 4945529
pop_df.at[917, 'Population'] = 4840901

In [15]:
main_data[['Country', 'Year', 'Population']] = pop_df[['Country', 'Year', 'Population']]

In [16]:
main_data['Population'].isnull().sum()
#main_data.info()

0

In [17]:
#main_data[main_data['Country'] == "Vietnam"]

## GDP

In [18]:
#set up the indicator I want (just build up the dict if you want more than one)
indicators = {'NY.GDP.PCAP.CD':'GDP'}

In [19]:
#grab indicators above for countires above and load into data frame
gdp_df = wbdata.get_dataframe(indicators, convert_date=False)

In [20]:
gdp_df.to_csv("Data/New/GDP/GDP_Internet.csv", encoding='utf-8')
gdp_data_get = pd.read_csv("Data/New/GDP/GDP_Internet.csv")
gdp_data = gdp_data_get.rename(index = str, columns={'date':'Year', 'country':'Country'})
#gdp_data[gdp_data['Country'] == "South Sudan"]

In [21]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(gdp_data[gdp_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            gdp_other_data = gdp_data[gdp_data['Country'] == main_data['Country'][val]][gdp_data['Year'] == main_data['Year'][val]]['GDP'].values[0]
            print(gdp_other_data, "pass: 1")
            main_data.at[val, 'GDP'] = gdp_other_data
        except IndexError:
            pass

0  625.3395388284999 pass: 1
1  647.966460473683 pass: 1
2  648.511069587633 pass: 1
3  599.29762975711 pass: 1
4  550.514973976336 pass: 1
5  444.18440407545 pass: 1
6  370.382293977374 pass: 1
7  366.230443242864 pass: 1
8  269.22969301812304 pass: 1
9  247.664139959638 pass: 1
10  216.708128851229 pass: 1
11  195.77663034155103 pass: 1
12  184.49471212204898 pass: 1
13  nan pass: 1
14  nan pass: 1
15  4578.6679344615895 pass: 1
16  4413.08288688408 pass: 1
17  4247.614342362921 pass: 1
18  4437.177794486521 pass: 1
19  4094.36020359235 pass: 1
20  4114.13489916342 pass: 1
21  4370.5399247769 pass: 1
22  3595.0380568289293 pass: 1
23  2972.74292399799 pass: 1
24  2673.78658429559 pass: 1
25  2373.58129170055 pass: 1
26  1846.12012081207 pass: 1
27  1425.12421860142 pass: 1
28  1281.6598256178 pass: 1
29  1126.68334010717 pass: 1
30  5466.42577841535 pass: 1
31  5471.123388787089 pass: 1
32  5565.134521048481 pass: 1
33  5432.413319781161 pass: 1
34  4463.39467488951 pass: 1
35  3868.

  """


 pass: 1
53  nan pass: 1
54  nan pass: 1
55  11598.7517362051 pass: 1
56  11589.8530023324 pass: 1
57  11660.329531051999 pass: 1
58  10375.9942154736 pass: 1
59  10352.8227618312 pass: 1
60  42294.9947269717 pass: 1
61  40619.711297779504 pass: 1
62  38391.080866978504 pass: 1
63  41098.766941722795 pass: 1
64  39736.3540626699 pass: 1
65  43339.3798746543 pass: 1
66  47785.6590856793 pass: 1
67  48582.808455086604 pass: 1
68  43748.772158899905 pass: 1
69  41282.0201219785 pass: 1
70  38503.479614485695 pass: 1
71  32776.4422698769 pass: 1
72  24741.4935704562 pass: 1
73  22228.8464928922 pass: 1
74  21936.530101470802 pass: 1
75  5412.6923476178 pass: 1
76  5258.40737644433 pass: 1
77  5102.4899693158895 pass: 1
78  4615.86747457004 pass: 1
79  3585.90555256868 pass: 1
80  3117.89694392484 pass: 1
81  4068.97845646361 pass: 1
82  3108.26864317894 pass: 1
83  2585.1335220492897 pass: 1
84  1890.8497268156898 pass: 1
85  1248.40490589113 pass: 1
86  978.5389338872909 pass: 1
87  869.8

340  1097.45708762103 pass: 1
341  997.7417140733031 pass: 1
342  885.638224530948 pass: 1
343  807.938767268667 pass: 1
344  765.8632357656951 pass: 1
345  3124.00030982516 pass: 1
346  2947.9385262805104 pass: 1
347  2645.2277526014605 pass: 1
348  2377.68877123935 pass: 1
349  1981.1701161847602 pass: 1
350  1776.86647562189 pass: 1
351  1736.93008403587 pass: 1
352  1389.62934991949 pass: 1
353  1233.59186917076 pass: 1
354  1046.4273841431698 pass: 1
355  978.334648481852 pass: 1
356  917.3643104861699 pass: 1
357  913.575642272268 pass: 1
358  958.236652408901 pass: 1
359  1007.0028688845099 pass: 1
360  5204.24371841169 pass: 1
361  5042.58221304612 pass: 1
362  4722.013403067271 pass: 1
363  5054.32534423757 pass: 1
364  4614.8290411405 pass: 1
365  4701.33442641347 pass: 1
366  5078.31457720914 pass: 1
367  4180.913531981741 pass: 1
368  3403.8152971587297 pass: 1
369  2967.8340564335604 pass: 1
370  2802.27491705489 pass: 1
371  2214.73224591872 pass: 1
372  1761.537647188610

661  458.238406189045 pass: 1
662  424.859318512183 pass: 1
663  387.32357961186403 pass: 1
664  334.231702517329 pass: 1
665  298.806956230642 pass: 1
666  327.767654268638 pass: 1
667  286.507537174865 pass: 1
668  255.591313804132 pass: 1
669  218.52350917279801 pass: 1
670  194.166786345182 pass: 1
671  173.916351831834 pass: 1
672  175.13607148129398 pass: 1
673  153.69957329168003 pass: 1
674  405.469653093749 pass: 1
675  2910.52022576864 pass: 1
676  2964.5729890305797 pass: 1
677  2952.05234806594 pass: 1
678  3196.6475237082395 pass: 1
679  2737.34233022991 pass: 1
680  2255.33311863864 pass: 1
681  2881.59411605216 pass: 1
682  2111.20948856339 pass: 1
683  2012.1100704730602 pass: 1
684  1637.06438124572 pass: 1
685  1289.33783690965 pass: 1
686  998.101311670601 pass: 1
687  886.361665299432 pass: 1
688  842.7090677443041 pass: 1
689  998.196856210498 pass: 1
690  10630.9979007564 pass: 1
691  10569.6663143709 pass: 1
692  9985.36958968047 pass: 1
693  9186.59638994181 pas

963  354.846354368724 pass: 1
964  341.309909200504 pass: 1
965  379.756638540888 pass: 1
966  325.382554265056 pass: 1
967  243.30268224694598 pass: 1
968  193.79490564251597 pass: 1
969  161.626624773078 pass: 1
970  135.762385796471 pass: 1
971  118.87344658163201 pass: 1
972  111.363435555958 pass: 1
973  120.17892791115 pass: 1
974  123.876205729993 pass: 1
975  57543.6690591516 pass: 1
976  53612.825003877304 pass: 1
977  48421.8030715067 pass: 1
978  50789.0486039991 pass: 1
979  47397.9029229641 pass: 1
980  46521.501713475496 pass: 1
981  49773.1668730863 pass: 1
982  47024.229698072595 pass: 1
983  40719.5750317748 pass: 1
984  35847.453564998395 pass: 1
985  34979.0816995871 pass: 1
986  30993.0770616633 pass: 1
987  26553.7465597833 pass: 1
988  24300.3785998986 pass: 1
989  22479.578988392 pass: 1
990  5061.397574568859 pass: 1
991  4763.06895557778 pass: 1
992  4546.73850445133 pass: 1
993  4353.12139240993 pass: 1
994  3651.9667840554603 pass: 1
995  3369.4082466578197 p

1251  2568.61890785298 pass: 1
1252  2326.85195436274 pass: 1
1253  1945.6400342675897 pass: 1
1254  1098.45521561333 pass: 1
1255  1048.11053410866 pass: 1
1256  988.3050590665069 pass: 1
1257  965.749284085495 pass: 1
1258  946.7002572561411 pass: 1
1259  946.0599371665669 pass: 1
1260  830.113881624145 pass: 1
1261  810.265607301884 pass: 1
1262  766.8437623188879 pass: 1
1263  740.935845216079 pass: 1
1264  662.279518162433 pass: 1
1265  668.297604584601 pass: 1
1266  674.756414674589 pass: 1
1267  615.8202308278791 pass: 1
1268  505.470620633981 pass: 1
1269  465.310386508996 pass: 1
1270  387.942891069774 pass: 1
1271  329.782094609998 pass: 1
1272  393.016060861473 pass: 1
1273  413.737737605203 pass: 1
1274  462.481438106584 pass: 1
1275  2242.70745940423 pass: 1
1276  2136.7717179207502 pass: 1
1277  2178.38855524013 pass: 1
1278  2120.5894686048 pass: 1
1279  1932.8582899968899 pass: 1
1280  1815.48949644078 pass: 1
1281  1751.59585650768 pass: 1
1282  1592.5721816707598 pass

1588  1490.3610325022598 pass: 1
1589  1087.76240120887 pass: 1
1590  42996.3152212942 pass: 1
1591  48399.8078177184 pass: 1
1592  51264.0713358672 pass: 1
1593  48268.591204554294 pass: 1
1594  38497.6169579293 pass: 1
1595  37567.301210596204 pass: 1
1596  55571.9980595751 pass: 1
1597  45793.976143914806 pass: 1
1598  42717.557253307 pass: 1
1599  35490.2613236708 pass: 1
1600  26921.0827767441 pass: 1
1601  22071.5696085573 pass: 1
1602  17789.419812619 pass: 1
1603  16540.9676143149 pass: 1
1604  18389.384328288997 pass: 1
1605  1279.7697826598599 pass: 1
1606  1282.43716202467 pass: 1
1607  1177.9747348784801 pass: 1
1608  1123.8831680627 pass: 1
1609  880.037775119109 pass: 1
1610  871.224389337854 pass: 1
1611  966.393627185372 pass: 1
1612  721.768690838857 pass: 1
1613  543.110702403072 pass: 1
1614  476.552129968975 pass: 1
1615  433.234976590867 pass: 1
1616  380.50733975156 pass: 1
1617  321.726606346204 pass: 1
1618  308.40877673732797 pass: 1
1619  279.620424920086 pass

1962  89061.0513003609 pass: 1
1963  82552.5667888765 pass: 1
1964  82534.8736232049 pass: 1
1965  4181.5833128422 pass: 1
1966  4385.37935468846 pass: 1
1967  4368.0822475510795 pass: 1
1968  3769.5952691587895 pass: 1
1969  2650.3536483043804 pass: 1
1970  1717.89876129974 pass: 1
1971  2139.62563086411 pass: 1
1972  1634.0814313969 pass: 1
1973  1334.65189612629 pass: 1
1974  998.822667102654 pass: 1
1975  797.8377432266079 pass: 1
1976  646.056129497955 pass: 1
1977  571.501883026268 pass: 1
1978  524.014592388925 pass: 1
1979  474.213336086127 pass: 1
1980  7378.341021527041 pass: 1
1981  7186.431924061809 pass: 1
1982  6586.7192089878 pass: 1
1983  7318.74244854117 pass: 1
1984  6682.28115774575 pass: 1
1985  6727.10776676969 pass: 1
1986  7367.751909108821 pass: 1
1987  5976.391922117671 pass: 1
1988  4425.680912910129 pass: 1
1989  3674.6179242796998 pass: 1
1990  3380.16512135859 pass: 1
1991  2789.15906483509 pass: 1
1992  2106.6350684523 pass: 1
1993  1909.5987018617898 pass

2337  1000.0681684256599 pass: 1
2338  957.280749688589 pass: 1
2339  1038.9110175487199 pass: 1
2340  14345.1860569374 pass: 1
2341  13780.1906069881 pass: 1
2342  13143.5212186872 pass: 1
2343  13890.6962382966 pass: 1
2344  12597.862389964099 pass: 1
2345  11527.5932279825 pass: 1
2346  14001.4468819804 pass: 1
2347  11255.4366982999 pass: 1
2348  9038.73084652356 pass: 1
2349  8021.003655337259 pass: 1
2350  6681.17881781198 pass: 1
2351  5693.377763225971 pass: 1
2352  5196.93292103894 pass: 1
2353  4981.1986188017 pass: 1
2354  4492.7276035593795 pass: 1
2355  22077.5361325219 pass: 1
2356  21618.7353389663 pass: 1
2357  20577.4026375899 pass: 1
2358  23196.1837500759 pass: 1
2359  22538.654077348197 pass: 1
2360  23063.9716141302 pass: 1
2361  24815.608835662202 pass: 1
2362  22780.0584505513 pass: 1
2363  19821.444626863202 pass: 1
2364  18784.9484992149 pass: 1
2365  18045.588099483302 pass: 1
2366  15772.7333950542 pass: 1
2367  12882.288973030802 pass: 1
2368  11729.14616298

2711  982.641882183568 pass: 1
2712  867.6360436681 pass: 1
2713  832.7451401996941 pass: 1
2714  869.495692083353 pass: 1
2715  17061.302955574698 pass: 1
2716  15977.283829131798 pass: 1
2717  15219.1976045753 pass: 1
2718  15742.9552936912 pass: 1
2719  14904.9484156759 pass: 1
2720  15074.212785805901 pass: 1
2721  15762.704462517 pass: 1
2722  14541.885791743602 pass: 1
2723  13355.565670934098 pass: 1
2724  11884.7778090159 pass: 1
2725  11032.716834322 pass: 1
2726  10280.8174653888 pass: 1
2727  10662.913460785601 pass: 1
2728  10337.9802615949 pass: 1
2729  9554.38125224542 pass: 1
2730  8596.351698284008 pass: 1
2731  8367.27621963304 pass: 1
2732  8216.015523631271 pass: 1
2733  8272.39454697 pass: 1
2734  8008.19716459999 pass: 1
2735  7384.2702498314 pass: 1
2736  7576.682337697579 pass: 1
2737  7634.7461109428505 pass: 1
2738  6855.10376313063 pass: 1
2739  6203.53629341865 pass: 1
2740  5878.142850001271 pass: 1
2741  5485.336050145061 pass: 1
2742  5034.43387554853 pass

3086  34173.9799764342 pass: 1
3087  29785.986287584 pass: 1
3088  27427.58750236 pass: 1
3089  27982.3557635787 pass: 1
3090  54696.72616523269 pass: 1
3091  52782.086508871 pass: 1
3092  51450.9591148182 pass: 1
3093  49793.713524920095 pass: 1
3094  48375.4069462972 pass: 1
3095  47001.555349681796 pass: 1
3096  48401.4273403899 pass: 1
3097  48061.5376613353 pass: 1
3098  46437.067117306506 pass: 1
3099  44307.9205848603 pass: 1
3100  41921.8097617892 pass: 1
3101  39677.1983481058 pass: 1
3102  38166.0378407812 pass: 1
3103  37273.6181034176 pass: 1
3104  36449.855115534905 pass: 1
3105  16737.8982724965 pass: 1
3106  16881.2056763151 pass: 1
3107  15092.068191845101 pass: 1
3108  14166.4990866454 pass: 1
3109  11938.212001755 pass: 1
3110  9415.17038173445 pass: 1
3111  9062.31217136226 pass: 1
3112  7009.69704965585 pass: 1
3113  5877.876078469661 pass: 1
3114  5220.95111632219 pass: 1
3115  4117.308853330071 pass: 1
3116  3622.05228427976 pass: 1
3117  4088.76885515511 pass: 1


In [22]:
main_data[main_data['GDP'].isnull()]['Country'].unique()

array(['Afghanistan', 'American Samoa', 'Bermuda',
       'British Virgin Islands', 'Cayman Islands', 'Channel Islands',
       'Curacao', 'Eritrea', 'French Polynesia', 'Gibraltar', 'Guam',
       'Iraq', 'Korea, Dem. People���s Rep.', 'Nauru', 'New Caledonia',
       'Northern Mariana Islands', 'Sao Tome and Principe',
       'Sint Maarten (Dutch part)', 'Somalia', 'South Sudan',
       'St. Martin (French part)', 'Syrian Arab Republic',
       'Turks and Caicos Islands', 'Virgin Islands (U.S.)'], dtype=object)

In [23]:
#main_data[main_data['GDP'].isnull()][main_data['Country'] == "Afghanistan"][['Country','Year','GDP']]

In [24]:
main_data[main_data['Country'] == "South Sudan"][['Country', 'Year', 'GDP']]
len(main_data['Country'].unique())

217

In [25]:
# Dropping "South Sudan" - Many missing values
# main_data.drop(main_data[main_data['Country'] == "South Sudan"].index, inplace=True)

In [26]:
#af_test = main_data[main_data['Country'] == "Afghanistan"]
# len(main_data['Country'].unique())

In [27]:
# DEALING WITH MISSING VALUES
# imp=Imputer(missing_values="NaN", strategy="most_frequent" )
# imp.fit(af_test[["GDP"]])
# af_test["GDP"]=imp.transform(af_test[["GDP"]]).ravel()

In [28]:
# af_test["GDP"]

## Total Expenditure

In [29]:
totalex = pd.read_csv("Data/New/Total_Expenditure/data_internet.csv")

In [30]:
count = 0
totalex_data = pd.DataFrame(columns=['Country', 'Year', 'Total_Expenditure'])
for i in range(0, len(totalex['Country'].unique())):
    for j in range(1, len(totalex.columns)):
        #print(totalex.loc[i,'Country'], end='')
        totalex_data.at[count, 'Country'] = totalex.loc[i,'Country']
        totalex_data.at[count, 'Year'] = totalex.columns[j]
       # print(totalex.columns[j])
        totalex_data.at[count, 'Total_Expenditure'] = totalex[totalex['Country'] == totalex['Country'][i]].T[1:].loc[totalex.columns[j]].values[0]
        count+=1

In [31]:
# Dropping "South Sudan" - Many missing values
# totalex_data.drop(totalex_data[totalex_data['Country'] == "South Sudan"].index, inplace=True)

In [32]:
totalex_data['Year'] = totalex_data['Year'].astype(np.int64)
#totalex_data.info()

In [33]:
totalex_data.to_pickle("Data/New/Total_Expenditure/totalex_pickle_data.pkl")

In [34]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(totalex_data[totalex_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            totalex_other_data = totalex_data[totalex_data['Country'] == main_data['Country'][val]][totalex_data['Year'] == main_data['Year'][val]]['Total_Expenditure'].values[0]
            print(totalex_other_data, "pass: 1")
            main_data.at[val, 'Total_Expenditure'] = totalex_other_data
        except IndexError:
            pass
    else:
        try:
            totalex_other_data = totalex_data[totalex_data['Country'].str.startswith(main_data['Country'][val])][totalex_data['Year'] == main_data['Year'][val]]['Total_Expenditure'].values[0]
            print(totalex_other_data, "pass: 2")
            main_data.at[val, 'Total_Expenditure'] = totalex_other_data
        except IndexError:
            try:
                totalex_other_data = totalex_data[totalex_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][totalex_data['Year'] == main_data['Year'][val]]['Total_Expenditure'].values[0]
                print(totalex_other_data, "pass: 3")
                main_data.at[val, 'Total_Expenditure'] = totalex_other_data
            except IndexError:
                pass
        

0  12.0 pass: 1
1  10.59 pass: 1
2  11.67 pass: 1
3  10.17 pass: 1
4  14.4 pass: 1
5  12.73 pass: 1
6  6.93 pass: 1
7  2.95 pass: 1
8  6.3 pass: 1
9  5.49 pass: 1
10  6.98 pass: 1
11  5.58 pass: 1
12  8.99 pass: 1
13  nan pass: 1
14  nan pass: 1
15  9.37 pass: 1
16  9.76 pass: 1
17  9.71 pass: 1
18  9.85 pass: 1
19  8.46 pass: 1
20  8.46 pass: 1
21  8.37 pass: 1
22  8.88 pass: 1
23  9.04 pass: 1
24  9.67 pass: 1
25  9.18 pass: 1
26  7.76 pass: 1
27  7.19 pass: 1
28  7.25 pass: 1
29  7.08 pass: 1
30  9.9 pass: 1
31  9.95 pass: 1
32  9.99 pass: 1
33  9.37 pass: 1
34  9.65 pass: 1
35  9.01 pass: 1
36  8.07 pass: 1
37  8.14 pass: 1
38  7.8 pass: 1
39  8.19 pass: 1
40  8.48 pass: 1
41  8.5 pass: 1
42  8.37 pass: 1
43  8.54 pass: 1
44  8.79 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  27.92 pass: 1
61  22.32 pass: 1
62  

  """
  if sys.path[0] == '':


18.88 pass: 1
63  19.31 pass: 1
64  24.04 pass: 1
65  25.1 pass: 1
66  24.04 pass: 1
67  22.85 pass: 1
68  19.38 pass: 1
69  19.5 pass: 1
70  22.7 pass: 1
71  21.98 pass: 1
72  19.99 pass: 1
73  19.24 pass: 1
74  19.08 pass: 1
75  5.0 pass: 1
76  7.42 pass: 1
77  5.57 pass: 1
78  5.58 pass: 1
79  5.43 pass: 1
80  6.36 pass: 1
81  6.46 pass: 1
82  6.42 pass: 1
83  9.56 pass: 1
84  6.08 pass: 1
85  6.25 pass: 1
86  4.61 pass: 1
87  3.38 pass: 1
88  5.77 pass: 1
89  2.86 pass: 1
90  18.08 pass: 1
91  16.29 pass: 1
92  17.16 pass: 1
93  15.18 pass: 1
94  16.36 pass: 1
95  11.38 pass: 1
96  12.27 pass: 1
97  10.81 pass: 1
98  10.07 pass: 1
99  12.08 pass: 1
100  10.69 pass: 1
101  11.89 pass: 1
102  9.88 pass: 1
103  10.75 pass: 1
104  11.42 pass: 1
105  6.92 pass: 1
106  7.72 pass: 1
107  8.74 pass: 1
108  11.82 pass: 1
109  14.07 pass: 1
110  17.13 pass: 1
111  15.79 pass: 1
112  15.37 pass: 1
113  16.35 pass: 1
114  16.67 pass: 1
115  16.92 pass: 1
116  17.27 pass: 1
117  18.23 pass: 1
1

585  586  587  588  589  590  591  592  593  594  595  596  597  598  599  600  15.88 pass: 1
601  15.32 pass: 1
602  14.65 pass: 1
603  14.34 pass: 1
604  13.8 pass: 1
605  14.06 pass: 1
606  13.56 pass: 1
607  13.72 pass: 1
608  13.45 pass: 1
609  12.54 pass: 1
610  12.67 pass: 1
611  12.02 pass: 1
612  15.14 pass: 1
613  14.96 pass: 1
614  14.5 pass: 1
615  10.43 pass: 1
616  10.28 pass: 1
617  10.49 pass: 1
618  10.62 pass: 1
619  10.24 pass: 1
620  10.31 pass: 1
621  10.13 pass: 1
622  11.06 pass: 1
623  9.94 pass: 1
624  9.79 pass: 1
625  10.0 pass: 1
626  9.54 pass: 1
627  9.26 pass: 1
628  9.29 pass: 1
629  10.82 pass: 1
630  18.14 pass: 1
631  18.14 pass: 1
632  18.87 pass: 1
633  20.55 pass: 1
634  18.1 pass: 1
635  18.29 pass: 1
636  18.0 pass: 1
637  16.7 pass: 1
638  16.44 pass: 1
639  15.71 pass: 1
640  15.38 pass: 1
641  18.6 pass: 1
642  16.72 pass: 1
643  16.88 pass: 1
644  19.3 pass: 1
645  8.66 pass: 1
646  7.38 pass: 1
647  9.94 pass: 1
648  7.19 pass: 1
649  6.15 p

1098  18.58 pass: 1
1099  18.15 pass: 1
1100  18.31 pass: 1
1101  18.13 pass: 1
1102  18.06 pass: 1
1103  17.58 pass: 1
1104  17.33 pass: 1
1105  17.1 pass: 1
1106  17.34 pass: 1
1107  17.31 pass: 1
1108  17.13 pass: 1
1109  17.87 pass: 1
1110  6.82 pass: 1
1111  10.58 pass: 1
1112  9.32 pass: 1
1113  14.03 pass: 1
1114  14.93 pass: 1
1115  16.45 pass: 1
1116  13.15 pass: 1
1117  16.16 pass: 1
1118  13.98 pass: 1
1119  15.08 pass: 1
1120  12.58 pass: 1
1121  8.33 pass: 1
1122  8.45 pass: 1
1123  9.34 pass: 1
1124  7.85 pass: 1
1125  1126  1127  1128  1129  1130  1131  1132  1133  1134  1135  1136  1137  1138  1139  1140  9.98 pass: 1
1141  9.98 pass: 1
1142  11.37 pass: 1
1143  12.32 pass: 1
1144  11.85 pass: 1
1145  12.54 pass: 1
1146  11.51 pass: 1
1147  12.06 pass: 1
1148  12.84 pass: 1
1149  12.35 pass: 1
1150  10.31 pass: 1
1151  11.05 pass: 1
1152  11.04 pass: 1
1153  11.19 pass: 1
1154  9.83 pass: 1
1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  11

1605  1606  1607  1608  1609  1610  1611  1612  1613  1614  1615  1616  1617  1618  1619  1620  1621  1622  1623  1624  1625  1626  1627  1628  1629  1630  1631  1632  1633  1634  1635  9.81 pass: 1
1636  9.81 pass: 1
1637  9.81 pass: 1
1638  10.08 pass: 1
1639  9.08 pass: 1
1640  9.31 pass: 1
1641  10.55 pass: 1
1642  11.84 pass: 1
1643  11.37 pass: 1
1644  10.15 pass: 1
1645  10.26 pass: 1
1646  9.31 pass: 1
1647  9.11 pass: 1
1648  9.03 pass: 1
1649  8.68 pass: 1
1650  10.72 pass: 1
1651  10.72 pass: 1
1652  10.72 pass: 1
1653  9.56 pass: 1
1654  9.19 pass: 1
1655  9.66 pass: 1
1656  9.07 pass: 1
1657  10.45 pass: 1
1658  9.95 pass: 1
1659  11.8 pass: 1
1660  11.04 pass: 1
1661  9.73 pass: 1
1662  10.29 pass: 1
1663  9.72 pass: 1
1664  7.58 pass: 1
1665  13.08 pass: 1
1666  12.82 pass: 1
1667  13.12 pass: 1
1668  14.48 pass: 1
1669  13.2 pass: 1
1670  11.03 pass: 1
1671  9.83 pass: 1
1672  10.0 pass: 1
1673  7.77 pass: 1
1674  6.71 pass: 1
1675  8.69 pass: 1
1676  8.33 pass: 1
1677 

2100  2101  2102  2103  2104  2105  2106  2107  2108  2109  2110  2111  2112  2113  2114  2115  23.36 pass: 1
2116  23.36 pass: 1
2117  23.13 pass: 1
2118  21.71 pass: 1
2119  19.78 pass: 1
2120  22.47 pass: 1
2121  21.61 pass: 1
2122  18.06 pass: 1
2123  18.06 pass: 1
2124  17.69 pass: 1
2125  17.4 pass: 1
2126  16.71 pass: 1
2127  17.14 pass: 1
2128  15.89 pass: 1
2129  15.71 pass: 1
2130  23.95 pass: 1
2131  19.84 pass: 1
2132  18.68 pass: 1
2133  19.11 pass: 1
2134  19.83 pass: 1
2135  19.99 pass: 1
2136  18.11 pass: 1
2137  18.82 pass: 1
2138  17.13 pass: 1
2139  18.6 pass: 1
2140  19.22 pass: 1
2141  20.2 pass: 1
2142  18.77 pass: 1
2143  15.56 pass: 1
2144  13.12 pass: 1
2145  7.57 pass: 1
2146  7.57 pass: 1
2147  7.6 pass: 1
2148  8.58 pass: 1
2149  10.69 pass: 1
2150  10.66 pass: 1
2151  11.38 pass: 1
2152  12.24 pass: 1
2153  16.08 pass: 1
2154  14.78 pass: 1
2155  8.97 pass: 1
2156  9.39 pass: 1
2157  9.89 pass: 1
2158  10.1 pass: 1
2159  8.43 pass: 1
2160  8.17 pass: 1
2161

2580  2581  2582  2583  2584  2585  2586  2587  2588  2589  2590  2591  2592  2593  2594  2595  2596  2597  2598  2599  2600  2601  2602  2603  2604  2605  2606  2607  2608  2609  2610  12.83 pass: 1
2611  11.22 pass: 1
2612  14.06 pass: 1
2613  13.38 pass: 1
2614  13.6 pass: 1
2615  14.23 pass: 1
2616  14.28 pass: 1
2617  13.66 pass: 1
2618  13.81 pass: 1
2619  13.78 pass: 1
2620  13.63 pass: 1
2621  13.66 pass: 1
2622  13.69 pass: 1
2623  13.27 pass: 1
2624  13.15 pass: 1
2625  12.54 pass: 1
2626  13.12 pass: 1
2627  13.34 pass: 1
2628  13.98 pass: 1
2629  20.32 pass: 1
2630  21.1 pass: 1
2631  15.07 pass: 1
2632  19.67 pass: 1
2633  25.35 pass: 1
2634  28.48 pass: 1
2635  23.89 pass: 1
2636  20.26 pass: 1
2637  19.91 pass: 1
2638  34.41 pass: 1
2639  20.75 pass: 1
2640  2641  2642  2643  2644  2645  2646  2647  2648  2649  2650  2651  2652  2653  2654  2655  14.23 pass: 1
2656  14.23 pass: 1
2657  14.44 pass: 1
2658  14.56 pass: 1
2659  14.11 pass: 1
2660  13.29 pass: 1
2661  13.48 

3145  18.69 pass: 1
3146  17.22 pass: 1
3147  12.64 pass: 1
3148  11.97 pass: 1
3149  10.49 pass: 1
3150  5.8 pass: 3
3151  6.38 pass: 3
3152  5.91 pass: 3
3153  8.83 pass: 3
3154  9.11 pass: 3
3155  8.96 pass: 3
3156  4.33 pass: 3
3157  6.57 pass: 3
3158  8.49 pass: 3
3159  8.31 pass: 3
3160  8.33 pass: 3
3161  6.71 pass: 3
3162  7.32 pass: 3
3163  7.41 pass: 3
3164  7.32 pass: 3
3165  3166  3167  3168  3169  3170  3171  3172  3173  3174  3175  3176  3177  3178  3179  3180  3181  3182  3183  3184  3185  3186  3187  3188  3189  3190  3191  3192  3193  3194  3195  3196  3197  3198  3199  3200  3201  3202  3203  3204  3205  3206  3207  3208  3209  3210  3.93 pass: 3
3211  3.93 pass: 3
3212  3.93 pass: 3
3213  4.3 pass: 3
3214  4.3 pass: 3
3215  4.3 pass: 3
3216  4.29 pass: 3
3217  4.29 pass: 3
3218  4.87 pass: 3
3219  4.79 pass: 3
3220  6.11 pass: 3
3221  7.11 pass: 3
3222  7.97 pass: 3
3223  8.58 pass: 3
3224  7.95 pass: 3
3225  11.31 pass: 1
3226  11.01 pass: 1
3227  11.35 pass: 1
3228

In [35]:
main_data[main_data['Country'].isnull()]['Country'].unique()

array([], dtype=object)

In [36]:
totalex_data[totalex_data['Country'].str.startswith("Zimbabwe")]

Unnamed: 0,Country,Year,Total_Expenditure
2865,Zimbabwe,2014,8.49
2866,Zimbabwe,2013,9.59
2867,Zimbabwe,2012,9.69
2868,Zimbabwe,2011,7.59
2869,Zimbabwe,2010,7.47
2870,Zimbabwe,2009,10.58
2871,Zimbabwe,2008,6.4
2872,Zimbabwe,2007,7.51
2873,Zimbabwe,2006,8.26
2874,Zimbabwe,2005,10.96


In [37]:
len(main_data[main_data['Total_Expenditure'].isnull()])

622

## MEASLES

In [38]:
measles = pd.read_csv("Data/New/Measles/Measles_Internet.csv")
measles.head()

Unnamed: 0,Country,2017,2016,2015,2014,2013,2012,2011,2010,2009,...,1983,1982,1981,1980,1979,1978,1977,1976,1975,1974
0,Afghanistan,1511.0,638.0,1154.0,492.0,430.0,2787.0,3013.0,1989.0,2861.0,...,18808.0,20320.0,31107.0,32455.0,43979.0,43964.0,28174.0,26.0,466.0,7.0
1,Albania,12.0,17.0,,,0.0,9.0,28.0,10.0,0.0,...,17.0,3.0,,,,,,,,
2,Algeria,112.0,41.0,63.0,0.0,25.0,18.0,112.0,103.0,107.0,...,22126.0,29584.0,20849.0,15527.0,14937.0,10696.0,12015.0,15646.0,8899.0,10517.0
3,Andorra,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,...,,,,,,,,,,
4,Angola,29.0,53.0,119.0,11699.0,8523.0,4458.0,1449.0,1190.0,2807.0,...,22589.0,30067.0,19714.0,29656.0,19682.0,20408.0,12940.0,5492.0,2153.0,5881.0


In [39]:
count = 0
measles_data = pd.DataFrame(columns=['Country', 'Year', 'Measles'])
for i in range(0, len(measles['Country'].unique())):
    for j in range(1, len(measles.columns)):
        #print(measles.loc[i,'Country'], end='')
        measles_data.at[count, 'Country'] = measles.loc[i,'Country']
        measles_data.at[count, 'Year'] = measles.columns[j]
       # print(measles.columns[j])
        measles_data.at[count, 'Measles'] = measles[measles['Country'] == measles['Country'][i]].T[1:].loc[measles.columns[j]].values[0]
        count+=1

In [40]:
measles_data['Year'] = measles_data['Year'].astype(np.int64)

In [41]:
measles_data.to_pickle("Data/New/Measles/measles_pickle_data.pkl")

In [42]:
#measles_data.tail()

In [43]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(measles_data[measles_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            measles_other_data = measles_data[measles_data['Country'] == main_data['Country'][val]][measles_data['Year'] == main_data['Year'][val]]['Measles'].values[0]
            print(measles_other_data, "pass: 1")
            main_data.at[val, 'Measles'] = measles_other_data
        except IndexError:
            pass
    else:
        try:
            measles_other_data = measles_data[measles_data['Country'].str.startswith(main_data['Country'][val])][measles_data['Year'] == main_data['Year'][val]]['Measles'].values[0]
            print(measles_other_data, "pass: 2")
            main_data.at[val, 'Measles'] = measles_other_data
        except IndexError:
            try:
                measles_other_data = measles_data[measles_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][measles_data['Year'] == main_data['Year'][val]]['Measles'].values[0]
                print(measles_other_data, "pass: 3")
                main_data.at[val, 'Measles'] = measles_other_data
            except IndexError:
                pass
        

0  492.0 pass: 1
1  430.0 pass: 1
2  2787.0 pass: 1
3  3013.0 pass: 1
4  1989.0 pass: 1
5  2861.0 pass: 1
6  1599.0 pass: 1
7  1141.0 pass: 1
8  1990.0 pass: 1
9  1296.0 pass: 1
10  466.0 pass: 1
11  798.0 pass: 1
12  2486.0 pass: 1
13  8762.0 pass: 1
14  6532.0 pass: 1
15  nan pass: 1
16  0.0 pass: 1
17  9.0 pass: 1
18  28.0 pass: 1
19  10.0 pass: 1
20  0.0 pass: 1
21  nan pass: 1
22  22.0 pass: 1
23  68.0 pass: 1
24  6.0 pass: 1
25  7.0 pass: 1
26  8.0 pass: 1
27  16.0 pass: 1
28  18.0 pass: 1
29  662.0 pass: 1
30  0.0 pass: 1
31  25.0 pass: 1
32  18.0 pass: 1
33  112.0 pass: 1
34  103.0 pass: 1
35  107.0 pass: 1
36  217.0 pass: 1
37  0.0 pass: 1
38  944.0 pass: 1
39  2302.0 pass: 1
40  3289.0 pass: 1
41  15374.0 pass: 1
42  5862.0 pass: 1
43  2686.0 pass: 1
44  nan pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  

  """
  if sys.path[0] == '':


nan pass: 1
61  0.0 pass: 1
62  0.0 pass: 1
63  0.0 pass: 1
64  0.0 pass: 1
65  0.0 pass: 1
66  0.0 pass: 1
67  0.0 pass: 1
68  0.0 pass: 1
69  0.0 pass: 1
70  0.0 pass: 1
71  0.0 pass: 1
72  1.0 pass: 1
73  5.0 pass: 1
74  2.0 pass: 1
75  11699.0 pass: 1
76  8523.0 pass: 1
77  4458.0 pass: 1
78  1449.0 pass: 1
79  1190.0 pass: 1
80  2807.0 pass: 1
81  265.0 pass: 1
82  1014.0 pass: 1
83  765.0 pass: 1
84  258.0 pass: 1
85  29.0 pass: 1
86  1196.0 pass: 1
87  11945.0 pass: 1
88  9046.0 pass: 1
89  2219.0 pass: 1
90  0.0 pass: 1
91  0.0 pass: 1
92  0.0 pass: 1
93  0.0 pass: 1
94  0.0 pass: 1
95  0.0 pass: 1
96  0.0 pass: 1
97  0.0 pass: 1
98  0.0 pass: 1
99  0.0 pass: 1
100  0.0 pass: 1
101  0.0 pass: 1
102  0.0 pass: 1
103  0.0 pass: 1
104  0.0 pass: 1
105  1.0 pass: 1
106  0.0 pass: 1
107  2.0 pass: 1
108  3.0 pass: 1
109  17.0 pass: 1
110  3.0 pass: 1
111  0.0 pass: 1
112  0.0 pass: 1
113  0.0 pass: 1
114  0.0 pass: 1
115  0.0 pass: 1
116  0.0 pass: 1
117  0.0 pass: 1
118  0.0 pass: 

609  0.0 pass: 1
610  0.0 pass: 1
611  1.0 pass: 1
612  0.0 pass: 1
613  0.0 pass: 1
614  0.0 pass: 1
615  52628.0 pass: 1
616  26883.0 pass: 1
617  6183.0 pass: 1
618  9943.0 pass: 1
619  38159.0 pass: 1
620  52461.0 pass: 1
621  131441.0 pass: 1
622  109023.0 pass: 1
623  99602.0 pass: 1
624  124219.0 pass: 1
625  70549.0 pass: 1
626  71879.0 pass: 1
627  58341.0 pass: 1
628  88962.0 pass: 1
629  71093.0 pass: 1
630  0.0 pass: 1
631  1.0 pass: 1
632  1.0 pass: 1
633  6.0 pass: 1
634  0.0 pass: 1
635  0.0 pass: 1
636  0.0 pass: 1
637  0.0 pass: 1
638  0.0 pass: 1
639  0.0 pass: 1
640  0.0 pass: 1
641  0.0 pass: 1
642  139.0 pass: 1
643  3.0 pass: 1
644  1.0 pass: 1
645  0.0 pass: 1
646  0.0 pass: 1
647  1.0 pass: 1
648  3.0 pass: 1
649  0.0 pass: 1
650  1.0 pass: 1
651  0.0 pass: 1
652  0.0 pass: 1
653  85.0 pass: 1
654  912.0 pass: 1
655  0.0 pass: 1
656  0.0 pass: 1
657  0.0 pass: 1
658  nan pass: 1
659  nan pass: 1
660  71.0 pass: 3
661  124.0 pass: 3
662  260.0 pass: 3
663  315.0 

1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  0.0 pass: 1
1171  0.0 pass: 1
1172  0.0 pass: 1
1173  0.0 pass: 1
1174  0.0 pass: 1
1175  0.0 pass: 1
1176  0.0 pass: 1
1177  0.0 pass: 1
1178  0.0 pass: 1
1179  0.0 pass: 1
1180  0.0 pass: 1
1181  0.0 pass: 1
1182  0.0 pass: 1
1183  0.0 pass: 1
1184  0.0 pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  0.0 pass: 1
1201  0.0 pass: 1
1202  0.0 pass: 1
1203  0.0 pass: 1
1204  0.0 pass: 1
1205  0.0 pass: 1
1206  0.0 pass: 1
1207  0.0 pass: 1
1208  0.0 pass: 1
1209  0.0 pass: 1
1210  0.0 pass: 1
1211  0.0 pass: 1
1212  0.0 pass: 1
1213  0.0 pass: 1
1214  0.0 pass: 1
1215  175.0 pass: 1
1216  53.0 pass: 1
1217  6.0 pass: 1
1218  11.0 pass: 1
1219  45.0 pass: 1
1220  264.0 pass: 1
1221  89.0 pass: 1
1222  3.0 pass: 1
1223  4.0 pass: 1
1224  99.0 pass: 1
1225  10.0 pass: 1
1226  2497.0 pass: 1
1227  2151.0 pass: 1
1228  7408.0 pass: 1
1229  112

1730  0.0 pass: 1
1731  1.0 pass: 1
1732  0.0 pass: 1
1733  1.0 pass: 1
1734  1.0 pass: 1
1735  1.0 pass: 1
1736  1.0 pass: 1
1737  103.0 pass: 1
1738  7.0 pass: 1
1739  19.0 pass: 1
1740  nan pass: 1
1741  0.0 pass: 1
1742  2.0 pass: 1
1743  6.0 pass: 1
1744  0.0 pass: 1
1745  0.0 pass: 1
1746  1.0 pass: 1
1747  0.0 pass: 1
1748  8.0 pass: 1
1749  nan pass: 1
1750  0.0 pass: 1
1751  1.0 pass: 1
1752  nan pass: 1
1753  nan pass: 1
1754  0.0 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  3.0 pass: 1
1771  6.0 pass: 1
1772  2.0 pass: 1
1773  0.0 pass: 1
1774  1.0 pass: 1
1775  0.0 pass: 1
1776  3.0 pass: 1
1777  0.0 pass: 1
1778  2.0 pass: 1
1779  nan pass: 1
1780  35558.0 pass: 1
1781  62233.0 pass: 1
1782  10795.0 pass: 1
1783  9357.0 pass: 1
1784  35256.0 pass: 1
1785  3.0 pass: 1
1786  1.0 pass: 1
1787  11.0 pass: 1
1788  26.0 pass: 1
1789  118712.0 pass: 1
1790  21.0 pass: 1
1791  20.0 pass: 1
1792  143.0 pass: 1
1793  1.0 pas

2212  nan pass: 1
2213  0.0 pass: 1
2214  0.0 pass: 1
2215  7.0 pass: 1
2216  8.0 pass: 1
2217  5.0 pass: 1
2218  4.0 pass: 1
2219  0.0 pass: 1
2220  nan pass: 1
2221  0.0 pass: 1
2222  13.0 pass: 1
2223  5.0 pass: 1
2224  3.0 pass: 1
2225  19.0 pass: 1
2226  18.0 pass: 1
2227  24.0 pass: 1
2228  13.0 pass: 1
2229  25.0 pass: 1
2230  18.0 pass: 1
2231  1.0 pass: 1
2232  5.0 pass: 1
2233  15.0 pass: 1
2234  15.0 pass: 1
2235  1370.0 pass: 1
2236  8749.0 pass: 1
2237  8046.0 pass: 1
2238  4386.0 pass: 1
2239  4321.0 pass: 1
2240  863.0 pass: 1
2241  1129.0 pass: 1
2242  2801.0 pass: 1
2243  7641.0 pass: 1
2244  2981.0 pass: 1
2245  4248.0 pass: 1
2246  4740.0 pass: 1
2247  3903.0 pass: 1
2248  3849.0 pass: 1
2249  2064.0 pass: 1
2250  0.0 pass: 1
2251  0.0 pass: 1
2252  0.0 pass: 1
2253  0.0 pass: 1
2254  0.0 pass: 1
2255  0.0 pass: 1
2256  0.0 pass: 1
2257  0.0 pass: 1
2258  0.0 pass: 1
2259  0.0 pass: 1
2260  0.0 pass: 1
2261  nan pass: 1
2262  0.0 pass: 1
2263  nan pass: 1
2264  0.0 p

2679  nan pass: 1
2680  nan pass: 1
2681  nan pass: 1
2682  nan pass: 1
2683  nan pass: 1
2684  nan pass: 1
2685  154.0 pass: 1
2686  131.0 pass: 1
2687  1204.0 pass: 1
2688  3802.0 pass: 1
2689  302.0 pass: 1
2690  41.0 pass: 1
2691  297.0 pass: 1
2692  267.0 pass: 1
2693  362.0 pass: 1
2694  22.0 pass: 1
2695  26.0 pass: 1
2696  256.0 pass: 1
2697  67.0 pass: 1
2698  nan pass: 1
2699  152.0 pass: 1
2700  1686.0 pass: 1
2701  2107.0 pass: 1
2702  51.0 pass: 1
2703  60.0 pass: 1
2704  79.0 pass: 1
2705  21.0 pass: 1
2706  33.0 pass: 1
2707  44.0 pass: 1
2708  0.0 pass: 1
2709  3.0 pass: 1
2710  35.0 pass: 1
2711  65.0 pass: 1
2712  139.0 pass: 1
2713  309.0 pass: 1
2714  16527.0 pass: 1
2715  2716  2717  2718  2719  2720  2721  2722  2723  2724  2725  2726  2727  2728  2729  2730  2731  2732  2733  2734  2735  2736  2737  2738  2739  2740  2741  2742  2743  2744  2745  2746  2747  2748  2749  2750  2751  2752  2753  2754  2755  2756  2757  2758  2759  2760  2761  2762  2763  2764  2765

3165  3166  3167  3168  3169  3170  3171  3172  3173  3174  3175  3176  3177  3178  3179  3180  3181  3182  3183  3184  3185  3186  3187  3188  3189  3190  3191  3192  3193  3194  3195  3196  3197  3198  3199  3200  3201  3202  3203  3204  3205  3206  3207  3208  3209  3210  815.0 pass: 3
3211  400.0 pass: 3
3212  2177.0 pass: 3
3213  2676.0 pass: 3
3214  510.0 pass: 3
3215  130.0 pass: 3
3216  7.0 pass: 3
3217  13.0 pass: 3
3218  8079.0 pass: 3
3219  6285.0 pass: 3
3220  12708.0 pass: 3
3221  8536.0 pass: 3
3222  890.0 pass: 3
3223  485.0 pass: 3
3224  nan pass: 3
3225  9.0 pass: 1
3226  35.0 pass: 1
3227  896.0 pass: 1
3228  13234.0 pass: 1
3229  15754.0 pass: 1
3230  26.0 pass: 1
3231  140.0 pass: 1
3232  535.0 pass: 1
3233  459.0 pass: 1
3234  45.0 pass: 1
3235  35.0 pass: 1
3236  881.0 pass: 1
3237  25036.0 pass: 1
3238  16997.0 pass: 1
3239  30930.0 pass: 1
3240  0.0 pass: 1
3241  0.0 pass: 1
3242  0.0 pass: 1
3243  0.0 pass: 1
3244  9696.0 pass: 1
3245  853.0 pass: 1
3246  0.0 p

## Income composition of resources

In [44]:
icor = pd.read_csv("Data/New/Income_Composition_Of_Resources/ICOR_Internet.csv")

In [45]:
count = 0
icor_data = pd.DataFrame(columns=['Country', 'Year', 'Income_Composition_Of_Resources'])
for i in range(0, len(icor['Country'].unique())):
    for j in range(1, len(icor.columns)):
        #print(icor.loc[i,'Country'], end='')
        # Space before a word by default in the dataset. Max_Split = 1 
        icor_data.at[count, 'Country'] = icor.loc[i,'Country'].split(' ', 1)[1]
        icor_data.at[count, 'Year'] = icor.columns[j]
        #print(icor.columns[j])
        icor_data.at[count, 'Income_Composition_Of_Resources'] = icor[icor['Country'] == icor['Country'][i]].T[1:].loc[icor.columns[j]].values[0]
        count+=1

In [46]:
icor_data['Year'] = icor_data['Year'].astype(np.int64)
#icor_data['Income_Composition_Of_Resources'] = icor_data['Income_Composition_Of_Resources'].astype(np.float64)

In [47]:
#icor_data.to_pickle("Data/New/Income_Composition_Of_Resources/ICOR_Internet.pkl")

In [48]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(icor_data[icor_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            icor_other_data = icor_data[icor_data['Country'] == main_data['Country'][val]][icor_data['Year'] == main_data['Year'][val]]['Income_Composition_Of_Resources'].values[0]
            print(icor_other_data, "pass: 1")
            main_data.at[val, 'Income_Composition_Of_Resources'] = icor_other_data
        except IndexError:
            pass
    else:
        try:
            icor_other_data = icor_data[icor_data['Country'].str.startswith(main_data['Country'][val])][icor_data['Year'] == main_data['Year'][val]]['Income_Composition_Of_Resources'].values[0]
            print(icor_other_data, "pass: 2")
            main_data.at[val, 'Income_Composition_Of_Resources'] = icor_other_data
        except IndexError:
            try:
                icor_other_data = icor_data[icor_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][icor_data['Year'] == main_data['Year'][val]]['Income_Composition_Of_Resources'].values[0]
                print(icor_other_data, "pass: 3")
                main_data.at[val, 'Income_Composition_Of_Resources'] = icor_other_data
            except IndexError:
                pass
            

0  0.441 pass: 1
1  0.44299999999999995 pass: 1
2  0.442 pass: 1
3  0.426 pass: 1
4  0.42100000000000004 pass: 1
5  0.413 pass: 1
6  0.38799999999999996 pass: 1
7  0.386 pass: 1
8  0.371 pass: 1
9  0.36700000000000005 pass: 1
10  0.35700000000000004 pass: 1
11  0.36200000000000004 pass: 1
12  0.35700000000000004 pass: 1
13  nan pass: 1
14  nan pass: 1
15  0.7070000000000001 pass: 1
16  0.705 pass: 1
17  0.7 pass: 1
18  0.6990000000000001 pass: 1
19  0.693 pass: 1
20  0.6859999999999999 pass: 1
21  0.6829999999999999 pass: 1
22  0.679 pass: 1
23  0.669 pass: 1
24  0.659 pass: 1
25  0.6509999999999999 pass: 1
26  0.642 pass: 1
27  0.633 pass: 1
28  0.627 pass: 1
29  0.614 pass: 1
30  0.737 pass: 1
31  0.7340000000000001 pass: 1
32  0.7340000000000001 pass: 1
33  0.7340000000000001 pass: 1
34  0.7340000000000001 pass: 1
35  0.73 pass: 1
36  0.73 pass: 1
37  0.728 pass: 1
38  0.7190000000000001 pass: 1
39  0.7170000000000001 pass: 1
40  0.713 pass: 1
41  0.71 pass: 1
42  0.701 pass: 1
43  

  """
  if sys.path[0] == '':


48  49  50  51  52  53  54  55  56  57  58  59  60  0.92 pass: 1
61  0.914 pass: 1
62  0.91 pass: 1
63  0.91 pass: 1
64  0.9159999999999999 pass: 1
65  0.924 pass: 1
66  0.9309999999999999 pass: 1
67  0.9470000000000001 pass: 1
68  0.95 pass: 1
69  0.9470000000000001 pass: 1
70  0.9420000000000001 pass: 1
71  0.937 pass: 1
72  0.9259999999999999 pass: 1
73  0.922 pass: 1
74  0.92 pass: 1
75  0.62 pass: 1
76  0.613 pass: 1
77  0.602 pass: 1
78  0.601 pass: 1
79  0.603 pass: 1
80  0.613 pass: 1
81  0.583 pass: 1
82  0.5870000000000001 pass: 1
83  0.5539999999999999 pass: 1
84  0.537 pass: 1
85  0.526 pass: 1
86  0.52 pass: 1
87  0.518 pass: 1
88  0.496 pass: 1
89  0.483 pass: 1
90  0.792 pass: 1
91  0.787 pass: 1
92  0.7859999999999999 pass: 1
93  0.784 pass: 1
94  0.79 pass: 1
95  0.8009999999999999 pass: 1
96  0.8220000000000001 pass: 1
97  0.8240000000000001 pass: 1
98  0.812 pass: 1
99  0.7959999999999999 pass: 1
100  0.79 pass: 1
101  0.7829999999999999 pass: 1
102  0.774 pass: 1
10

505  0.428 pass: 1
506  0.41600000000000004 pass: 1
507  0.406 pass: 1
508  0.4 pass: 1
509  0.39299999999999996 pass: 1
510  0.522 pass: 1
511  0.516 pass: 1
512  0.512 pass: 1
513  0.511 pass: 1
514  0.509 pass: 1
515  0.509 pass: 1
516  0.508 pass: 1
517  0.506 pass: 1
518  0.504 pass: 1
519  0.501 pass: 1
520  0.502 pass: 1
521  0.495 pass: 1
522  0.488 pass: 1
523  0.485 pass: 1
524  0.483 pass: 1
525  0.914 pass: 1
526  0.9109999999999999 pass: 1
527  0.909 pass: 1
528  0.9079999999999999 pass: 1
529  0.905 pass: 1
530  0.902 pass: 1
531  0.909 pass: 1
532  0.909 pass: 1
533  0.907 pass: 1
534  0.904 pass: 1
535  0.9 pass: 1
536  0.897 pass: 1
537  0.8959999999999999 pass: 1
538  0.892 pass: 1
539  0.8909999999999999 pass: 1
540  541  542  543  544  545  546  547  548  549  550  551  552  553  554  555  0.313 pass: 1
556  0.325 pass: 1
557  0.32899999999999996 pass: 1
558  0.331 pass: 1
559  0.271 pass: 1
560  0.26899999999999996 pass: 1
561  0.33899999999999997 pass: 1
562  0.33

975  976  977  978  979  980  981  982  983  984  985  986  987  988  989  990  0.6579999999999999 pass: 1
991  0.6559999999999999 pass: 1
992  0.647 pass: 1
993  0.647 pass: 1
994  0.645 pass: 1
995  0.6459999999999999 pass: 1
996  0.6459999999999999 pass: 1
997  0.6459999999999999 pass: 1
998  0.647 pass: 1
999  0.648 pass: 1
1000  0.662 pass: 1
1001  0.6509999999999999 pass: 1
1002  0.648 pass: 1
1003  0.645 pass: 1
1004  0.635 pass: 1
1005  0.903 pass: 1
1006  0.903 pass: 1
1007  0.9059999999999999 pass: 1
1008  0.9079999999999999 pass: 1
1009  0.907 pass: 1
1010  0.903 pass: 1
1011  0.915 pass: 1
1012  0.915 pass: 1
1013  0.909 pass: 1
1014  0.902 pass: 1
1015  0.899 pass: 1
1016  0.892 pass: 1
1017  0.8909999999999999 pass: 1
1018  0.888 pass: 1
1019  0.883 pass: 1
1020  0.898 pass: 1
1021  0.897 pass: 1
1022  0.897 pass: 1
1023  0.899 pass: 1
1024  0.8959999999999999 pass: 1
1025  0.893 pass: 1
1026  0.899 pass: 1
1027  0.9 pass: 1
1028  0.897 pass: 1
1029  0.894 pass: 1
1030  0

1433  0.8490000000000001 pass: 1
1434  0.843 pass: 1
1435  0.836 pass: 1
1436  0.831 pass: 1
1437  0.833 pass: 1
1438  0.835 pass: 1
1439  0.835 pass: 1
1440  0.88 pass: 1
1441  0.8809999999999999 pass: 1
1442  0.8859999999999999 pass: 1
1443  0.89 pass: 1
1444  0.89 pass: 1
1445  0.888 pass: 1
1446  0.8959999999999999 pass: 1
1447  0.9 pass: 1
1448  0.899 pass: 1
1449  0.8959999999999999 pass: 1
1450  0.895 pass: 1
1451  0.893 pass: 1
1452  0.893 pass: 1
1453  0.893 pass: 1
1454  0.8909999999999999 pass: 1
1455  0.66 pass: 1
1456  0.659 pass: 1
1457  0.66 pass: 1
1458  0.659 pass: 1
1459  0.6559999999999999 pass: 1
1460  0.6559999999999999 pass: 1
1461  0.6659999999999999 pass: 1
1462  0.6659999999999999 pass: 1
1463  0.665 pass: 1
1464  0.66 pass: 1
1465  0.66 pass: 1
1466  0.6579999999999999 pass: 1
1467  0.653 pass: 1
1468  0.6559999999999999 pass: 1
1469  0.6559999999999999 pass: 1
1470  0.9 pass: 1
1471  0.899 pass: 1
1472  0.895 pass: 1
1473  0.892 pass: 1
1474  0.892 pass: 1
14

1834  0.43700000000000006 pass: 1
1835  0.436 pass: 1
1836  0.434 pass: 1
1837  0.43200000000000005 pass: 1
1838  0.43 pass: 1
1839  0.429 pass: 1
1840  0.424 pass: 1
1841  0.42700000000000005 pass: 1
1842  0.414 pass: 1
1843  0.41600000000000004 pass: 1
1844  0.40399999999999997 pass: 1
1845  0.863 pass: 1
1846  0.855 pass: 1
1847  0.851 pass: 1
1848  0.85 pass: 1
1849  0.845 pass: 1
1850  0.838 pass: 1
1851  0.85 pass: 1
1852  0.845 pass: 1
1853  0.8390000000000001 pass: 1
1854  0.8370000000000001 pass: 1
1855  0.8370000000000001 pass: 1
1856  0.8370000000000001 pass: 1
1857  0.836 pass: 1
1858  0.833 pass: 1
1859  0.8290000000000001 pass: 1
1860  0.58 pass: 1
1861  0.574 pass: 1
1862  0.5660000000000001 pass: 1
1863  0.5670000000000001 pass: 1
1864  0.565 pass: 1
1865  0.563 pass: 1
1866  0.5660000000000001 pass: 1
1867  0.5710000000000001 pass: 1
1868  0.5660000000000001 pass: 1
1869  0.5660000000000001 pass: 1
1870  0.56 pass: 1
1871  0.56 pass: 1
1872  0.561 pass: 1
1873  0.561 p

2283  0.512 pass: 1
2284  0.507 pass: 1
2285  0.5 pass: 1
2286  0.49700000000000005 pass: 1
2287  0.499 pass: 1
2288  0.47700000000000004 pass: 1
2289  0.483 pass: 1
2290  0.48200000000000004 pass: 1
2291  0.49700000000000005 pass: 1
2292  0.494 pass: 1
2293  0.494 pass: 1
2294  0.498 pass: 1
2295  0.664 pass: 1
2296  0.657 pass: 1
2297  0.638 pass: 1
2298  0.644 pass: 1
2299  0.637 pass: 1
2300  0.619 pass: 1
2301  0.63 pass: 1
2302  0.621 pass: 1
2303  0.606 pass: 1
2304  0.595 pass: 1
2305  0.593 pass: 1
2306  0.586 pass: 1
2307  0.597 pass: 1
2308  0.597 pass: 1
2309  0.6 pass: 1
2310  0.711 pass: 1
2311  0.7090000000000001 pass: 1
2312  0.7 pass: 1
2313  0.691 pass: 1
2314  0.684 pass: 1
2315  0.6759999999999999 pass: 1
2316  0.675 pass: 1
2317  0.662 pass: 1
2318  0.6509999999999999 pass: 1
2319  0.6459999999999999 pass: 1
2320  0.64 pass: 1
2321  0.638 pass: 1
2322  0.635 pass: 1
2323  0.629 pass: 1
2324  0.63 pass: 1
2325  0.662 pass: 1
2326  0.6559999999999999 pass: 1
2327  0.

2715  2716  2717  2718  2719  2720  2721  2722  2723  2724  2725  2726  2727  2728  2729  2730  2731  2732  2733  2734  2735  2736  2737  2738  2739  2740  2741  2742  2743  2744  2745  2746  2747  2748  2749  2750  2751  2752  2753  2754  2755  2756  2757  2758  2759  2760  2761  2762  2763  2764  2765  2766  2767  2768  2769  2770  2771  2772  2773  2774  2775  0.55 pass: 1
2776  0.503 pass: 1
2777  0.55 pass: 1
2778  0.536 pass: 1
2779  0.519 pass: 1
2780  0.519 pass: 1
2781  0.518 pass: 1
2782  0.511 pass: 1
2783  0.499 pass: 1
2784  0.486 pass: 1
2785  0.478 pass: 1
2786  0.47700000000000004 pass: 1
2787  0.473 pass: 1
2788  0.467 pass: 1
2789  0.462 pass: 1
2790  0.758 pass: 1
2791  0.757 pass: 1
2792  0.752 pass: 1
2793  0.747 pass: 1
2794  0.745 pass: 1
2795  0.743 pass: 1
2796  0.741 pass: 1
2797  0.736 pass: 1
2798  0.726 pass: 1
2799  0.72 pass: 1
2800  0.7140000000000001 pass: 1
2801  0.703 pass: 1
2802  0.696 pass: 1
2803  0.679 pass: 1
2804  0.687 pass: 1
2805  0.92299999

3165  3166  3167  3168  3169  3170  3171  3172  3173  3174  3175  3176  3177  3178  3179  3180  3181  3182  3183  3184  3185  3186  3187  3188  3189  3190  3191  3192  3193  3194  3195  3196  3197  3198  3199  3200  3201  3202  3203  3204  3205  3206  3207  3208  3209  3210  0.539 pass: 3
3211  0.546 pass: 3
3212  0.5429999999999999 pass: 3
3213  0.539 pass: 3
3214  0.5660000000000001 pass: 3
3215  0.561 pass: 3
3216  0.5539999999999999 pass: 3
3217  0.555 pass: 3
3218  0.5529999999999999 pass: 3
3219  0.547 pass: 3
3220  0.5429999999999999 pass: 3
3221  0.5429999999999999 pass: 3
3222  0.544 pass: 3
3223  0.544 pass: 3
3224  0.541 pass: 3
3225  0.54 pass: 1
3226  0.534 pass: 1
3227  0.535 pass: 1
3228  0.523 pass: 1
3229  0.517 pass: 1
3230  0.513 pass: 1
3231  0.495 pass: 1
3232  0.483 pass: 1
3233  0.478 pass: 1
3234  0.473 pass: 1
3235  0.469 pass: 1
3236  0.46799999999999997 pass: 1
3237  0.461 pass: 1
3238  0.45799999999999996 pass: 1
3239  0.45299999999999996 pass: 1
3240  0.428

In [49]:
#icor_data[icor_data['Country'] == "Zambia"]

In [50]:
#main_data[['Country','Year','Income_Composition_Of_Resources']]

## Diptheria

In [51]:
diptheria = pd.read_csv("Data/New/Diptheria/Dip_Internet.csv")

In [52]:
count = 0
diptheria_data = pd.DataFrame(columns=['Country', 'Year', 'Diphtheria'])
for i in range(0, len(diptheria['Country'].unique())):
    for j in range(1, len(diptheria.columns)):
        #print(diptheria.loc[i,'Country'], end='')
        diptheria_data.at[count, 'Country'] = diptheria.loc[i,'Country']
        diptheria_data.at[count, 'Year'] = diptheria.columns[j]
        #print(diptheria.columns[j])
        diptheria_data.at[count, 'Diphtheria'] = diptheria[diptheria['Country'] == diptheria['Country'][i]].T[1:].loc[diptheria.columns[j]].values[0]
        count+=1

In [53]:
diptheria_data['Year'] = diptheria_data['Year'].astype(np.int64)
diptheria_data['Diphtheria'] = diptheria_data['Diphtheria'].astype(np.float64)

In [54]:
diptheria_data.to_pickle("Data/New/Diptheria/Dip_Internet.pkl")

In [55]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(diptheria_data[diptheria_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            diptheria_other_data = diptheria_data[diptheria_data['Country'] == main_data['Country'][val]][diptheria_data['Year'] == main_data['Year'][val]]['Diphtheria'].values[0]
            print(diptheria_other_data, "pass: 1")
            main_data.at[val, 'Diphtheria'] = diptheria_other_data
        except IndexError:
            pass
    else:
        try:
            diptheria_other_data = diptheria_data[diptheria_data['Country'].str.startswith(main_data['Country'][val])][diptheria_data['Year'] == main_data['Year'][val]]['Diphtheria'].values[0]
            print(diptheria_other_data, "pass: 2")
            main_data.at[val, 'Diphtheria'] = diptheria_other_data
        except IndexError:
            try:
                diptheria_other_data = diptheria_data[diptheria_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][diptheria_data['Year'] == main_data['Year'][val]]['Diphtheria'].values[0]
                print(diptheria_other_data, "pass: 3")
                main_data.at[val, 'Diphtheria'] = diptheria_other_data
            except IndexError:
                pass
            

0  62.0 pass: 1
1  64.0 pass: 1
2  67.0 pass: 1
3  68.0 pass: 1
4  66.0 pass: 1
5  63.0 pass: 1
6  64.0 pass: 1
7  63.0 pass: 1
8  58.0 pass: 1
9  58.0 pass: 1
10  50.0 pass: 1
11  41.0 pass: 1
12  36.0 pass: 1
13  33.0 pass: 1
14  24.0 pass: 1
15  98.0 pass: 1
16  99.0 pass: 1
17  99.0 pass: 1
18  99.0 pass: 1
19  99.0 pass: 1
20  98.0 pass: 1
21  99.0 pass: 1
22  98.0 pass: 1
23  97.0 pass: 1
24  98.0 pass: 1
25  97.0 pass: 1
26  97.0 pass: 1
27  98.0 pass: 1
28  97.0 pass: 1
29  97.0 pass: 1
30  95.0 pass: 1
31  95.0 pass: 1
32  95.0 pass: 1
33  95.0 pass: 1
34  95.0 pass: 1
35  95.0 pass: 1
36  93.0 pass: 1
37  95.0 pass: 1
38  95.0 pass: 1
39  88.0 pass: 1
40  86.0 pass: 1
41  87.0 pass: 1
42  86.0 pass: 1
43  89.0 pass: 1
44  86.0 pass: 1
45  46  47  48  49  50  51  

  """
  if sys.path[0] == '':


52  53  54  55  56  57  58  59  60  97.0 pass: 1
61  96.0 pass: 1
62  99.0 pass: 1
63  99.0 pass: 1
64  99.0 pass: 1
65  99.0 pass: 1
66  99.0 pass: 1
67  96.0 pass: 1
68  93.0 pass: 1
69  98.0 pass: 1
70  99.0 pass: 1
71  99.0 pass: 1
72  97.0 pass: 1
73  96.0 pass: 1
74  98.0 pass: 1
75  55.0 pass: 1
76  54.0 pass: 1
77  54.0 pass: 1
78  51.0 pass: 1
79  60.0 pass: 1
80  44.0 pass: 1
81  54.0 pass: 1
82  58.0 pass: 1
83  22.0 pass: 1
84  28.0 pass: 1
85  30.0 pass: 1
86  31.0 pass: 1
87  35.0 pass: 1
88  32.0 pass: 1
89  23.0 pass: 1
90  99.0 pass: 1
91  99.0 pass: 1
92  98.0 pass: 1
93  99.0 pass: 1
94  98.0 pass: 1
95  99.0 pass: 1
96  99.0 pass: 1
97  99.0 pass: 1
98  99.0 pass: 1
99  99.0 pass: 1
100  97.0 pass: 1
101  99.0 pass: 1
102  98.0 pass: 1
103  97.0 pass: 1
104  95.0 pass: 1
105  94.0 pass: 1
106  94.0 pass: 1
107  91.0 pass: 1
108  91.0 pass: 1
109  94.0 pass: 1
110  94.0 pass: 1
111  93.0 pass: 1
112  91.0 pass: 1
113  91.0 pass: 1
114  98.0 pass: 1
115  98.0 pass: 1


602  90.0 pass: 1
603  94.0 pass: 1
604  92.0 pass: 1
605  94.0 pass: 1
606  95.0 pass: 1
607  96.0 pass: 1
608  94.0 pass: 1
609  91.0 pass: 1
610  93.0 pass: 1
611  96.0 pass: 1
612  97.0 pass: 1
613  97.0 pass: 1
614  91.0 pass: 1
615  99.0 pass: 1
616  99.0 pass: 1
617  99.0 pass: 1
618  99.0 pass: 1
619  99.0 pass: 1
620  99.0 pass: 1
621  97.0 pass: 1
622  93.0 pass: 1
623  93.0 pass: 1
624  87.0 pass: 1
625  87.0 pass: 1
626  86.0 pass: 1
627  86.0 pass: 1
628  86.0 pass: 1
629  85.0 pass: 1
630  90.0 pass: 1
631  91.0 pass: 1
632  91.0 pass: 1
633  85.0 pass: 1
634  88.0 pass: 1
635  92.0 pass: 1
636  92.0 pass: 1
637  93.0 pass: 1
638  93.0 pass: 1
639  93.0 pass: 1
640  89.0 pass: 1
641  92.0 pass: 1
642  81.0 pass: 1
643  80.0 pass: 1
644  79.0 pass: 1
645  87.0 pass: 1
646  87.0 pass: 1
647  86.0 pass: 1
648  83.0 pass: 1
649  74.0 pass: 1
650  83.0 pass: 1
651  81.0 pass: 1
652  75.0 pass: 1
653  69.0 pass: 1
654  68.0 pass: 1
655  76.0 pass: 1
656  80.0 pass: 1
657  89.0 

1105  96.0 pass: 1
1106  97.0 pass: 1
1107  93.0 pass: 1
1108  93.0 pass: 1
1109  90.0 pass: 1
1110  98.0 pass: 1
1111  90.0 pass: 1
1112  92.0 pass: 1
1113  91.0 pass: 1
1114  94.0 pass: 1
1115  94.0 pass: 1
1116  93.0 pass: 1
1117  94.0 pass: 1
1118  84.0 pass: 1
1119  84.0 pass: 1
1120  80.0 pass: 1
1121  80.0 pass: 1
1122  78.0 pass: 1
1123  79.0 pass: 1
1124  88.0 pass: 1
1125  1126  1127  1128  1129  1130  1131  1132  1133  1134  1135  1136  1137  1138  1139  1140  99.0 pass: 1
1141  99.0 pass: 1
1142  99.0 pass: 1
1143  99.0 pass: 1
1144  99.0 pass: 1
1145  99.0 pass: 1
1146  99.0 pass: 1
1147  99.0 pass: 1
1148  98.0 pass: 1
1149  96.0 pass: 1
1150  95.0 pass: 1
1151  94.0 pass: 1
1152  92.0 pass: 1
1153  91.0 pass: 1
1154  89.0 pass: 1
1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  97.0 pass: 1
1171  97.0 pass: 1
1172  97.0 pass: 1
1173  95.0 pass: 1
1174  97.0 pass: 1
1175  99.0 pass: 1
1176  99.0 pass: 1
1177  96.0 pass: 1
117

1643  96.0 pass: 1
1644  99.0 pass: 1
1645  99.0 pass: 1
1646  98.0 pass: 1
1647  97.0 pass: 1
1648  97.0 pass: 1
1649  96.0 pass: 1
1650  79.0 pass: 1
1651  84.0 pass: 1
1652  83.0 pass: 1
1653  83.0 pass: 1
1654  82.0 pass: 1
1655  82.0 pass: 1
1656  81.0 pass: 1
1657  80.0 pass: 1
1658  78.0 pass: 1
1659  77.0 pass: 1
1660  75.0 pass: 1
1661  74.0 pass: 1
1662  77.0 pass: 1
1663  80.0 pass: 1
1664  83.0 pass: 1
1665  93.0 pass: 1
1666  93.0 pass: 1
1667  95.0 pass: 1
1668  96.0 pass: 1
1669  93.0 pass: 1
1670  91.0 pass: 1
1671  88.0 pass: 1
1672  88.0 pass: 1
1673  89.0 pass: 1
1674  89.0 pass: 1
1675  90.0 pass: 1
1676  90.0 pass: 1
1677  84.0 pass: 1
1678  78.0 pass: 1
1679  83.0 pass: 1
1680  50.0 pass: 1
1681  76.0 pass: 1
1682  80.0 pass: 1
1683  77.0 pass: 1
1684  70.0 pass: 1
1685  81.0 pass: 1
1686  75.0 pass: 1
1687  65.0 pass: 1
1688  60.0 pass: 1
1689  60.0 pass: 1
1690  31.0 pass: 1
1691  35.0 pass: 1
1692  39.0 pass: 1
1693  42.0 pass: 1
1694  46.0 pass: 1
1695  94.0 p

2121  89.0 pass: 1
2122  88.0 pass: 1
2123  89.0 pass: 1
2124  89.0 pass: 1
2125  89.0 pass: 1
2126  90.0 pass: 1
2127  90.0 pass: 1
2128  90.0 pass: 1
2129  90.0 pass: 1
2130  98.0 pass: 1
2131  98.0 pass: 1
2132  98.0 pass: 1
2133  98.0 pass: 1
2134  98.0 pass: 1
2135  98.0 pass: 1
2136  97.0 pass: 1
2137  93.0 pass: 1
2138  88.0 pass: 1
2139  86.0 pass: 1
2140  79.0 pass: 1
2141  86.0 pass: 1
2142  85.0 pass: 1
2143  87.0 pass: 1
2144  83.0 pass: 1
2145  75.0 pass: 1
2146  70.0 pass: 1
2147  71.0 pass: 1
2148  75.0 pass: 1
2149  70.0 pass: 1
2150  71.0 pass: 1
2151  67.0 pass: 1
2152  57.0 pass: 1
2153  51.0 pass: 1
2154  45.0 pass: 1
2155  43.0 pass: 1
2156  41.0 pass: 1
2157  39.0 pass: 1
2158  36.0 pass: 1
2159  34.0 pass: 1
2160  43.0 pass: 1
2161  43.0 pass: 1
2162  42.0 pass: 1
2163  48.0 pass: 1
2164  54.0 pass: 1
2165  63.0 pass: 1
2166  53.0 pass: 1
2167  42.0 pass: 1
2168  40.0 pass: 1
2169  36.0 pass: 1
2170  33.0 pass: 1
2171  29.0 pass: 1
2172  25.0 pass: 1
2173  27.0 p

2613  96.0 pass: 1
2614  96.0 pass: 1
2615  96.0 pass: 1
2616  97.0 pass: 1
2617  97.0 pass: 1
2618  97.0 pass: 1
2619  95.0 pass: 1
2620  94.0 pass: 1
2621  95.0 pass: 1
2622  93.0 pass: 1
2623  92.0 pass: 1
2624  91.0 pass: 1
2625  77.0 pass: 1
2626  83.0 pass: 1
2627  92.0 pass: 1
2628  91.0 pass: 1
2629  83.0 pass: 1
2630  86.0 pass: 1
2631  85.0 pass: 1
2632  88.0 pass: 1
2633  99.0 pass: 1
2634  89.0 pass: 1
2635  90.0 pass: 1
2636  84.0 pass: 1
2637  78.0 pass: 1
2638  84.0 pass: 1
2639  86.0 pass: 1
2640  42.0 pass: 1
2641  42.0 pass: 1
2642  42.0 pass: 1
2643  41.0 pass: 1
2644  45.0 pass: 1
2645  42.0 pass: 1
2646  31.0 pass: 1
2647  40.0 pass: 1
2648  26.0 pass: 1
2649  35.0 pass: 1
2650  30.0 pass: 1
2651  40.0 pass: 1
2652  40.0 pass: 1
2653  33.0 pass: 1
2654  33.0 pass: 1
2655  77.0 pass: 1
2656  73.0 pass: 1
2657  65.0 pass: 1
2658  69.0 pass: 1
2659  72.0 pass: 1
2660  76.0 pass: 1
2661  79.0 pass: 1
2662  82.0 pass: 1
2663  82.0 pass: 1
2664  79.0 pass: 1
2665  74.0 p

3121  99.0 pass: 1
3122  99.0 pass: 1
3123  99.0 pass: 1
3124  99.0 pass: 1
3125  98.0 pass: 1
3126  98.0 pass: 1
3127  96.0 pass: 1
3128  96.0 pass: 1
3129  99.0 pass: 1
3130  99.0 pass: 1
3131  98.0 pass: 1
3132  99.0 pass: 1
3133  99.0 pass: 1
3134  99.0 pass: 1
3135  86.0 pass: 1
3136  84.0 pass: 1
3137  82.0 pass: 1
3138  79.0 pass: 1
3139  77.0 pass: 1
3140  75.0 pass: 1
3141  73.0 pass: 1
3142  70.0 pass: 1
3143  68.0 pass: 1
3144  68.0 pass: 1
3145  69.0 pass: 1
3146  69.0 pass: 1
3147  70.0 pass: 1
3148  70.0 pass: 1
3149  71.0 pass: 1
3150  78.0 pass: 3
3151  82.0 pass: 3
3152  81.0 pass: 3
3153  78.0 pass: 3
3154  78.0 pass: 3
3155  84.0 pass: 3
3156  50.0 pass: 3
3157  62.0 pass: 3
3158  71.0 pass: 3
3159  87.0 pass: 3
3160  86.0 pass: 3
3161  68.0 pass: 3
3162  65.0 pass: 3
3163  70.0 pass: 3
3164  77.0 pass: 3
3165  3166  3167  3168  3169  3170  3171  3172  3173  3174  3175  3176  3177  3178  3179  3180  3181  3182  3183  3184  3185  3186  3187  3188  3189  3190  3191  31

In [56]:
#main_data[['Country','Year','Diphtheria']]
#main_data.iloc[[3151]]

## Thinness (10-19 Years)

In [57]:
thin_10_19 = pd.read_csv("Data/New/Thinness_10_19/thin_9_10_internet.csv")
thin_10_19

Unnamed: 0.1,Unnamed: 0,2016,2016.1,2016.2,2015,2015.1,2015.2,2014,2014.1,2014.2,...,1978.2,1977,1977.1,1977.2,1976,1976.1,1976.2,1975,1975.1,1975.2
0,Country,Both sexes,Male,Female,Both sexes,Male,Female,Both sexes,Male,Female,...,Female,Both sexes,Male,Female,Both sexes,Male,Female,Both sexes,Male,Female
1,Afghanistan,17.2 [9.1-26.0],23.6 [9.5-39.4],10.5 [4.4-18.8],17.5 [9.5-26.0],23.9 [10.1-39.4],10.7 [4.6-18.8],17.7 [9.8-26.1],24.2 [10.5-39.2],10.9 [4.8-19.0],...,14.5 [4.9-28.2],23.6 [13.0-34.6],32.0 [14.5-48.9],14.6 [4.7-28.7],23.7 [12.8-35.0],32.2 [14.3-49.4],14.7 [4.6-29.4],23.8 [12.8-35.4],32.3 [14.0-49.9],14.8 [4.5-29.9]
2,Albania,1.2 [0.5-2.4],1.2 [0.3-3.1],1.2 [0.3-3.0],1.2 [0.5-2.4],1.2 [0.3-3.0],1.3 [0.4-3.0],1.3 [0.5-2.4],1.3 [0.3-3.0],1.3 [0.4-3.0],...,3.5 [0.5-11.1],3.7 [1.0-8.9],3.7 [0.5-11.3],3.6 [0.4-11.7],3.8 [1.0-9.3],3.8 [0.5-11.8],3.7 [0.4-12.4],3.9 [0.9-9.8],3.9 [0.4-12.4],3.9 [0.4-13.2]
3,Algeria,6.0 [2.4-11.6],7.3 [1.8-16.8],4.7 [1.1-11.9],6.0 [2.4-11.3],7.3 [1.9-16.3],4.5 [1.1-11.3],5.9 [2.5-11.2],7.4 [2.0-16.1],4.4 [1.1-10.8],...,6.4 [1.1-17.3],9.4 [3.4-18.3],12.1 [2.9-26.9],6.5 [1.0-18.0],9.5 [3.3-18.7],12.3 [2.8-27.8],6.7 [0.9-18.8],9.7 [3.3-19.3],12.4 [2.7-28.4],6.8 [0.9-19.4]
4,Andorra,0.8 [0.2-2.2],1.0 [0.1-3.3],0.7 [0.1-2.4],0.8 [0.2-2.1],0.9 [0.1-3.2],0.7 [0.1-2.3],0.8 [0.2-2.0],0.9 [0.1-3.0],0.7 [0.1-2.2],...,0.8 [0.1-3.0],0.9 [0.2-2.5],0.9 [0.1-3.2],0.9 [0.1-3.3],0.9 [0.2-2.7],1.0 [0.1-3.5],0.9 [0.1-3.5],1.0 [0.2-2.9],1.0 [0.1-3.8],0.9 [0.1-3.8]
5,Angola,8.3 [2.7-16.9],11.6 [2.4-27.3],5.0 [0.8-13.5],8.5 [2.9-16.8],11.9 [2.7-27.1],5.1 [0.9-13.4],8.6 [3.1-16.7],12.1 [2.9-27.1],5.2 [1.0-13.1],...,8.0 [1.2-21.0],13.7 [5.2-24.8],19.5 [5.0-38.9],8.1 [1.1-21.5],13.9 [5.1-25.3],19.6 [4.9-39.5],8.2 [1.0-22.3],14.0 [5.0-25.9],19.8 [4.7-40.2],8.3 [1.0-23.0]
6,Antigua and Barbuda,3.3 [1.1-7.3],3.8 [0.6-10.3],2.9 [0.5-8.1],3.3 [1.1-7.0],3.8 [0.7-10.0],2.8 [0.5-7.8],3.3 [1.2-6.8],3.8 [0.8-9.7],2.8 [0.5-7.5],...,3.5 [0.3-11.6],5.0 [1.3-11.7],6.3 [0.9-17.1],3.6 [0.3-12.2],5.1 [1.3-12.2],6.4 [0.9-17.7],3.7 [0.3-12.7],5.2 [1.2-12.7],6.5 [0.8-18.5],3.8 [0.2-13.3]
7,Argentina,1.0 [0.3-2.2],1.0 [0.2-2.9],0.9 [0.2-2.6],1.0 [0.3-2.1],1.0 [0.2-2.8],0.9 [0.2-2.4],1.0 [0.4-2.1],1.0 [0.2-2.8],0.9 [0.2-2.4],...,1.6 [0.2-5.3],1.9 [0.4-5.2],2.2 [0.2-7.7],1.6 [0.2-5.5],2.0 [0.4-5.5],2.3 [0.2-8.2],1.7 [0.2-5.8],2.0 [0.4-5.9],2.3 [0.2-8.7],1.7 [0.1-6.1]
8,Armenia,2.1 [0.7-5.1],2.4 [0.4-7.0],1.8 [0.3-5.1],2.1 [0.7-4.8],2.4 [0.4-6.8],1.8 [0.3-4.7],2.1 [0.7-4.7],2.4 [0.4-6.6],1.7 [0.3-4.4],...,2.3 [0.2-7.2],3.3 [0.8-8.6],4.3 [0.4-13.9],2.4 [0.2-7.9],3.5 [0.8-9.2],4.4 [0.4-14.8],2.5 [0.2-8.5],3.6 [0.8-9.8],4.6 [0.4-15.6],2.6 [0.2-9.2]
9,Australia,0.6 [0.3-1.2],0.9 [0.3-2.0],0.4 [0.1-0.9],0.6 [0.3-1.2],0.9 [0.3-1.9],0.4 [0.1-0.8],0.6 [0.3-1.2],0.9 [0.4-1.9],0.4 [0.1-0.8],...,0.8 [0.2-2.1],1.0 [0.4-2.1],1.2 [0.3-3.0],0.8 [0.2-2.3],1.0 [0.4-2.3],1.2 [0.3-3.1],0.9 [0.2-2.5],1.1 [0.4-2.4],1.2 [0.3-3.4],0.9 [0.2-2.8]


In [58]:
# Rename empty column name
thin_10_19.rename(columns = {thin_10_19.columns[0]: "Country"}, inplace=True)

In [59]:
count = 0
thin_10_19_data = pd.DataFrame(columns=['Country', 'Year', 'Thinness_10-19_years'])
for i in range(1, len(thin_10_19['Country'].unique())):
    j = 1
    while j < len(thin_10_19.columns):
        #print(thin_10_19.loc[i,'Country'], end=' ')
        thin_10_19_data.at[count, 'Country'] = thin_10_19.loc[i,'Country']
        thin_10_19_data.at[count, 'Year'] = thin_10_19.columns[j]
        #print(thin_10_19.columns[j], j)
        thin_10_19_data.at[count, 'Thinness_10-19_years'] = thin_10_19[thin_10_19['Country'] == thin_10_19['Country'][i]].T[1:].loc[thin_10_19.columns[j]].values[0].split(' [')[0]
        count+=1
        j += 3
        

In [60]:
#thin_10_19_data[thin_10_19_data['Country'] == "Uganda"]

In [61]:
thin_10_19_data['Year'] = thin_10_19_data['Year'].astype(np.int64)
#thin_10_19_data['Thinness_10-19_years'] = thin_10_19_data['Thinness_10-19_years'].astype(np.float64)

In [62]:
thin_10_19_data.to_pickle("Data/New/Thinness_10_19/Thinness_10_19.pkl")

In [63]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(thin_10_19_data[thin_10_19_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            thin_10_19_other_data = thin_10_19_data[thin_10_19_data['Country'] == main_data['Country'][val]][thin_10_19_data['Year'] == main_data['Year'][val]]['Thinness_10-19_years'].values[0]
            print(thin_10_19_other_data, "pass: 1")
            main_data.at[val, 'Thinness_10-19_years'] = thin_10_19_other_data
        except IndexError:
            pass
    else:
        try:
            thin_10_19_other_data = thin_10_19_data[thin_10_19_data['Country'].str.startswith(main_data['Country'][val])][thin_10_19_data['Year'] == main_data['Year'][val]]['Thinness_10-19_years'].values[0]
            print(thin_10_19_other_data, "pass: 2")
            main_data.at[val, 'Thinness_10-19_years'] = thin_10_19_other_data
        except IndexError:
            try:
                thin_10_19_other_data = thin_10_19_data[thin_10_19_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][thin_10_19_data['Year'] == main_data['Year'][val]]['Thinness_10-19_years'].values[0]
                print(thin_10_19_other_data, "pass: 3")
                main_data.at[val, 'Thinness_10-19_years'] = thin_10_19_other_data
            except IndexError:
                pass

0  17.7 pass: 1
1  17.9 pass: 1
2  18.2 pass: 1
3  18.4 pass: 1
4  18.6 pass: 1
5  18.8 pass: 1
6  19.0 pass: 1
7  19.2 pass: 1
8  19.3 pass: 1
9  19.5 pass: 1
10  19.7 pass: 1
11  19.9 pass: 1
12  20.1 pass: 1
13  20.3 pass: 1
14  20.5 pass: 1
15  1.3 pass: 1
16  1.3 pass: 1
17  1.4 pass: 1
18  1.4 pass: 1
19  1.5 pass: 1
20  1.6 pass: 1
21  1.6 pass: 1
22  1.7 pass: 1
23  1.8 pass: 1
24  1.8 pass: 1
25  1.9 pass: 1
26  2.0 pass: 1
27  2.1 pass: 1
28  2.1 pass: 1
29  2.2 pass: 1
30  5.9 pass: 1
31  5.9 pass: 1
32  5.9 pass: 1
33  5.9 pass: 1
34  6.0 pass: 1
35  6.0 pass: 1
36  6.0 pass: 1
37  6.1 pass: 1
38  6.1 pass: 1
39  6.2 pass: 1
40  6.3 pass: 1
41  6.3 pass: 1
42  6.4 pass: 1
43  6.5 pass: 1
44  6.6 pass: 1
45  46  47  48  49  50  51  52  53  54  55  

  """
  if sys.path[0] == '':


56  57  58  59  60  0.8 pass: 1
61  0.8 pass: 1
62  0.8 pass: 1
63  0.7 pass: 1
64  0.7 pass: 1
65  0.7 pass: 1
66  0.7 pass: 1
67  0.7 pass: 1
68  0.7 pass: 1
69  0.7 pass: 1
70  0.7 pass: 1
71  0.7 pass: 1
72  0.7 pass: 1
73  0.7 pass: 1
74  0.7 pass: 1
75  8.6 pass: 1
76  8.8 pass: 1
77  8.9 pass: 1
78  9.1 pass: 1
79  9.3 pass: 1
80  9.5 pass: 1
81  9.6 pass: 1
82  9.8 pass: 1
83  10.0 pass: 1
84  10.2 pass: 1
85  10.4 pass: 1
86  10.5 pass: 1
87  10.7 pass: 1
88  10.9 pass: 1
89  11.1 pass: 1
90  3.3 pass: 1
91  3.3 pass: 1
92  3.3 pass: 1
93  3.3 pass: 1
94  3.4 pass: 1
95  3.4 pass: 1
96  3.4 pass: 1
97  3.4 pass: 1
98  3.5 pass: 1
99  3.5 pass: 1
100  3.5 pass: 1
101  3.6 pass: 1
102  3.6 pass: 1
103  3.7 pass: 1
104  3.7 pass: 1
105  1.0 pass: 1
106  1.0 pass: 1
107  1.0 pass: 1
108  1.0 pass: 1
109  1.0 pass: 1
110  1.0 pass: 1
111  1.1 pass: 1
112  1.1 pass: 1
113  1.1 pass: 1
114  1.1 pass: 1
115  1.2 pass: 1
116  1.2 pass: 1
117  1.2 pass: 1
118  1.2 pass: 1
119  1.3 pass:

612  1.0 pass: 1
613  1.1 pass: 1
614  1.1 pass: 1
615  3.8 pass: 1
616  3.9 pass: 1
617  4.1 pass: 1
618  4.2 pass: 1
619  4.4 pass: 1
620  4.5 pass: 1
621  4.7 pass: 1
622  4.8 pass: 1
623  5.0 pass: 1
624  5.1 pass: 1
625  5.3 pass: 1
626  5.5 pass: 1
627  5.7 pass: 1
628  5.9 pass: 1
629  6.0 pass: 1
630  2.1 pass: 1
631  2.1 pass: 1
632  2.2 pass: 1
633  2.2 pass: 1
634  2.2 pass: 1
635  2.3 pass: 1
636  2.3 pass: 1
637  2.3 pass: 1
638  2.4 pass: 1
639  2.4 pass: 1
640  2.5 pass: 1
641  2.5 pass: 1
642  2.5 pass: 1
643  2.6 pass: 1
644  2.6 pass: 1
645  6.8 pass: 1
646  6.9 pass: 1
647  7.0 pass: 1
648  7.1 pass: 1
649  7.2 pass: 1
650  7.2 pass: 1
651  7.3 pass: 1
652  7.4 pass: 1
653  7.5 pass: 1
654  7.5 pass: 1
655  7.6 pass: 1
656  7.7 pass: 1
657  7.8 pass: 1
658  7.9 pass: 1
659  8.0 pass: 1
660  7.7 pass: 3
661  7.9 pass: 3
662  8.0 pass: 3
663  8.1 pass: 3
664  8.3 pass: 3
665  8.4 pass: 3
666  8.5 pass: 3
667  8.7 pass: 3
668  8.8 pass: 3
669  9.0 pass: 3
670  9.1 pass:

1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  3.8 pass: 1
1171  3.8 pass: 1
1172  3.8 pass: 1
1173  3.8 pass: 1
1174  3.8 pass: 1
1175  3.8 pass: 1
1176  3.9 pass: 1
1177  3.9 pass: 1
1178  3.9 pass: 1
1179  4.0 pass: 1
1180  4.0 pass: 1
1181  4.1 pass: 1
1182  4.2 pass: 1
1183  4.3 pass: 1
1184  4.4 pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  1.2 pass: 1
1201  1.2 pass: 1
1202  1.2 pass: 1
1203  1.3 pass: 1
1204  1.3 pass: 1
1205  1.3 pass: 1
1206  1.3 pass: 1
1207  1.4 pass: 1
1208  1.4 pass: 1
1209  1.4 pass: 1
1210  1.4 pass: 1
1211  1.5 pass: 1
1212  1.5 pass: 1
1213  1.6 pass: 1
1214  1.6 pass: 1
1215  7.7 pass: 1
1216  7.8 pass: 1
1217  8.0 pass: 1
1218  8.2 pass: 1
1219  8.4 pass: 1
1220  8.6 pass: 1
1221  8.9 pass: 1
1222  9.1 pass: 1
1223  9.3 pass: 1
1224  9.5 pass: 1
1225  9.7 pass: 1
1226  9.9 pass: 1
1227  10.1 pass: 1
1228  10.3 pass: 1
1229  10.5 pass: 1
1230  7

1742  0.9 pass: 1
1743  0.9 pass: 1
1744  0.9 pass: 1
1745  0.9 pass: 1
1746  0.9 pass: 1
1747  0.9 pass: 1
1748  1.0 pass: 1
1749  1.0 pass: 1
1750  1.0 pass: 1
1751  1.0 pass: 1
1752  1.0 pass: 1
1753  1.0 pass: 1
1754  1.0 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  7.3 pass: 1
1771  7.4 pass: 1
1772  7.5 pass: 1
1773  7.6 pass: 1
1774  7.7 pass: 1
1775  7.8 pass: 1
1776  7.9 pass: 1
1777  8.0 pass: 1
1778  8.1 pass: 1
1779  8.2 pass: 1
1780  8.3 pass: 1
1781  8.5 pass: 1
1782  8.6 pass: 1
1783  8.7 pass: 1
1784  8.8 pass: 1
1785  6.5 pass: 1
1786  6.6 pass: 1
1787  6.7 pass: 1
1788  6.8 pass: 1
1789  6.9 pass: 1
1790  7.0 pass: 1
1791  7.1 pass: 1
1792  7.3 pass: 1
1793  7.4 pass: 1
1794  7.5 pass: 1
1795  7.6 pass: 1
1796  7.7 pass: 1
1797  7.9 pass: 1
1798  8.0 pass: 1
1799  8.1 pass: 1
1800  7.8 pass: 1
1801  7.9 pass: 1
1802  8.0 pass: 1
1803  8.2 pass: 1
1804  8.3 pass: 1
1805  8.5 pass: 1
1806  8.7 pass: 1
1807  8.8 

2312  1.1 pass: 1
2313  1.1 pass: 1
2314  1.2 pass: 1
2315  1.2 pass: 1
2316  1.2 pass: 1
2317  1.2 pass: 1
2318  1.3 pass: 1
2319  1.3 pass: 1
2320  1.3 pass: 1
2321  1.4 pass: 1
2322  1.4 pass: 1
2323  1.4 pass: 1
2324  1.5 pass: 1
2325  10.0 pass: 1
2326  10.0 pass: 1
2327  10.0 pass: 1
2328  10.0 pass: 1
2329  10.0 pass: 1
2330  10.0 pass: 1
2331  10.0 pass: 1
2332  10.0 pass: 1
2333  10.0 pass: 1
2334  10.0 pass: 1
2335  10.0 pass: 1
2336  10.0 pass: 1
2337  10.0 pass: 1
2338  10.0 pass: 1
2339  10.0 pass: 1
2340  2.0 pass: 1
2341  2.0 pass: 1
2342  2.0 pass: 1
2343  2.1 pass: 1
2344  2.1 pass: 1
2345  2.2 pass: 1
2346  2.2 pass: 1
2347  2.3 pass: 1
2348  2.3 pass: 1
2349  2.4 pass: 1
2350  2.4 pass: 1
2351  2.5 pass: 1
2352  2.5 pass: 1
2353  2.5 pass: 1
2354  2.6 pass: 1
2355  0.7 pass: 1
2356  0.7 pass: 1
2357  0.7 pass: 1
2358  0.7 pass: 1
2359  0.7 pass: 1
2360  0.7 pass: 1
2361  0.7 pass: 1
2362  0.7 pass: 1
2363  0.7 pass: 1
2364  0.7 pass: 1
2365  0.7 pass: 1
2366  0.8 pas

2864  4.2 pass: 1
2865  2866  2867  2868  2869  2870  2871  2872  2873  2874  2875  2876  2877  2878  2879  2880  7.9 pass: 1
2881  8.0 pass: 1
2882  8.1 pass: 1
2883  8.2 pass: 1
2884  8.3 pass: 1
2885  8.5 pass: 1
2886  8.6 pass: 1
2887  8.7 pass: 1
2888  8.9 pass: 1
2889  9.0 pass: 1
2890  9.1 pass: 1
2891  9.2 pass: 1
2892  9.3 pass: 1
2893  9.4 pass: 1
2894  9.4 pass: 1
2895  11.1 pass: 1
2896  11.2 pass: 1
2897  11.3 pass: 1
2898  11.5 pass: 1
2899  11.6 pass: 1
2900  11.7 pass: 1
2901  11.8 pass: 1
2902  11.9 pass: 1
2903  12.0 pass: 1
2904  12.0 pass: 1
2905  12.1 pass: 1
2906  12.1 pass: 1
2907  12.1 pass: 1
2908  12.2 pass: 1
2909  12.2 pass: 1
2910  6.8 pass: 1
2911  7.0 pass: 1
2912  7.1 pass: 1
2913  7.3 pass: 1
2914  7.5 pass: 1
2915  7.7 pass: 1
2916  7.9 pass: 1
2917  8.1 pass: 1
2918  8.4 pass: 1
2919  8.6 pass: 1
2920  8.8 pass: 1
2921  9.0 pass: 1
2922  9.2 pass: 1
2923  9.4 pass: 1
2924  9.6 pass: 1
2925  0.1 pass: 1
2926  0.1 pass: 1
2927  0.1 pass: 1
2928  0.1 pas

In [64]:
main_data[['Country','Year','Thinness_10-19_years']].isnull().sum()

Country                   0
Year                      0
Thinness_10-19_years    585
dtype: int64

In [65]:
thin_5_9 = pd.read_csv("Data/New/Thinness_5_9/thin_5_9_internet.csv")

In [66]:
# Rename empty column name
thin_5_9.rename(columns = {thin_5_9.columns[0]: "Country"}, inplace=True)

In [67]:
count = 0
thin_5_9_data = pd.DataFrame(columns=['Country', 'Year', 'Thinness_5-9_years'])
for i in range(1, len(thin_5_9['Country'].unique())):
    j = 1
    while j < len(thin_5_9.columns):
        #print(thin_5_9.loc[i,'Country'], end=' ')
        thin_5_9_data.at[count, 'Country'] = thin_5_9.loc[i,'Country']
        thin_5_9_data.at[count, 'Year'] = thin_5_9.columns[j]
        #print(thin_5_9.columns[j], j)
        thin_5_9_data.at[count, 'Thinness_5-9_years'] = thin_5_9[thin_5_9['Country'] == thin_5_9['Country'][i]].T[1:].loc[thin_5_9.columns[j]].values[0].split(' [')[0]
        count+=1
        j += 3
        

In [68]:
thin_5_9_data['Year'] = thin_5_9_data['Year'].astype(np.int64)
#thin_5_9_data['Thinness_5-9_years'] = thin_5_9_data['Thinness_5-9_years'].astype(np.float64)

In [69]:
thin_5_9_data.to_pickle("Data/New/Thinness_5_9/thin_5_9_internet.pkl")

In [70]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(thin_5_9_data[thin_5_9_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            thin_5_9_other_data = thin_5_9_data[thin_5_9_data['Country'] == main_data['Country'][val]][thin_5_9_data['Year'] == main_data['Year'][val]]['Thinness_5-9_years'].values[0]
            print(thin_5_9_other_data, "pass: 1")
            main_data.at[val, 'Thinness_5-9_years'] = thin_5_9_other_data
        except IndexError:
            pass
    else:
        try:
            thin_5_9_other_data = thin_5_9_data[thin_5_9_data['Country'].str.startswith(main_data['Country'][val])][thin_5_9_data['Year'] == main_data['Year'][val]]['Thinness_5-9_years'].values[0]
            print(thin_5_9_other_data, "pass: 2")
            main_data.at[val, 'Thinness_5-9_years'] = thin_5_9_other_data
        except IndexError:
            try:
                thin_5_9_other_data = thin_5_9_data[thin_5_9_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][thin_5_9_data['Year'] == main_data['Year'][val]]['Thinness_5-9_years'].values[0]
                print(thin_5_9_other_data, "pass: 3")
                main_data.at[val, 'Thinness_5-9_years'] = thin_5_9_other_data
            except IndexError:
                pass

0  17.7 pass: 1
1  18.0 pass: 1
2  18.2 pass: 1
3  18.4 pass: 1
4  18.7 pass: 1
5  18.9 pass: 1
6  19.1 pass: 1
7  19.3 pass: 1
8  19.5 pass: 1
9  19.7 pass: 1
10  19.9 pass: 1
11  20.2 pass: 1
12  20.4 pass: 1
13  20.5 pass: 1
14  20.7 pass: 1
15  1.4 pass: 1
16  1.4 pass: 1
17  1.5 pass: 1
18  1.5 pass: 1
19  1.6 pass: 1
20  1.6 pass: 1
21  1.7 pass: 1
22  1.8 pass: 1
23  1.8 pass: 1
24  1.9 pass: 1
25  2.0 pass: 1
26  2.1 pass: 1
27  2.1 pass: 1
28  2.2 pass: 1
29  2.3 pass: 1
30  5.8 pass: 1
31  5.8 pass: 1
32  5.8 pass: 1
33  5.8 pass: 1
34  5.9 pass: 1
35  5.9 pass: 1
36  5.9 pass: 1
37  6.0 pass: 1
38  6.0 pass: 1
39  6.1 pass: 1
40  6.1 pass: 1
41  6.2 pass: 1
42  6.3 pass: 1
43  6.4 pass: 1
44  6.5 pass: 1
45  46  47  48  49  50  51  52  53  54

  """
  if sys.path[0] == '':


  55  56  57  58  59  60  0.7 pass: 1
61  0.7 pass: 1
62  0.7 pass: 1
63  0.7 pass: 1
64  0.7 pass: 1
65  0.7 pass: 1
66  0.7 pass: 1
67  0.7 pass: 1
68  0.7 pass: 1
69  0.7 pass: 1
70  0.7 pass: 1
71  0.7 pass: 1
72  0.7 pass: 1
73  0.7 pass: 1
74  0.7 pass: 1
75  8.5 pass: 1
76  8.6 pass: 1
77  8.8 pass: 1
78  9.0 pass: 1
79  9.2 pass: 1
80  9.4 pass: 1
81  9.6 pass: 1
82  9.7 pass: 1
83  9.9 pass: 1
84  10.1 pass: 1
85  10.3 pass: 1
86  10.5 pass: 1
87  10.7 pass: 1
88  10.9 pass: 1
89  11.0 pass: 1
90  3.3 pass: 1
91  3.3 pass: 1
92  3.3 pass: 1
93  3.3 pass: 1
94  3.3 pass: 1
95  3.3 pass: 1
96  3.3 pass: 1
97  3.4 pass: 1
98  3.4 pass: 1
99  3.4 pass: 1
100  3.5 pass: 1
101  3.5 pass: 1
102  3.5 pass: 1
103  3.6 pass: 1
104  3.6 pass: 1
105  0.9 pass: 1
106  0.9 pass: 1
107  0.9 pass: 1
108  0.9 pass: 1
109  0.9 pass: 1
110  0.9 pass: 1
111  0.9 pass: 1
112  0.9 pass: 1
113  1.0 pass: 1
114  1.0 pass: 1
115  1.0 pass: 1
116  1.0 pass: 1
117  1.1 pass: 1
118  1.1 pass: 1
119  1.1 

628  5.1 pass: 1
629  5.2 pass: 1
630  1.9 pass: 1
631  1.9 pass: 1
632  2.0 pass: 1
633  2.0 pass: 1
634  2.0 pass: 1
635  2.0 pass: 1
636  2.1 pass: 1
637  2.1 pass: 1
638  2.1 pass: 1
639  2.2 pass: 1
640  2.2 pass: 1
641  2.3 pass: 1
642  2.3 pass: 1
643  2.3 pass: 1
644  2.4 pass: 1
645  6.6 pass: 1
646  6.7 pass: 1
647  6.8 pass: 1
648  6.9 pass: 1
649  7.0 pass: 1
650  7.1 pass: 1
651  7.2 pass: 1
652  7.3 pass: 1
653  7.4 pass: 1
654  7.5 pass: 1
655  7.6 pass: 1
656  7.7 pass: 1
657  7.8 pass: 1
658  7.9 pass: 1
659  8.0 pass: 1
660  7.4 pass: 3
661  7.5 pass: 3
662  7.6 pass: 3
663  7.7 pass: 3
664  7.9 pass: 3
665  8.0 pass: 3
666  8.2 pass: 3
667  8.3 pass: 3
668  8.5 pass: 3
669  8.6 pass: 3
670  8.8 pass: 3
671  8.9 pass: 3
672  9.0 pass: 3
673  9.2 pass: 3
674  9.3 pass: 3
675  7.4 pass: 3
676  7.5 pass: 3
677  7.6 pass: 3
678  7.7 pass: 3
679  7.9 pass: 3
680  8.0 pass: 3
681  8.2 pass: 3
682  8.3 pass: 3
683  8.5 pass: 3
684  8.6 pass: 3
685  8.8 pass: 3
686  8.9 pass:

1205  1.3 pass: 1
1206  1.3 pass: 1
1207  1.4 pass: 1
1208  1.4 pass: 1
1209  1.4 pass: 1
1210  1.4 pass: 1
1211  1.5 pass: 1
1212  1.5 pass: 1
1213  1.6 pass: 1
1214  1.6 pass: 1
1215  7.6 pass: 1
1216  7.8 pass: 1
1217  8.0 pass: 1
1218  8.2 pass: 1
1219  8.4 pass: 1
1220  8.6 pass: 1
1221  8.8 pass: 1
1222  9.1 pass: 1
1223  9.3 pass: 1
1224  9.5 pass: 1
1225  9.7 pass: 1
1226  9.9 pass: 1
1227  10.1 pass: 1
1228  10.3 pass: 1
1229  10.5 pass: 1
1230  7.3 pass: 1
1231  7.5 pass: 1
1232  7.7 pass: 1
1233  7.9 pass: 1
1234  8.1 pass: 1
1235  8.4 pass: 1
1236  8.6 pass: 1
1237  8.8 pass: 1
1238  9.0 pass: 1
1239  9.3 pass: 1
1240  9.5 pass: 1
1241  9.7 pass: 1
1242  10.0 pass: 1
1243  10.2 pass: 1
1244  10.4 pass: 1
1245  5.3 pass: 1
1246  5.3 pass: 1
1247  5.3 pass: 1
1248  5.3 pass: 1
1249  5.4 pass: 1
1250  5.4 pass: 1
1251  5.5 pass: 1
1252  5.5 pass: 1
1253  5.5 pass: 1
1254  5.6 pass: 1
1255  5.6 pass: 1
1256  5.7 pass: 1
1257  5.7 pass: 1
1258  5.8 pass: 1
1259  5.8 pass: 1
1260

1799  8.0 pass: 1
1800  7.6 pass: 1
1801  7.7 pass: 1
1802  7.8 pass: 1
1803  8.0 pass: 1
1804  8.2 pass: 1
1805  8.3 pass: 1
1806  8.5 pass: 1
1807  8.6 pass: 1
1808  8.8 pass: 1
1809  8.9 pass: 1
1810  9.1 pass: 1
1811  9.3 pass: 1
1812  9.4 pass: 1
1813  9.6 pass: 1
1814  9.7 pass: 1
1815  13.8 pass: 1
1816  13.9 pass: 1
1817  14.0 pass: 1
1818  14.1 pass: 1
1819  14.2 pass: 1
1820  14.3 pass: 1
1821  14.4 pass: 1
1822  14.5 pass: 1
1823  14.5 pass: 1
1824  14.6 pass: 1
1825  14.7 pass: 1
1826  14.7 pass: 1
1827  14.8 pass: 1
1828  14.8 pass: 1
1829  14.9 pass: 1
1830  7.9 pass: 1
1831  8.1 pass: 1
1832  8.3 pass: 1
1833  8.5 pass: 1
1834  8.8 pass: 1
1835  9.0 pass: 1
1836  9.3 pass: 1
1837  9.5 pass: 1
1838  9.7 pass: 1
1839  10.0 pass: 1
1840  10.2 pass: 1
1841  10.5 pass: 1
1842  10.7 pass: 1
1843  10.9 pass: 1
1844  11.1 pass: 1
1845  0.7 pass: 1
1846  0.7 pass: 1
1847  0.7 pass: 1
1848  0.7 pass: 1
1849  0.7 pass: 1
1850  0.7 pass: 1
1851  0.7 pass: 1
1852  0.7 pass: 1
1853  0

2357  0.5 pass: 1
2358  0.5 pass: 1
2359  0.5 pass: 1
2360  0.5 pass: 1
2361  0.5 pass: 1
2362  0.5 pass: 1
2363  0.6 pass: 1
2364  0.6 pass: 1
2365  0.6 pass: 1
2366  0.6 pass: 1
2367  0.6 pass: 1
2368  0.6 pass: 1
2369  0.6 pass: 1
2370  2371  2372  2373  2374  2375  2376  2377  2378  2379  2380  2381  2382  2383  2384  2385  4.7 pass: 1
2386  4.7 pass: 1
2387  4.6 pass: 1
2388  4.6 pass: 1
2389  4.6 pass: 1
2390  4.5 pass: 1
2391  4.5 pass: 1
2392  4.5 pass: 1
2393  4.5 pass: 1
2394  4.5 pass: 1
2395  4.5 pass: 1
2396  4.5 pass: 1
2397  4.5 pass: 1
2398  4.5 pass: 1
2399  4.5 pass: 1
2400  2.9 pass: 1
2401  3.0 pass: 1
2402  3.1 pass: 1
2403  3.2 pass: 1
2404  3.3 pass: 1
2405  3.5 pass: 1
2406  3.6 pass: 1
2407  3.7 pass: 1
2408  3.8 pass: 1
2409  3.9 pass: 1
2410  4.0 pass: 1
2411  4.1 pass: 1
2412  4.2 pass: 1
2413  4.3 pass: 1
2414  4.3 pass: 1
2415  2.3 pass: 1
2416  2.4 pass: 1
2417  2.4 pass: 1
2418  2.5 pass: 1
2419  2.5 pass: 1
2420  2.5 pass: 1
2421  2.6 pass: 1
2422  2.7 

2910  6.6 pass: 1
2911  6.8 pass: 1
2912  7.0 pass: 1
2913  7.2 pass: 1
2914  7.4 pass: 1
2915  7.6 pass: 1
2916  7.8 pass: 1
2917  8.0 pass: 1
2918  8.3 pass: 1
2919  8.5 pass: 1
2920  8.7 pass: 1
2921  8.9 pass: 1
2922  9.1 pass: 1
2923  9.3 pass: 1
2924  9.5 pass: 1
2925  0.1 pass: 1
2926  0.1 pass: 1
2927  0.1 pass: 1
2928  0.1 pass: 1
2929  0.1 pass: 1
2930  0.1 pass: 1
2931  0.1 pass: 1
2932  0.1 pass: 1
2933  0.1 pass: 1
2934  0.1 pass: 1
2935  0.1 pass: 1
2936  0.1 pass: 1
2937  0.1 pass: 1
2938  0.1 pass: 1
2939  0.1 pass: 1
2940  6.0 pass: 1
2941  6.1 pass: 1
2942  6.2 pass: 1
2943  6.3 pass: 1
2944  6.4 pass: 1
2945  6.4 pass: 1
2946  6.5 pass: 1
2947  6.6 pass: 1
2948  6.7 pass: 1
2949  6.8 pass: 1
2950  6.9 pass: 1
2951  7.0 pass: 1
2952  7.1 pass: 1
2953  7.2 pass: 1
2954  7.3 pass: 1
2955  6.3 pass: 1
2956  6.3 pass: 1
2957  6.3 pass: 1
2958  6.3 pass: 1
2959  6.3 pass: 1
2960  6.3 pass: 1
2961  6.3 pass: 1
2962  6.3 pass: 1
2963  6.3 pass: 1
2964  6.3 pass: 1
2965  6.3 

In [71]:
main_data[['Country','Year','Thinness_5-9_years']].isnull().sum()

Country                 0
Year                    0
Thinness_5-9_years    585
dtype: int64

## STATUS OF EACH COUNTRY

In [72]:
status_data = pd.read_csv("Data/New/Status/Status_Of_Country.csv")

In [73]:
status_data.rename(columns = {status_data.columns[0]: "ID"}, inplace=True)
status_data.columns

Index(['ID', 'Economy', 'Code', 'Region', 'Income group', 'Lending category',
       'Other'],
      dtype='object')

In [74]:
status_data.head()

Unnamed: 0,ID,Economy,Code,Region,Income group,Lending category,Other
0,1,Afghanistan,AFG,South Asia,Low income,IDA,HIPC
1,2,Albania,ALB,Europe & Central Asia,Upper middle income,IBRD,
2,3,Algeria,DZA,Middle East & North Africa,Upper middle income,IBRD,
3,4,American Samoa,ASM,East Asia & Pacific,Upper middle income,..,
4,5,Andorra,AND,Europe & Central Asia,High income,..,


In [75]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(status_data[status_data['Economy'] == main_data['Country'][val]].values) != 0:
        try:
            status_other_data = status_data[status_data['Economy'] == main_data['Country'][val]]["Income group"].values[0]
            print(status_other_data, "pass: 1")
            main_data.at[val, 'Status'] = status_other_data
        except IndexError:
            pass
    else:
        try:
            status_other_data = status_data[status_data['Economy'].str.startswith(main_data['Country'][val])]["Income group"].values[0]
            print(status_other_data, "pass: 2")
            main_data.at[val, 'Status'] = status_other_data
        except IndexError:
            try:
                status_other_data = status_data[status_data['Economy'].str.startswith(main_data['Country'][val].split(',')[0])]["Income group"].values[0]
                print(status_other_data, "pass: 3")
                main_data.at[val, 'Status'] = status_other_data
            except IndexError:
                pass

0  Low income pass: 1
1  Low income pass: 1
2  Low income pass: 1
3  Low income pass: 1
4  Low income pass: 1
5  Low income pass: 1
6  Low income pass: 1
7  Low income pass: 1
8  Low income pass: 1
9  Low income pass: 1
10  Low income pass: 1
11  Low income pass: 1
12  Low income pass: 1
13  Low income pass: 1
14  Low income pass: 1
15  Upper middle income pass: 1
16  Upper middle income pass: 1
17  Upper middle income pass: 1
18  Upper middle income pass: 1
19  Upper middle income pass: 1
20  Upper middle income pass: 1
21  Upper middle income pass: 1
22  Upper middle income pass: 1
23  Upper middle income pass: 1
24  Upper middle income pass: 1
25  Upper middle income pass: 1
26  Upper middle income pass: 1
27  Upper middle income pass: 1
28  Upper middle income pass: 1
29  Upper middle income pass: 1
30  Upper middle income pass: 1
31  Upper middle income pass: 1
32  Upper middle income pass: 1
33  Upper middle income pass: 1
34  Upper middle income pass: 1
35  Upper middle income p

300  Low income pass: 1
301  Low income pass: 1
302  Low income pass: 1
303  Low income pass: 1
304  Low income pass: 1
305  Low income pass: 1
306  Low income pass: 1
307  Low income pass: 1
308  Low income pass: 1
309  Low income pass: 1
310  Low income pass: 1
311  Low income pass: 1
312  Low income pass: 1
313  Low income pass: 1
314  Low income pass: 1
315  High income pass: 1
316  High income pass: 1
317  High income pass: 1
318  High income pass: 1
319  High income pass: 1
320  High income pass: 1
321  High income pass: 1
322  High income pass: 1
323  High income pass: 1
324  High income pass: 1
325  High income pass: 1
326  High income pass: 1
327  High income pass: 1
328  High income pass: 1
329  High income pass: 1
330  Lower middle income pass: 1
331  Lower middle income pass: 1
332  Lower middle income pass: 1
333  Lower middle income pass: 1
334  Lower middle income pass: 1
335  Lower middle income pass: 1
336  Lower middle income pass: 1
337  Lower middle income pass: 1
3

656  Low income pass: 1
657  Low income pass: 1
658  Low income pass: 1
659  Low income pass: 1
660  Low income pass: 1
661  Low income pass: 1
662  Low income pass: 1
663  Low income pass: 1
664  Low income pass: 1
665  Low income pass: 1
666  Low income pass: 1
667  Low income pass: 1
668  Low income pass: 1
669  Low income pass: 1
670  Low income pass: 1
671  Low income pass: 1
672  Low income pass: 1
673  Low income pass: 1
674  Low income pass: 1
675  Lower middle income pass: 1
676  Lower middle income pass: 1
677  Lower middle income pass: 1
678  Lower middle income pass: 1
679  Lower middle income pass: 1
680  Lower middle income pass: 1
681  Lower middle income pass: 1
682  Lower middle income pass: 1
683  Lower middle income pass: 1
684  Lower middle income pass: 1
685  Lower middle income pass: 1
686  Lower middle income pass: 1
687  Lower middle income pass: 1
688  Lower middle income pass: 1
689  Lower middle income pass: 1
690  Upper middle income pass: 1
691  Upper middl

1071  Low income pass: 1
1072  Low income pass: 1
1073  Low income pass: 1
1074  Low income pass: 1
1075  Low income pass: 1
1076  Low income pass: 1
1077  Low income pass: 1
1078  Low income pass: 1
1079  Low income pass: 1
1080  Lower middle income pass: 1
1081  Lower middle income pass: 1
1082  Lower middle income pass: 1
1083  Lower middle income pass: 1
1084  Lower middle income pass: 1
1085  Lower middle income pass: 1
1086  Lower middle income pass: 1
1087  Lower middle income pass: 1
1088  Lower middle income pass: 1
1089  Lower middle income pass: 1
1090  Lower middle income pass: 1
1091  Lower middle income pass: 1
1092  Lower middle income pass: 1
1093  Lower middle income pass: 1
1094  Lower middle income pass: 1
1095  High income pass: 1
1096  High income pass: 1
1097  High income pass: 1
1098  High income pass: 1
1099  High income pass: 1
1100  High income pass: 1
1101  High income pass: 1
1102  High income pass: 1
1103  High income pass: 1
1104  High income pass: 1
1105 

1423  High income pass: 1
1424  High income pass: 1
1425  High income pass: 1
1426  High income pass: 1
1427  High income pass: 1
1428  High income pass: 1
1429  High income pass: 1
1430  High income pass: 1
1431  High income pass: 1
1432  High income pass: 1
1433  High income pass: 1
1434  High income pass: 1
1435  High income pass: 1
1436  High income pass: 1
1437  High income pass: 1
1438  High income pass: 1
1439  High income pass: 1
1440  High income pass: 1
1441  High income pass: 1
1442  High income pass: 1
1443  High income pass: 1
1444  High income pass: 1
1445  High income pass: 1
1446  High income pass: 1
1447  High income pass: 1
1448  High income pass: 1
1449  High income pass: 1
1450  High income pass: 1
1451  High income pass: 1
1452  High income pass: 1
1453  High income pass: 1
1454  High income pass: 1
1455  Upper middle income pass: 1
1456  Upper middle income pass: 1
1457  Upper middle income pass: 1
1458  Upper middle income pass: 1
1459  Upper middle income pass: 

1749  High income pass: 1
1750  High income pass: 1
1751  High income pass: 1
1752  High income pass: 1
1753  High income pass: 1
1754  High income pass: 1
1755  High income pass: 1
1756  High income pass: 1
1757  High income pass: 1
1758  High income pass: 1
1759  High income pass: 1
1760  High income pass: 1
1761  High income pass: 1
1762  High income pass: 1
1763  High income pass: 1
1764  High income pass: 1
1765  High income pass: 1
1766  High income pass: 1
1767  High income pass: 1
1768  High income pass: 1
1769  High income pass: 1
1770  Low income pass: 1
1771  Low income pass: 1
1772  Low income pass: 1
1773  Low income pass: 1
1774  Low income pass: 1
1775  Low income pass: 1
1776  Low income pass: 1
1777  Low income pass: 1
1778  Low income pass: 1
1779  Low income pass: 1
1780  Low income pass: 1
1781  Low income pass: 1
1782  Low income pass: 1
1783  Low income pass: 1
1784  Low income pass: 1
1785  Low income pass: 1
1786  Low income pass: 1
1787  Low income pass: 1
1788

2145  Low income pass: 1
2146  Low income pass: 1
2147  Low income pass: 1
2148  Low income pass: 1
2149  Low income pass: 1
2150  Low income pass: 1
2151  Low income pass: 1
2152  Low income pass: 1
2153  Low income pass: 1
2154  Low income pass: 1
2155  Low income pass: 1
2156  Low income pass: 1
2157  Low income pass: 1
2158  Low income pass: 1
2159  Low income pass: 1
2160  Lower middle income pass: 1
2161  Lower middle income pass: 1
2162  Lower middle income pass: 1
2163  Lower middle income pass: 1
2164  Lower middle income pass: 1
2165  Lower middle income pass: 1
2166  Lower middle income pass: 1
2167  Lower middle income pass: 1
2168  Lower middle income pass: 1
2169  Lower middle income pass: 1
2170  Lower middle income pass: 1
2171  Lower middle income pass: 1
2172  Lower middle income pass: 1
2173  Lower middle income pass: 1
2174  Lower middle income pass: 1
2175  2176  2177  2178  2179  2180  2181  2182  2183  2184  2185  2186  2187  2188  2189  2190  High income pass: 1

2462  High income pass: 1
2463  High income pass: 1
2464  High income pass: 1
2465  High income pass: 1
2466  High income pass: 1
2467  High income pass: 1
2468  High income pass: 1
2469  High income pass: 1
2470  High income pass: 1
2471  High income pass: 1
2472  High income pass: 1
2473  High income pass: 1
2474  High income pass: 1
2475  2476  2477  2478  2479  2480  2481  2482  2483  2484  2485  2486  2487  2488  2489  2490  High income pass: 1
2491  High income pass: 1
2492  High income pass: 1
2493  High income pass: 1
2494  High income pass: 1
2495  High income pass: 1
2496  High income pass: 1
2497  High income pass: 1
2498  High income pass: 1
2499  High income pass: 1
2500  High income pass: 1
2501  High income pass: 1
2502  High income pass: 1
2503  High income pass: 1
2504  High income pass: 1
2505  Low income pass: 1
2506  Low income pass: 1
2507  Low income pass: 1
2508  Low income pass: 1
2509  Low income pass: 1
2510  Low income pass: 1
2511  Low income pass: 1
2512  L

2823  High income pass: 1
2824  High income pass: 1
2825  High income pass: 1
2826  High income pass: 1
2827  High income pass: 1
2828  High income pass: 1
2829  High income pass: 1
2830  High income pass: 1
2831  High income pass: 1
2832  High income pass: 1
2833  High income pass: 1
2834  High income pass: 1
2835  Low income pass: 1
2836  Low income pass: 1
2837  Low income pass: 1
2838  Low income pass: 1
2839  Low income pass: 1
2840  Low income pass: 1
2841  Low income pass: 1
2842  Low income pass: 1
2843  Low income pass: 1
2844  Low income pass: 1
2845  Low income pass: 1
2846  Low income pass: 1
2847  Low income pass: 1
2848  Low income pass: 1
2849  Low income pass: 1
2850  Low income pass: 1
2851  Low income pass: 1
2852  Low income pass: 1
2853  Low income pass: 1
2854  Low income pass: 1
2855  Low income pass: 1
2856  Low income pass: 1
2857  Low income pass: 1
2858  Low income pass: 1
2859  Low income pass: 1
2860  Low income pass: 1
2861  Low income pass: 1
2862  Low inc

3177  Lower middle income pass: 1
3178  Lower middle income pass: 1
3179  Lower middle income pass: 1
3180  High income pass: 1
3181  High income pass: 1
3182  High income pass: 1
3183  High income pass: 1
3184  High income pass: 1
3185  High income pass: 1
3186  High income pass: 1
3187  High income pass: 1
3188  High income pass: 1
3189  High income pass: 1
3190  High income pass: 1
3191  High income pass: 1
3192  High income pass: 1
3193  High income pass: 1
3194  High income pass: 1
3195  Lower middle income pass: 1
3196  Lower middle income pass: 1
3197  Lower middle income pass: 1
3198  Lower middle income pass: 1
3199  Lower middle income pass: 1
3200  Lower middle income pass: 1
3201  Lower middle income pass: 1
3202  Lower middle income pass: 1
3203  Lower middle income pass: 1
3204  Lower middle income pass: 1
3205  Lower middle income pass: 1
3206  Lower middle income pass: 1
3207  Lower middle income pass: 1
3208  Lower middle income pass: 1
3209  Lower middle income pass: 

In [76]:
#main_data.sample(10)

## POLIO

In [77]:
polio = pd.read_csv("Data/New/Polio/Polio_Internet.csv")

In [78]:
polio.head()

Unnamed: 0,Country,2017,2016,2015,2014,2013,2012,2011,2010,2009,...,1989,1988,1987,1986,1985,1984,1983,1982,1981,1980
0,Afghanistan,60,60,60,58,62,67,68,66,63,...,33.0,35.0,25.0,11.0,15.0,16.0,5.0,5.0,3.0,
1,Albania,99,98,99,98,99,99,99,99,98,...,96.0,96.0,94.0,94.0,94.0,92.0,92.0,92.0,92.0,92.0
2,Algeria,91,91,95,95,95,95,95,95,94,...,87.0,85.0,79.0,72.0,69.0,30.0,30.0,31.0,31.0,
3,Andorra,99,98,97,97,96,99,99,99,99,...,,,,,,,,,,
4,Angola,47,53,57,55,48,58,57,66,49,...,19.0,13.0,16.0,15.0,13.0,,,,,


In [79]:
count = 0
polio_data = pd.DataFrame(columns=['Country', 'Year', 'Polio'])
for i in range(0, len(polio['Country'].unique())):
    for j in range(1, len(polio.columns)):
        #print(polio.loc[i,'Country'], end='')
        polio_data.at[count, 'Country'] = polio.loc[i,'Country']
        polio_data.at[count, 'Year'] = polio.columns[j]
       # print(polio.columns[j])
        polio_data.at[count, 'Polio'] = polio[polio['Country'] == polio['Country'][i]].T[1:].loc[polio.columns[j]].values[0]
        count+=1

In [80]:
polio_data['Year'] = polio_data['Year'].astype(np.int64)
polio_data.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 7372 entries, 0 to 7371
Data columns (total 3 columns):
Country    7372 non-null object
Year       7372 non-null int64
Polio      6760 non-null object
dtypes: int64(1), object(2)
memory usage: 550.4+ KB


In [81]:
polio_data.to_pickle("Data/New/Polio/Polio_Internet.pkl")

In [82]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(polio_data[polio_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            polio_other_data = polio_data[polio_data['Country'] == main_data['Country'][val]][polio_data['Year'] == main_data['Year'][val]]['Polio'].values[0]
            if regex_double_nums.match(str(polio_other_data)):
                polio_other_data = polio_other_data.split(' ')[0]
                print('Regex Matched', end=' ')
            print(polio_other_data, "pass: 1")
            main_data.at[val, 'Polio'] = polio_other_data
        except IndexError:
            pass
    else:
        try:
            polio_other_data = polio_data[polio_data['Country'].str.startswith(main_data['Country'][val])][polio_data['Year'] == main_data['Year'][val]]['Polio'].values[0]
            if regex_double_nums.match(str(polio_other_data)):
                polio_other_data = polio_other_data.split(' ')[0]
                print('Regex Matched', end=' ')
            print(polio_other_data, "pass: 2")
            main_data.at[val, 'Polio'] = polio_other_data
        except IndexError:
            try:
                polio_other_data = polio_data[polio_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][polio_data['Year'] == main_data['Year'][val]]['Polio'].values[0]
                if regex_double_nums.match(str(polio_other_data)):
                    polio_other_data = polio_other_data.split(' ')[0]
                    print('Regex Matched', end=' ')
                print(polio_other_data, "pass: 3")
                main_data.at[val, 'Polio'] = polio_other_data
            except IndexError:
                pass
         

0  58 pass: 1
1  62 pass: 1
2  67 pass: 1
3  68 pass: 1
4  66 pass: 1
5  63 pass: 1
6  64 pass: 1
7  63 pass: 1
8  58 pass: 1
9  58 pass: 1
10  50 pass: 1
11  41 pass: 1
12  36 pass: 1
13  35 pass: 1
14  24 pass: 1
15  98 pass: 1
16  99 pass: 1
17  99 pass: 1
18  99 pass: 1
19  99 pass: 1
20  98 pass: 1
21  99 pass: 1
22  99 pass: 1
23  97 pass: 1
24  97 pass: 1
25  98 pass: 1
26  97 pass: 1
27  98 pass: 1
28  97 pass: 1
29  97 pass: 1
30  95 pass: 1
31  95 pass: 1
32  95 pass: 1
33  95 pass: 1
34  95 pass: 1
35  94 pass: 1
36  92 pass: 1
37  95 pass: 1
38  95 pass: 1
39  88 pass: 1
40  86 pass: 1
41  87 pass: 1
42  86 pass: 1
43  89 pass: 1
44  86 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  

  """
  from ipykernel import kernelapp as app


57  58  59  60  97 pass: 1
61  96 pass: 1
62  99 pass: 1
63  99 pass: 1
64  99 pass: 1
65  99 pass: 1
66  99 pass: 1
67  96 pass: 1
68  93 pass: 1
69  98 pass: 1
70  99 pass: 1
71  99 pass: 1
72  95 pass: 1
73  95 pass: 1
74  95 pass: 1
75  55 pass: 1
76  48 pass: 1
77  58 pass: 1
78  57 pass: 1
79  66 pass: 1
80  49 pass: 1
81  53 pass: 1
82  63 pass: 1
83  26 pass: 1
84  30 pass: 1
85  32 pass: 1
86  33 pass: 1
87  32 pass: 1
88  36 pass: 1
89  27 pass: 1
90  96 pass: 1
91  98 pass: 1
92  97 pass: 1
93  99 pass: 1
94  99 pass: 1
95  98 pass: 1
96  99 pass: 1
97  98 pass: 1
98  99 pass: 1
99  98 pass: 1
100  97 pass: 1
101  99 pass: 1
102  93 pass: 1
103  99 pass: 1
104  96 pass: 1
105  92 pass: 1
106  90 pass: 1
107  90 pass: 1
108  93 pass: 1
109  95 pass: 1
110  97 pass: 1
111  94 pass: 1
112  92 pass: 1
113  92 pass: 1
114  95 pass: 1
115  91 pass: 1
116  95 pass: 1
117  94 pass: 1
118  85 pass: 1
119  88 pass: 1
120  95 pass: 1
121  96 pass: 1
122  96 pass: 1
123  96 pass: 1
124 

673  32 pass: 3
674  31 pass: 3
675  90 pass: 3
676  85 pass: 3
677  68 pass: 3
678  72 pass: 3
679  72 pass: 3
680  76 pass: 3
681  77 pass: 3
682  71 pass: 3
683  73 pass: 3
684  62 pass: 3
685  67 pass: 3
686  50 pass: 3
687  41 pass: 3
688  32 pass: 3
689  31 pass: 3
690  91 pass: 1
691  95 pass: 1
692  90 pass: 1
693  82 pass: 1
694  93 pass: 1
695  80 pass: 1
696  89 pass: 1
697  89 pass: 1
698  89 pass: 1
699  91 pass: 1
700  90 pass: 1
701  88 pass: 1
702  94 pass: 1
703  92 pass: 1
704  80 pass: 1
705  706  707  708  709  710  711  712  713  714  715  716  717  718  719  720  95 pass: 1
721  96 pass: 1
722  96 pass: 1
723  96 pass: 1
724  97 pass: 1
725  96 pass: 1
726  96 pass: 1
727  96 pass: 1
728  96 pass: 1
729  96 pass: 1
730  96 pass: 1
731  95 pass: 1
732  95 pass: 1
733  94 pass: 1
734  94 pass: 1
735  99 pass: 1
736  99 pass: 1
737  98 pass: 1
738  99 pass: 1
739  99 pass: 1
740  99 pass: 1
741  99 pass: 1
742  99 pass: 1
743  99 pass: 1
744  99 pass: 1
745  98 pass:

1290  1291  1292  1293  1294  1295  1296  1297  1298  1299  1300  1301  1302  1303  1304  1305  99 pass: 1
1306  99 pass: 1
1307  99 pass: 1
1308  99 pass: 1
1309  99 pass: 1
1310  99 pass: 1
1311  99 pass: 1
1312  99 pass: 1
1313  99 pass: 1
1314  99 pass: 1
1315  99 pass: 1
1316  99 pass: 1
1317  98 pass: 1
1318  99 pass: 1
1319  99 pass: 1
1320  90 pass: 1
1321  91 pass: 1
1322  89 pass: 1
1323  95 pass: 1
1324  96 pass: 1
1325  96 pass: 1
1326  98 pass: 1
1327  97 pass: 1
1328  97 pass: 1
1329  95 pass: 1
1330  99 pass: 1
1331  97 pass: 1
1332  95 pass: 1
1333  92 pass: 1
1334  98 pass: 1
1335  84 pass: 1
1336  82 pass: 1
1337  79 pass: 1
1338  79 pass: 1
1339  76 pass: 1
1340  73 pass: 1
1341  69 pass: 1
1342  67 pass: 1
1343  66 pass: 1
1344  65 pass: 1
1345  58 pass: 1
1346  57 pass: 1
1347  58 pass: 1
1348  58 pass: 1
1349  57 pass: 1
1350  80 pass: 1
1351  86 pass: 1
1352  84 pass: 1
1353  81 pass: 1
1354  82 pass: 1
1355  85 pass: 1
1356  83 pass: 1
1357  77 pass: 1
1358  78 

1860  77 pass: 1
1861  79 pass: 1
1862  80 pass: 1
1863  88 pass: 1
1864  95 pass: 1
1865  99 pass: 1
1866  96 pass: 1
1867  91 pass: 1
1868  95 pass: 1
1869  88 pass: 1
1870  68 pass: 1
1871  80 pass: 1
1872  80 pass: 1
1873  56 pass: 1
1874  36 pass: 1
1875  81 pass: 1
1876  80 pass: 1
1877  80 pass: 1
1878  73 pass: 1
1879  52 pass: 1
1880  63 pass: 1
1881  73 pass: 1
1882  75 pass: 1
1883  68 pass: 1
1884  71 pass: 1
1885  68 pass: 1
1886  75 pass: 1
1887  91 pass: 1
1888  75 pass: 1
1889  58 pass: 1
1890  98 pass: 1
1891  98 pass: 1
1892  98 pass: 1
1893  98 pass: 1
1894  99 pass: 1
1895  99 pass: 1
1896  99 pass: 1
1897  96 pass: 1
1898  98 pass: 1
1899  97 pass: 1
1900  98 pass: 1
1901  99 pass: 1
1902  88 pass: 1
1903  93 pass: 1
1904  88 pass: 1
1905  87 pass: 1
1906  83 pass: 1
1907  99 pass: 1
1908  97 pass: 1
1909  95 pass: 1
1910  95 pass: 1
1911  96 pass: 1
1912  98 pass: 1
1913  98 pass: 1
1914  98 pass: 1
1915  98 pass: 1
1916  98 pass: 1
1917  98 pass: 1
1918  97 pass:

2387  93 pass: 1
2388  92 pass: 1
2389  98 pass: 1
2390  98 pass: 1
2391  98 pass: 1
2392  97 pass: 1
2393  95 pass: 1
2394  98 pass: 1
2395  95 pass: 1
2396  93 pass: 1
2397  96 pass: 1
2398  93 pass: 1
2399  91 pass: 1
2400  94 pass: 1
2401  88 pass: 1
2402  92 pass: 1
2403  89 pass: 1
2404  94 pass: 1
2405  95 pass: 1
2406  95 pass: 1
2407  96 pass: 1
2408  97 pass: 1
2409  97 pass: 1
2410  97 pass: 1
2411  97 pass: 1
2412  98 pass: 1
2413  99 pass: 1
2414  99 pass: 1
2415  97 pass: 1
2416  98 pass: 1
2417  98 pass: 1
2418  97 pass: 1
2419  98 pass: 1
2420  98 pass: 1
2421  98 pass: 1
2422  98 pass: 1
2423  98 pass: 1
2424  98 pass: 1
2425  98 pass: 1
2426  97 pass: 1
2427  97 pass: 1
2428  97 pass: 1
2429  97 pass: 1
2430  98 pass: 1
2431  98 pass: 1
2432  98 pass: 1
2433  93 pass: 1
2434  93 pass: 1
2435  93 pass: 1
2436  97 pass: 1
2437  98 pass: 1
2438  99 pass: 1
2439  95 pass: 1
2440  89 pass: 1
2441  96 pass: 1
2442  85 pass: 1
2443  76 pass: 1
2444  90 pass: 1
2445  Regex Ma

2929  Regex Matched 84 pass: 1
2930  Regex Matched 86 pass: 1
2931  Regex Matched 88 pass: 1
2932  Regex Matched 88 pass: 1
2933  Regex Matched 89 pass: 1
2934  Regex Matched 90 pass: 1
2935  Regex Matched 91 pass: 1
2936  Regex Matched 91 pass: 1
2937  Regex Matched 85 pass: 1
2938  Regex Matched 91 pass: 1
2939  Regex Matched 91 pass: 1
2940  94 pass: 1
2941  94 pass: 1
2942  91 pass: 1
2943  91 pass: 1
2944  91 pass: 1
2945  90 pass: 1
2946  91 pass: 1
2947  90 pass: 1
2948  89 pass: 1
2949  95 pass: 1
2950  94 pass: 1
2951  91 pass: 1
2952  96 pass: 1
2953  91 pass: 1
2954  90 pass: 1
2955  98 pass: 1
2956  98 pass: 1
2957  97 pass: 1
2958  98 pass: 1
2959  98 pass: 1
2960  99 pass: 1
2961  99 pass: 1
2962  98 pass: 1
2963  99 pass: 1
2964  98 pass: 1
2965  97 pass: 1
2966  95 pass: 1
2967  96 pass: 1
2968  98 pass: 1
2969  97 pass: 1
2970  96 pass: 1
2971  98 pass: 1
2972  97 pass: 1
2973  97 pass: 1
2974  97 pass: 1
2975  96 pass: 1
2976  96 pass: 1
2977  96 pass: 1
2978  90 pass

In [83]:
#main_data.iloc[[2925]]

## Under Five Deaths

In [84]:
under_5_data = pd.read_csv("Data/New/Under_5_Deaths/Under_5_Internet.csv")

In [85]:
under_5_data.rename(columns = {under_5_data.columns[2]: "Under-Five_Deaths"}, inplace=True)
under_5_data.columns

Index(['Country', 'Year', 'Under-Five_Deaths'], dtype='object')

In [86]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(under_5_data[under_5_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            under_5_other_data = under_5_data[under_5_data['Country'] == main_data['Country'][val]][under_5_data['Year'] == main_data['Year'][val]]['Under-Five_Deaths'].values[0]
            if (under_5_other_data == "&lt;1"):
                random.seed(val)
                under_5_other_data = random.uniform(0, 1)
            print(under_5_other_data, "pass: 1")
            main_data.at[val, 'Under-Five_Deaths'] = under_5_other_data
        except IndexError:
            pass
    else:
        try:
            under_5_other_data = under_5_data[under_5_data['Country'].str.startswith(main_data['Country'][val])][under_5_data['Year'] == main_data['Year'][val]]['Under-Five_Deaths'].values[0]
            if (under_5_other_data == "&lt;1"):
                random.seed(val)
                under_5_other_data = random.uniform(0, 1)
            print(under_5_other_data, "pass: 2")
            main_data.at[val, 'Under-Five_Deaths'] = under_5_other_data
        except IndexError:
            try:
                under_5_other_data = under_5_data[under_5_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][under_5_data['Year'] == main_data['Year'][val]]['Under-Five_Deaths'].values[0]
                if (under_5_other_data == "&lt;1"):
                    random.seed(val)
                    under_5_other_data = random.uniform(0, 1)
                print(under_5_other_data, "pass: 3")
                main_data.at[val, 'Under-Five_Deaths'] = under_5_other_data
            except IndexError:
                pass
         

0  86 pass: 1
1  89 pass: 1
2  93 pass: 1
3  97 pass: 1
4  101 pass: 1
5  106 pass: 1
6  109 pass: 1
7  113 pass: 1
8  116 pass: 1
9  118 pass: 1
10  120 pass: 1
11  121 pass: 1
12  122 pass: 1
13  122 pass: 1
14  121 pass: 1
15  0.965242141552123 pass: 1
16  0.36152277491407514 pass: 1
17  0.5219839097124932 pass: 1
18  0.18126486333322134 pass: 1
19  0.6771258268002703 pass: 1
20  0.9056396761745207 pass: 1
21  1 pass: 1
22  1 pass: 1
23  1 pass: 1
24  1 pass: 1
25  1 pass: 1
26  1 pass: 1
27  1 pass: 1
28  1 pass: 1
29  1 pass: 1
30  24 pass: 1
31  24 pass: 1
32  24 pass: 1
33  24 pass: 1
34  24 pass: 1
35  23 pass: 1
36  23 pass: 1
37  23 pass: 1
38  23 pass: 1
39  22 pass: 1
40  22 pass: 1
41  23 pass: 1
42  23 pass: 1
43  24 pass: 1
44  25 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  0.3078067547337774 pass: 1
61  0.4944874359794347 pass: 1
62  0.9279915658776743 pass: 1
63  0.4451392251568228 pass: 1
64  0.47615826222934565 pass: 1
65  0.41474399930867

  """
  from ipykernel import kernelapp as app


104 pass: 1
76  108 pass: 1
77  112 pass: 1
78  117 pass: 1
79  123 pass: 1
80  128 pass: 1
81  134 pass: 1
82  139 pass: 1
83  144 pass: 1
84  148 pass: 1
85  152 pass: 1
86  155 pass: 1
87  157 pass: 1
88  158 pass: 1
89  159 pass: 1
90  0.20367044742105156 pass: 1
91  0.08352052115358566 pass: 1
92  0.4210446142866463 pass: 1
93  0.9123433593597492 pass: 1
94  0.5468015535366331 pass: 1
95  0.7601614783097744 pass: 1
96  0.37059431012468647 pass: 1
97  0.19453724793318106 pass: 1
98  0.35639820676272216 pass: 1
99  0.40397807494366633 pass: 1
100  0.1456692551041303 pass: 1
101  0.5811521325045647 pass: 1
102  0.1481712063870836 pass: 1
103  0.9790501200727744 pass: 1
104  0.9599609301949554 pass: 1
105  9 pass: 1
106  10 pass: 1
107  10 pass: 1
108  10 pass: 1
109  11 pass: 1
110  11 pass: 1
111  11 pass: 1
112  12 pass: 1
113  12 pass: 1
114  12 pass: 1
115  12 pass: 1
116  13 pass: 1
117  13 pass: 1
118  14 pass: 1
119  14 pass: 1
120  1 pass: 1
121  1 pass: 1
122  1 pass: 1
123 

540  541  542  543  544  545  546  547  548  549  550  551  552  553  554  555  26 pass: 1
556  26 pass: 1
557  26 pass: 1
558  25 pass: 1
559  22 pass: 1
560  23 pass: 1
561  24 pass: 1
562  24 pass: 1
563  25 pass: 1
564  25 pass: 1
565  26 pass: 1
566  26 pass: 1
567  26 pass: 1
568  26 pass: 1
569  26 pass: 1
570  78 pass: 1
571  79 pass: 1
572  79 pass: 1
573  79 pass: 1
574  80 pass: 1
575  80 pass: 1
576  80 pass: 1
577  80 pass: 1
578  80 pass: 1
579  80 pass: 1
580  79 pass: 1
581  78 pass: 1
582  77 pass: 1
583  76 pass: 1
584  75 pass: 1
585  586  587  588  589  590  591  592  593  594  595  596  597  598  599  600  2 pass: 1
601  2 pass: 1
602  2 pass: 1
603  2 pass: 1
604  2 pass: 1
605  2 pass: 1
606  2 pass: 1
607  2 pass: 1
608  2 pass: 1
609  2 pass: 1
610  2 pass: 1
611  2 pass: 1
612  3 pass: 1
613  3 pass: 1
614  3 pass: 1
615  200 pass: 1
616  216 pass: 1
617  233 pass: 1
618  251 pass: 1
619  269 pass: 1
620  288 pass: 1
621  309 pass: 1
622  333 pass: 1
623  360 

1056  3 pass: 1
1057  3 pass: 1
1058  3 pass: 1
1059  3 pass: 1
1060  3 pass: 1
1061  3 pass: 1
1062  3 pass: 1
1063  3 pass: 1
1064  3 pass: 1
1065  5 pass: 3
1066  5 pass: 3
1067  5 pass: 3
1068  5 pass: 3
1069  6 pass: 3
1070  6 pass: 3
1071  6 pass: 3
1072  6 pass: 3
1073  6 pass: 3
1074  6 pass: 3
1075  6 pass: 3
1076  6 pass: 3
1077  6 pass: 3
1078  6 pass: 3
1079  6 pass: 3
1080  1 pass: 1
1081  1 pass: 1
1082  1 pass: 1
1083  1 pass: 1
1084  1 pass: 1
1085  1 pass: 1
1086  1 pass: 1
1087  1 pass: 1
1088  1 pass: 1
1089  1 pass: 1
1090  1 pass: 1
1091  2 pass: 1
1092  2 pass: 1
1093  2 pass: 1
1094  2 pass: 1
1095  3 pass: 1
1096  3 pass: 1
1097  3 pass: 1
1098  3 pass: 1
1099  3 pass: 1
1100  3 pass: 1
1101  3 pass: 1
1102  3 pass: 1
1103  3 pass: 1
1104  3 pass: 1
1105  3 pass: 1
1106  4 pass: 1
1107  4 pass: 1
1108  4 pass: 1
1109  4 pass: 1
1110  49 pass: 1
1111  51 pass: 1
1112  53 pass: 1
1113  56 pass: 1
1114  57 pass: 1
1115  59 pass: 1
1116  60 pass: 1
1117  60 pass: 1


1545  1546  1547  1548  1549  1550  1551  1552  1553  1554  1555  1556  1557  1558  1559  1560  1561  1562  1563  1564  1565  1566  1567  1568  1569  1570  1571  1572  1573  1574  1575  1576  1577  1578  1579  1580  1581  1582  1583  1584  1585  1586  1587  1588  1589  1590  1 pass: 1
1591  1 pass: 1
1592  1 pass: 1
1593  1 pass: 1
1594  1 pass: 1
1595  1 pass: 1
1596  1 pass: 1
1597  1 pass: 1
1598  1 pass: 1
1599  1 pass: 1
1600  1 pass: 1
1601  1 pass: 1
1602  1 pass: 1
1603  1 pass: 1
1604  1 pass: 1
1605  1606  1607  1608  1609  1610  1611  1612  1613  1614  1615  1616  1617  1618  1619  1620  1621  1622  1623  1624  1625  1626  1627  1628  1629  1630  1631  1632  1633  1634  1635  0.805397511051005 pass: 1
1636  0.8815779471939559 pass: 1
1637  0.9169873431868444 pass: 1
1638  0.7409145568273708 pass: 1
1639  0.07041445889356568 pass: 1
1640  0.7930380442045931 pass: 1
1641  0.7934719277370199 pass: 1
1642  0.9427358338394884 pass: 1
1643  0.9229815887970318 pass: 1
1644  0.45207

2040  3 pass: 1
2041  3 pass: 1
2042  3 pass: 1
2043  3 pass: 1
2044  3 pass: 1
2045  4 pass: 1
2046  4 pass: 1
2047  4 pass: 1
2048  4 pass: 1
2049  4 pass: 1
2050  4 pass: 1
2051  5 pass: 1
2052  5 pass: 1
2053  5 pass: 1
2054  4 pass: 1
2055  0.17049038616604795 pass: 1
2056  0.894626646858385 pass: 1
2057  0.9506248810318987 pass: 1
2058  0.15268451016175144 pass: 1
2059  0.41755928164128087 pass: 1
2060  0.5751003082271984 pass: 1
2061  0.36201874640696274 pass: 1
2062  0.8824018413751124 pass: 1
2063  0.835663735492809 pass: 1
2064  0.7080686487594978 pass: 1
2065  0.6261067138595788 pass: 1
2066  0.7121383333054665 pass: 1
2067  0.09154606986430702 pass: 1
2068  0.7769472052539331 pass: 1
2069  0.36218639233410166 pass: 1
2070  22 pass: 1
2071  24 pass: 1
2072  26 pass: 1
2073  28 pass: 1
2074  30 pass: 1
2075  32 pass: 1
2076  35 pass: 1
2077  38 pass: 1
2078  41 pass: 1
2079  44 pass: 1
2080  47 pass: 1
2081  50 pass: 1
2082  54 pass: 1
2083  58 pass: 1
2084  62 pass: 1
2085  

2541  0.8637949147089365 pass: 1
2542  0.9856181223922177 pass: 1
2543  0.011506966659452833 pass: 1
2544  0.5506195788302971 pass: 1
2545  0.8362765719479875 pass: 1
2546  0.3321121636053923 pass: 1
2547  0.3237995828817134 pass: 1
2548  0.7724812091142476 pass: 1
2549  0.5978171137873727 pass: 1
2550  33 pass: 1
2551  35 pass: 1
2552  37 pass: 1
2553  39 pass: 1
2554  41 pass: 1
2555  42 pass: 1
2556  44 pass: 1
2557  45 pass: 1
2558  46 pass: 1
2559  47 pass: 1
2560  47 pass: 1
2561  47 pass: 1
2562  47 pass: 1
2563  48 pass: 1
2564  48 pass: 1
2565  0.10437985456242937 pass: 1
2566  0.10828488673608738 pass: 1
2567  0.7885610264399611 pass: 1
2568  0.9550058661220846 pass: 1
2569  0.5053278979858187 pass: 1
2570  0.6486101067837008 pass: 1
2571  0.15598260874312675 pass: 1
2572  0.048019665541949585 pass: 1
2573  0.8858042516553952 pass: 1
2574  0.038618429108441044 pass: 1
2575  0.3073930597176946 pass: 1
2576  0.9505164526426554 pass: 1
2577  0.6135947880332188 pass: 1
2578  0.44

3000  3001  3002  3003  3004  3005  3006  3007  3008  3009  3010  3011  3012  3013  3014  3015  0.7240976160957538 pass: 1
3016  0.6932061451444196 pass: 1
3017  0.6624256851677249 pass: 1
3018  0.4273000894564425 pass: 1
3019  0.3509856267702347 pass: 1
3020  0.4355089134349248 pass: 1
3021  0.6073885643549118 pass: 1
3022  0.4502573322828527 pass: 1
3023  0.5779617941207508 pass: 1
3024  0.14370935140156238 pass: 1
3025  0.05251218792510659 pass: 1
3026  0.5383163442292882 pass: 1
3027  0.18487000222006245 pass: 1
3028  0.6651611843050346 pass: 1
3029  0.5070091722592971 pass: 1
3030  96 pass: 1
3031  99 pass: 1
3032  104 pass: 1
3033  110 pass: 1
3034  115 pass: 1
3035  120 pass: 1
3036  124 pass: 1
3037  130 pass: 1
3038  135 pass: 1
3039  141 pass: 1
3040  146 pass: 1
3041  152 pass: 1
3042  157 pass: 1
3043  161 pass: 1
3044  164 pass: 1
3045  5 pass: 1
3046  5 pass: 1
3047  5 pass: 1
3048  5 pass: 1
3049  6 pass: 1
3050  6 pass: 1
3051  6 pass: 1
3052  6 pass: 1
3053  6 pass: 1


In [87]:
main_data[['Country','Year','Under-Five_Deaths']].head()

Unnamed: 0,Country,Year,Under-Five_Deaths
0,Afghanistan,2014,86
1,Afghanistan,2013,89
2,Afghanistan,2012,93
3,Afghanistan,2011,97
4,Afghanistan,2010,101


In [88]:
under_5_data.head()

Unnamed: 0,Country,Year,Under-Five_Deaths
0,Afghanistan,2017,77
1,Afghanistan,2016,80
2,Afghanistan,2015,83
3,Afghanistan,2014,86
4,Afghanistan,2013,89


## Infant Deaths

In [89]:
infant_death_data = pd.read_csv("Data/New/Infant_Deaths/Infant_Deaths_Internet.csv")

In [90]:
infant_death_data.rename(columns = {infant_death_data.columns[3]: "Infant_Deaths"}, inplace=True)
infant_death_data.columns

Index(['Country', 'Year', 'Number of under-five deaths (thousands)',
       'Infant_Deaths', 'Number of neonatal deaths (thousands)'],
      dtype='object')

In [91]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(infant_death_data[infant_death_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            infant_death_other_data = infant_death_data[infant_death_data['Country'] == main_data['Country'][val]][infant_death_data['Year'] == main_data['Year'][val]]['Infant_Deaths'].values[0]
            if (infant_death_other_data == "&lt;1"):
                random.seed(val)
                infant_death_other_data = random.uniform(0, 1)
            print(infant_death_other_data, "pass: 1")
            main_data.at[val, 'Infant_Deaths'] = infant_death_other_data
        except IndexError:
            pass
    else:
        try:
            infant_death_other_data = infant_death_data[infant_death_data['Country'].str.startswith(main_data['Country'][val])][infant_death_data['Year'] == main_data['Year'][val]]['Infant_Deaths'].values[0]
            if (infant_death_other_data == "&lt;1"):
                random.seed(val)
                infant_death_other_data = random.uniform(0, 1)
            print(infant_death_other_data, "pass: 2")
            main_data.at[val, 'Infant_Deaths'] = infant_death_other_data
        except IndexError:
            try:
                infant_death_other_data = infant_death_data[infant_death_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][infant_death_data['Year'] == main_data['Year'][val]]['Infant_Deaths'].values[0]
                if (infant_death_other_data == "&lt;1"):
                    random.seed(val)
                    infant_death_other_data = random.uniform(0, 1)
                print(infant_death_other_data, "pass: 3")
                main_data.at[val, 'Infant_Deaths'] = infant_death_other_data
            except IndexError:
                pass
         

0  64 pass: 1
1  66 pass: 1
2  69 pass: 1
3  71 pass: 1
4  74 pass: 1
5  77 pass: 1
6  79 pass: 1
7  82 pass: 1
8  84 pass: 1
9  85 pass: 1
10  86 pass: 1
11  87 pass: 1
12  88 pass: 1
13  87 pass: 1
14  87 pass: 1
15  0.965242141552123 pass: 1
16  0.36152277491407514 pass: 1
17  0.5219839097124932 pass: 1
18  0.18126486333322134 pass: 1
19  0.6771258268002703 pass: 1
20  0.9056396761745207 pass: 1
21  0.16494947983319797 pass: 1
22  0.9582093798172728 pass: 1
23  1 pass: 1
24  1 pass: 1
25  1 pass: 1
26  1 pass: 1
27  1 pass: 1
28  1 pass: 1
29  1 pass: 1
30  21 pass: 1
31  21 pass: 1
32  21 pass: 1
33  21 pass: 1
34  21 pass: 1
35  20 pass: 1
36  20 pass: 1
37  20 pass: 1
38  20 pass: 1
39  19 pass: 1
40  19 pass: 1
41  20 pass: 1
42  20 pass: 1
43  20 pass: 1
44  21 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  0.3078067547337774 pass: 1
61  0.4944874359794347 pass: 1
62  0.9279915658776743 pass: 1
63  0.4451392251568228 pass: 1
64  0.47615826222934565 pass

  """
  from ipykernel import kernelapp as app


0.8597284451918654 pass: 1
75  69 pass: 1
76  71 pass: 1
77  73 pass: 1
78  76 pass: 1
79  79 pass: 1
80  82 pass: 1
81  85 pass: 1
82  88 pass: 1
83  90 pass: 1
84  92 pass: 1
85  94 pass: 1
86  95 pass: 1
87  96 pass: 1
88  96 pass: 1
89  96 pass: 1
90  0.20367044742105156 pass: 1
91  0.08352052115358566 pass: 1
92  0.4210446142866463 pass: 1
93  0.9123433593597492 pass: 1
94  0.5468015535366331 pass: 1
95  0.7601614783097744 pass: 1
96  0.37059431012468647 pass: 1
97  0.19453724793318106 pass: 1
98  0.35639820676272216 pass: 1
99  0.40397807494366633 pass: 1
100  0.1456692551041303 pass: 1
101  0.5811521325045647 pass: 1
102  0.1481712063870836 pass: 1
103  0.9790501200727744 pass: 1
104  0.9599609301949554 pass: 1
105  8 pass: 1
106  9 pass: 1
107  9 pass: 1
108  9 pass: 1
109  10 pass: 1
110  10 pass: 1
111  10 pass: 1
112  10 pass: 1
113  11 pass: 1
114  11 pass: 1
115  11 pass: 1
116  11 pass: 1
117  12 pass: 1
118  12 pass: 1
119  13 pass: 1
120  1 pass: 1
121  1 pass: 1
122  1

529  2 pass: 1
530  2 pass: 1
531  2 pass: 1
532  2 pass: 1
533  2 pass: 1
534  2 pass: 1
535  2 pass: 1
536  2 pass: 1
537  2 pass: 1
538  2 pass: 1
539  2 pass: 1
540  541  542  543  544  545  546  547  548  549  550  551  552  553  554  555  17 pass: 1
556  17 pass: 1
557  17 pass: 1
558  17 pass: 1
559  15 pass: 1
560  16 pass: 1
561  16 pass: 1
562  16 pass: 1
563  17 pass: 1
564  17 pass: 1
565  17 pass: 1
566  17 pass: 1
567  17 pass: 1
568  17 pass: 1
569  17 pass: 1
570  46 pass: 1
571  46 pass: 1
572  46 pass: 1
573  46 pass: 1
574  46 pass: 1
575  46 pass: 1
576  46 pass: 1
577  46 pass: 1
578  46 pass: 1
579  45 pass: 1
580  45 pass: 1
581  44 pass: 1
582  43 pass: 1
583  42 pass: 1
584  42 pass: 1
585  586  587  588  589  590  591  592  593  594  595  596  597  598  599  600  2 pass: 1
601  2 pass: 1
602  2 pass: 1
603  2 pass: 1
604  2 pass: 1
605  2 pass: 1
606  2 pass: 1
607  2 pass: 1
608  2 pass: 1
609  2 pass: 1
610  2 pass: 1
611  2 pass: 1
612  2 pass: 1
613  2 pas

1088  1 pass: 1
1089  1 pass: 1
1090  1 pass: 1
1091  1 pass: 1
1092  1 pass: 1
1093  2 pass: 1
1094  2 pass: 1
1095  2 pass: 1
1096  2 pass: 1
1097  2 pass: 1
1098  2 pass: 1
1099  2 pass: 1
1100  2 pass: 1
1101  2 pass: 1
1102  3 pass: 1
1103  3 pass: 1
1104  3 pass: 1
1105  3 pass: 1
1106  3 pass: 1
1107  3 pass: 1
1108  3 pass: 1
1109  3 pass: 1
1110  35 pass: 1
1111  36 pass: 1
1112  37 pass: 1
1113  38 pass: 1
1114  39 pass: 1
1115  40 pass: 1
1116  40 pass: 1
1117  41 pass: 1
1118  41 pass: 1
1119  41 pass: 1
1120  41 pass: 1
1121  41 pass: 1
1122  41 pass: 1
1123  42 pass: 1
1124  42 pass: 1
1125  1126  1127  1128  1129  1130  1131  1132  1133  1134  1135  1136  1137  1138  1139  1140  0.9400873360240022 pass: 1
1141  0.4029957439060219 pass: 1
1142  0.06696831363828093 pass: 1
1143  0.6662065360325989 pass: 1
1144  0.5104620222958949 pass: 1
1145  0.195319358936198 pass: 1
1146  0.7153390232074371 pass: 1
1147  0.8840275641394059 pass: 1
1148  0.4377120759515277 pass: 1
1149  

1605  1606  1607  1608  1609  1610  1611  1612  1613  1614  1615  1616  1617  1618  1619  1620  1621  1622  1623  1624  1625  1626  1627  1628  1629  1630  1631  1632  1633  1634  1635  0.805397511051005 pass: 1
1636  0.8815779471939559 pass: 1
1637  0.9169873431868444 pass: 1
1638  0.7409145568273708 pass: 1
1639  0.07041445889356568 pass: 1
1640  0.7930380442045931 pass: 1
1641  0.7934719277370199 pass: 1
1642  0.9427358338394884 pass: 1
1643  0.9229815887970318 pass: 1
1644  0.45207274446474566 pass: 1
1645  0.6943980102051107 pass: 1
1646  0.4124425866127627 pass: 1
1647  0.4456191395856227 pass: 1
1648  0.015002345865774314 pass: 1
1649  0.9248196081715394 pass: 1
1650  1 pass: 1
1651  1 pass: 1
1652  1 pass: 1
1653  1 pass: 1
1654  1 pass: 1
1655  1 pass: 1
1656  1 pass: 1
1657  1 pass: 1
1658  1 pass: 1
1659  1 pass: 1
1660  1 pass: 1
1661  1 pass: 1
1662  1 pass: 1
1663  1 pass: 1
1664  1 pass: 1
1665  4 pass: 1
1666  4 pass: 1
1667  4 pass: 1
1668  4 pass: 1
1669  4 pass: 1
16

2066  0.7121383333054665 pass: 1
2067  0.09154606986430702 pass: 1
2068  0.7769472052539331 pass: 1
2069  0.36218639233410166 pass: 1
2070  18 pass: 1
2071  19 pass: 1
2072  20 pass: 1
2073  22 pass: 1
2074  23 pass: 1
2075  25 pass: 1
2076  27 pass: 1
2077  29 pass: 1
2078  31 pass: 1
2079  33 pass: 1
2080  36 pass: 1
2081  38 pass: 1
2082  40 pass: 1
2083  43 pass: 1
2084  46 pass: 1
2085  1 pass: 1
2086  1 pass: 1
2087  1 pass: 1
2088  1 pass: 1
2089  1 pass: 1
2090  1 pass: 1
2091  1 pass: 1
2092  1 pass: 1
2093  1 pass: 1
2094  1 pass: 1
2095  1 pass: 1
2096  1 pass: 1
2097  1 pass: 1
2098  1 pass: 1
2099  1 pass: 1
2100  2101  2102  2103  2104  2105  2106  2107  2108  2109  2110  2111  2112  2113  2114  2115  0.35377902965232877 pass: 1
2116  0.5708711680055357 pass: 1
2117  0.1915366685191977 pass: 1
2118  0.4297625007377789 pass: 1
2119  0.17631605889904178 pass: 1
2120  0.9484940288298492 pass: 1
2121  0.8953841118460786 pass: 1
2122  0.39131008690415936 pass: 1
2123  0.704139

2494  6 pass: 1
2495  7 pass: 1
2496  7 pass: 1
2497  7 pass: 1
2498  8 pass: 1
2499  8 pass: 1
2500  9 pass: 1
2501  9 pass: 1
2502  9 pass: 1
2503  10 pass: 1
2504  10 pass: 1
2505  19 pass: 1
2506  20 pass: 1
2507  20 pass: 1
2508  20 pass: 1
2509  21 pass: 1
2510  21 pass: 1
2511  22 pass: 1
2512  22 pass: 1
2513  22 pass: 1
2514  23 pass: 1
2515  24 pass: 1
2516  24 pass: 1
2517  25 pass: 1
2518  26 pass: 1
2519  26 pass: 1
2520  1 pass: 1
2521  1 pass: 1
2522  1 pass: 1
2523  1 pass: 1
2524  1 pass: 1
2525  1 pass: 1
2526  1 pass: 1
2527  1 pass: 1
2528  1 pass: 1
2529  1 pass: 1
2530  1 pass: 1
2531  1 pass: 1
2532  1 pass: 1
2533  1 pass: 1
2534  1 pass: 1
2535  0.9155604442747851 pass: 1
2536  0.42034770141402633 pass: 1
2537  0.04501194939747777 pass: 1
2538  0.6249574086298229 pass: 1
2539  0.9358280583313839 pass: 1
2540  0.8232218924341809 pass: 1
2541  0.8637949147089365 pass: 1
2542  0.9856181223922177 pass: 1
2543  0.011506966659452833 pass: 1
2544  0.5506195788302971 p

2989  6 pass: 1
2990  6 pass: 1
2991  6 pass: 1
2992  6 pass: 1
2993  6 pass: 1
2994  6 pass: 1
2995  6 pass: 1
2996  6 pass: 1
2997  7 pass: 1
2998  7 pass: 1
2999  7 pass: 1
3000  3001  3002  3003  3004  3005  3006  3007  3008  3009  3010  3011  3012  3013  3014  3015  0.7240976160957538 pass: 1
3016  0.6932061451444196 pass: 1
3017  0.6624256851677249 pass: 1
3018  0.4273000894564425 pass: 1
3019  0.3509856267702347 pass: 1
3020  0.4355089134349248 pass: 1
3021  0.6073885643549118 pass: 1
3022  0.4502573322828527 pass: 1
3023  0.5779617941207508 pass: 1
3024  0.14370935140156238 pass: 1
3025  0.05251218792510659 pass: 1
3026  0.5383163442292882 pass: 1
3027  0.18487000222006245 pass: 1
3028  0.6651611843050346 pass: 1
3029  0.5070091722592971 pass: 1
3030  68 pass: 1
3031  69 pass: 1
3032  71 pass: 1
3033  74 pass: 1
3034  77 pass: 1
3035  79 pass: 1
3036  81 pass: 1
3037  84 pass: 1
3038  87 pass: 1
3039  90 pass: 1
3040  93 pass: 1
3041  96 pass: 1
3042  99 pass: 1
3043  100 pass:

## ADULT MORTALITY

In [92]:
adult_mor_data = pd.read_csv("Data/New/Adult_Mortality/Ad_Mor_Internet.csv")

In [93]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(adult_mor_data[adult_mor_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            adult_mor_other_data = adult_mor_data[adult_mor_data['Country'] == main_data['Country'][val]][adult_mor_data['Year'] == main_data['Year'][val]]['Adult_Mortality'].values[0]
            print(adult_mor_other_data, "pass: 1")
            main_data.at[val, 'Adult_Mortality'] = adult_mor_other_data
        except IndexError:
            pass
    else:
        try:
            adult_mor_other_data = adult_mor_data[adult_mor_data['Country'].str.startswith(main_data['Country'][val])][adult_mor_data['Year'] == main_data['Year'][val]]['Adult_Mortality'].values[0]
            print(adult_mor_other_data, "pass: 2")
            main_data.at[val, 'Adult_Mortality'] = adult_mor_other_data
        except IndexError:
            try:
                adult_mor_other_data = adult_mor_data[adult_mor_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][adult_mor_data['Year'] == main_data['Year'][val]]['Adult_Mortality'].values[0]
                print(adult_mor_other_data, "pass: 3")
                main_data.at[val, 'Adult_Mortality'] = adult_mor_other_data
            except IndexError:
                pass

0  234 pass: 1
1  235 pass: 1
2  242 pass: 1
3  248 pass: 1
4  255 pass: 1
5  260 pass: 1
6  265 pass: 1
7  273 pass: 1
8  276 pass: 1
9  277 pass: 1
10  282 pass: 1
11  286 pass: 1
12  292 pass: 1
13  307 pass: 1
14  316 pass: 1
15  98 pass: 1
16  100 pass: 1
17  103 pass: 1
18  103 pass: 1
19  103 pass: 1
20  103 pass: 1
21  102 pass: 1
22  101 pass: 1
23  101 pass: 1
24  106 pass: 1
25  101 pass: 1
26  107 pass: 1
27  102 pass: 1
28  100 pass: 1
29  106 pass: 1
30  98 pass: 1
31  100 pass: 1
32  101 pass: 1
33  103 pass: 1
34  104 pass: 1
35  107 pass: 1
36  108 pass: 1
37  111 pass: 1
38  115 pass: 1
39  119 pass: 1
40  125 pass: 1
41  133 pass: 1
42  135 pass: 1
43  139 pass: 1
44  142 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  61  62  63  64  65  66  67  68  69  70  71  72  73  74  75  244 pass: 1
76  249 pass: 1
77  253 pass: 1
78  260 pass: 1
79  270 pass: 1
80  281 pass: 1
81  292 pass: 1
82  303 pass: 1
83  314 pass: 1
84  323 pass: 1
85  334 pass

  """
  if sys.path[0] == '':


153 pass: 1
101  151 pass: 1
102  149 pass: 1
103  154 pass: 1
104  157 pass: 1
105  113 pass: 1
106  116 pass: 1
107  118 pass: 1
108  118 pass: 1
109  119 pass: 1
110  123 pass: 1
111  123 pass: 1
112  126 pass: 1
113  124 pass: 1
114  125 pass: 1
115  128 pass: 1
116  134 pass: 1
117  137 pass: 1
118  138 pass: 1
119  139 pass: 1
120  118 pass: 1
121  121 pass: 1
122  131 pass: 1
123  135 pass: 1
124  138 pass: 1
125  142 pass: 1
126  144 pass: 1
127  137 pass: 1
128  145 pass: 1
129  140 pass: 1
130  135 pass: 1
131  137 pass: 1
132  137 pass: 1
133  143 pass: 1
134  143 pass: 1
135  136  137  138  139  140  141  142  143  144  145  146  147  148  149  150  61 pass: 1
151  60 pass: 1
152  60 pass: 1
153  62 pass: 1
154  63 pass: 1
155  65 pass: 1
156  64 pass: 1
157  65 pass: 1
158  65 pass: 1
159  68 pass: 1
160  67 pass: 1
161  69 pass: 1
162  72 pass: 1
163  74 pass: 1
164  77 pass: 1
165  65 pass: 1
166  67 pass: 1
167  68 pass: 1
168  72 pass: 1
169  74 pass: 1
170  77 pass: 1

648  241 pass: 1
649  245 pass: 1
650  251 pass: 1
651  255 pass: 1
652  259 pass: 1
653  262 pass: 1
654  266 pass: 1
655  269 pass: 1
656  271 pass: 1
657  271 pass: 1
658  272 pass: 1
659  272 pass: 1
660  279 pass: 3
661  278 pass: 3
662  281 pass: 3
663  291 pass: 3
664  300 pass: 3
665  310 pass: 3
666  334 pass: 3
667  351 pass: 3
668  366 pass: 3
669  392 pass: 3
670  407 pass: 3
671  418 pass: 3
672  425 pass: 3
673  420 pass: 3
674  417 pass: 3
675  279 pass: 3
676  278 pass: 3
677  281 pass: 3
678  291 pass: 3
679  300 pass: 3
680  310 pass: 3
681  334 pass: 3
682  351 pass: 3
683  366 pass: 3
684  392 pass: 3
685  407 pass: 3
686  418 pass: 3
687  425 pass: 3
688  420 pass: 3
689  417 pass: 3
690  95 pass: 1
691  97 pass: 1
692  99 pass: 1
693  100 pass: 1
694  106 pass: 1
695  96 pass: 1
696  97 pass: 1
697  91 pass: 1
698  104 pass: 1
699  96 pass: 1
700  102 pass: 1
701  101 pass: 1
702  100 pass: 1
703  101 pass: 1
704  100 pass: 1
705  706  707  708  709  710  711  712

1262  256 pass: 1
1263  256 pass: 1
1264  683 pass: 1
1265  257 pass: 1
1266  266 pass: 1
1267  272 pass: 1
1268  282 pass: 1
1269  290 pass: 1
1270  318 pass: 1
1271  297 pass: 1
1272  300 pass: 1
1273  303 pass: 1
1274  306 pass: 1
1275  148 pass: 1
1276  149 pass: 1
1277  151 pass: 1
1278  153 pass: 1
1279  156 pass: 1
1280  156 pass: 1
1281  158 pass: 1
1282  160 pass: 1
1283  162 pass: 1
1284  164 pass: 1
1285  166 pass: 1
1286  170 pass: 1
1287  172 pass: 1
1288  174 pass: 1
1289  176 pass: 1
1290  1291  1292  1293  1294  1295  1296  1297  1298  1299  1300  1301  1302  1303  1304  1305  133 pass: 1
1306  136 pass: 1
1307  143 pass: 1
1308  147 pass: 1
1309  152 pass: 1
1310  160 pass: 1
1311  164 pass: 1
1312  176 pass: 1
1313  178 pass: 1
1314  182 pass: 1
1315  180 pass: 1
1316  184 pass: 1
1317  184 pass: 1
1318  185 pass: 1
1319  193 pass: 1
1320  55 pass: 1
1321  53 pass: 1
1322  50 pass: 1
1323  51 pass: 1
1324  53 pass: 1
1325  55 pass: 1
1326  57 pass: 1
1327  60 pass: 1


1836  288 pass: 1
1837  292 pass: 1
1838  298 pass: 1
1839  302 pass: 1
1840  310 pass: 1
1841  316 pass: 1
1842  321 pass: 1
1843  327 pass: 1
1844  335 pass: 1
1845  53 pass: 1
1846  57 pass: 1
1847  57 pass: 1
1848  59 pass: 1
1849  58 pass: 1
1850  61 pass: 1
1851  62 pass: 1
1852  65 pass: 1
1853  63 pass: 1
1854  63 pass: 1
1855  64 pass: 1
1856  66 pass: 1
1857  68 pass: 1
1858  69 pass: 1
1859  70 pass: 1
1860  1861  1862  1863  1864  1865  1866  1867  1868  1869  1870  1871  1872  1873  1874  1875  206 pass: 1
1876  207 pass: 1
1877  208 pass: 1
1878  211 pass: 1
1879  213 pass: 1
1880  214 pass: 1
1881  216 pass: 1
1882  219 pass: 1
1883  221 pass: 1
1884  224 pass: 1
1885  225 pass: 1
1886  226 pass: 1
1887  227 pass: 1
1888  228 pass: 1
1889  229 pass: 1
1890  148 pass: 1
1891  145 pass: 1
1892  152 pass: 1
1893  156 pass: 1
1894  162 pass: 1
1895  165 pass: 1
1896  165 pass: 1
1897  160 pass: 1
1898  162 pass: 1
1899  164 pass: 1
1900  164 pass: 1
1901  168 pass: 1
1902  1

2395  69 pass: 1
2396  70 pass: 1
2397  72 pass: 1
2398  73 pass: 1
2399  74 pass: 1
2400  140 pass: 1
2401  134 pass: 1
2402  141 pass: 1
2403  141 pass: 1
2404  155 pass: 1
2405  160 pass: 1
2406  160 pass: 1
2407  155 pass: 1
2408  158 pass: 1
2409  162 pass: 1
2410  166 pass: 1
2411  174 pass: 1
2412  178 pass: 1
2413  179 pass: 1
2414  175 pass: 1
2415  214 pass: 1
2416  221 pass: 1
2417  230 pass: 1
2418  237 pass: 1
2419  251 pass: 1
2420  256 pass: 1
2421  274 pass: 1
2422  279 pass: 1
2423  299 pass: 1
2424  326 pass: 1
2425  321 pass: 1
2426  325 pass: 1
2427  317 pass: 1
2428  311 pass: 1
2429  311 pass: 1
2430  207 pass: 1
2431  212 pass: 1
2432  219 pass: 1
2433  228 pass: 1
2434  239 pass: 1
2435  266 pass: 1
2436  263 pass: 1
2437  282 pass: 1
2438  321 pass: 1
2439  366 pass: 1
2440  399 pass: 1
2441  417 pass: 1
2442  429 pass: 1
2443  456 pass: 1
2444  451 pass: 1
2445  115 pass: 1
2446  118 pass: 1
2447  124 pass: 1
2448  127 pass: 1
2449  134 pass: 1
2450  164 pass:

3000  3001  3002  3003  3004  3005  3006  3007  3008  3009  3010  3011  3012  3013  3014  3015  3016  3017  3018  3019  3020  3021  3022  3023  3024  3025  3026  3027  3028  3029  3030  304 pass: 1
3031  316 pass: 1
3032  335 pass: 1
3033  348 pass: 1
3034  364 pass: 1
3035  383 pass: 1
3036  407 pass: 1
3037  416 pass: 1
3038  418 pass: 1
3039  448 pass: 1
3040  480 pass: 1
3041  494 pass: 1
3042  510 pass: 1
3043  523 pass: 1
3044  536 pass: 1
3045  212 pass: 1
3046  207 pass: 1
3047  211 pass: 1
3048  209 pass: 1
3049  218 pass: 1
3050  235 pass: 1
3051  275 pass: 1
3052  278 pass: 1
3053  268 pass: 1
3054  280 pass: 1
3055  269 pass: 1
3056  258 pass: 1
3057  257 pass: 1
3058  254 pass: 1
3059  258 pass: 1
3060  76 pass: 1
3061  78 pass: 1
3062  79 pass: 1
3063  80 pass: 1
3064  81 pass: 1
3065  83 pass: 1
3066  85 pass: 1
3067  86 pass: 1
3068  88 pass: 1
3069  91 pass: 1
3070  94 pass: 1
3071  98 pass: 1
3072  101 pass: 1
3073  104 pass: 1
3074  107 pass: 1
3075  68 pass: 2
3076 

In [94]:
#adult_mor_data.head()

In [95]:
#main_data.head()

## Life Expectancy

In [96]:
life_exp_data = pd.read_csv("Data/New/Life_Expectancy/life_exp_internet.csv")

In [97]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(life_exp_data[life_exp_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            life_exp_other_data = life_exp_data[life_exp_data['Country'] == main_data['Country'][val]][life_exp_data['Year'] == main_data['Year'][val]]['Life_Expectancy'].values[0]
            if regex_double_nums.match(life_exp_other_data):
                life_exp_other_data = life_exp_other_data.split(' ')[0]
                print('Regex Matched', end=' ')
            print(life_exp_other_data, "pass: 1")
            main_data.at[val, 'Life_Expectancy'] = life_exp_other_data
        except IndexError:
            pass
    else:
        try:
            life_exp_other_data = life_exp_data[life_exp_data['Country'].str.startswith(main_data['Country'][val])][life_exp_data['Year'] == main_data['Year'][val]]['Life_Expectancy'].values[0]
            if regex_double_nums.match(life_exp_other_data):
                life_exp_other_data = life_exp_other_data.split(' ')[0]
                print('Regex Matched', end=' ')
            print(life_exp_other_data, "pass: 2")
            main_data.at[val, 'Life_Expectancy'] = life_exp_other_data
        except IndexError:
            try:
                life_exp_other_data = life_exp_data[life_exp_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][life_exp_data['Year'] == main_data['Year'][val]]['Life_Expectancy'].values[0]
                if regex_double_nums.match(life_exp_other_data):
                    life_exp_other_data = life_exp_other_data.split(' ')[0]
                    print('Regex Matched', end=' ')
                print(life_exp_other_data, "pass: 3")
                main_data.at[val, 'Life_Expectancy'] = life_exp_other_data
            except IndexError:
                pass

0  63 pass: 1
1  62.7 pass: 1
2  62.2 pass: 1
3  61.7 pass: 1
4  61.2 pass: 1
5  60.7 pass: 1
6  60.2 pass: 1
7  59.6 pass: 1
8  59.2 pass: 1
9  58.9 pass: 1
10  58.4 pass: 1
11  58 pass: 1
12  57.4 pass: 1
13  56.5 pass: 1
14  55.9 pass: 1
15  76.1 pass: 1
16  75.7 pass: 1
17  75.2 pass: 1
18  75.1 pass: 1
19  74.7 pass: 1
20  74.4 pass: 1
21  74.2 pass: 1
22  74.1 pass: 1
23  73.9 pass: 1
24  73.5 pass: 1
25  73.3 pass: 1
26  72.9 pass: 1
27  73.5 pass: 1
28  74 pass: 1
29  73.1 pass: 1
30  76.1 pass: 1
31  75.9 pass: 1
32  75.8 pass: 1
33  75.6 pass: 1
34  75.4 pass: 1
35  75.1 pass: 1
36  74.8 pass: 1
37  74.4 pass: 1
38  74 pass: 1
39  73.4 pass: 1
40  72.8 pass: 1
41  72 pass: 1
42  71.7 pass: 1
43  71.2 pass: 1
44  70.8 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  61  62  63  64

  """
  from ipykernel import kernelapp as app


  65  66  67  68  69  70  71  72  73  74  75  61.7 pass: 1
76  61 pass: 1
77  60.4 pass: 1
78  59.5 pass: 1
79  58.4 pass: 1
80  57.3 pass: 1
81  56.1 pass: 1
82  55 pass: 1
83  53.8 pass: 1
84  52.7 pass: 1
85  51.5 pass: 1
86  50.5 pass: 1
87  49.4 pass: 1
88  48.2 pass: 1
89  47.3 pass: 1
90  74.6 pass: 1
91  74.8 pass: 1
92  74.8 pass: 1
93  75 pass: 1
94  74.7 pass: 1
95  74.5 pass: 1
96  74 pass: 1
97  73.8 pass: 1
98  73.5 pass: 1
99  73.4 pass: 1
100  73.3 pass: 1
101  73.3 pass: 1
102  73.4 pass: 1
103  73 pass: 1
104  72.5 pass: 1
105  76.7 pass: 1
106  76.3 pass: 1
107  76.2 pass: 1
108  76 pass: 1
109  75.7 pass: 1
110  75.8 pass: 1
111  75.7 pass: 1
112  75 pass: 1
113  75.4 pass: 1
114  75.1 pass: 1
115  74.9 pass: 1
116  74.2 pass: 1
117  74.2 pass: 1
118  74 pass: 1
119  74 pass: 1
120  74.5 pass: 1
121  74.5 pass: 1
122  74 pass: 1
123  73.6 pass: 1
124  73.3 pass: 1
125  73 pass: 1
126  73 pass: 1
127  73.2 pass: 1
128  72.6 pass: 1
129  72.7 pass: 1
130  72.6 pass: 1

616  75.8 pass: 1
617  75.6 pass: 1
618  75.4 pass: 1
619  75.2 pass: 1
620  75.1 pass: 1
621  74.7 pass: 1
622  74.7 pass: 1
623  74.4 pass: 1
624  74.2 pass: 1
625  73.9 pass: 1
626  73.5 pass: 1
627  73.2 pass: 1
628  72.7 pass: 1
629  72.1 pass: 1
630  74.7 pass: 1
631  74.4 pass: 1
632  74.3 pass: 1
633  74.2 pass: 1
634  73.5 pass: 1
635  73.5 pass: 1
636  73.4 pass: 1
637  73.4 pass: 1
638  73 pass: 1
639  72.9 pass: 1
640  72.5 pass: 1
641  72.1 pass: 1
642  71.4 pass: 1
643  71.2 pass: 1
644  71.1 pass: 1
645  63.3 pass: 1
646  63 pass: 1
647  62.6 pass: 1
648  62.3 pass: 1
649  61.8 pass: 1
650  61.4 pass: 1
651  61 pass: 1
652  60.7 pass: 1
653  60.4 pass: 1
654  60.1 pass: 1
655  59.8 pass: 1
656  59.7 pass: 1
657  59.6 pass: 1
658  59.6 pass: 1
659  59.5 pass: 1
660  63.3 pass: 3
661  63.1 pass: 3
662  62.8 pass: 3
663  62.2 pass: 3
664  61.6 pass: 3
665  60.9 pass: 3
666  59.7 pass: 3
667  58.6 pass: 3
668  57.5 pass: 3
669  56 pass: 3
670  54.8 pass: 3
671  54 pass: 3
67

1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  73.2 pass: 1
1171  73.2 pass: 1
1172  73.1 pass: 1
1173  72.9 pass: 1
1174  72.6 pass: 1
1175  72.4 pass: 1
1176  72.1 pass: 1
1177  71.8 pass: 1
1178  71.6 pass: 1
1179  71.3 pass: 1
1180  70.3 pass: 1
1181  71 pass: 1
1182  71 pass: 1
1183  70.8 pass: 1
1184  70.6 pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  72.6 pass: 1
1201  72.2 pass: 1
1202  72 pass: 1
1203  71.6 pass: 1
1204  71 pass: 1
1205  70.8 pass: 1
1206  71 pass: 1
1207  70.6 pass: 1
1208  69.7 pass: 1
1209  69.1 pass: 1
1210  69.4 pass: 1
1211  69.1 pass: 1
1212  69 pass: 1
1213  68.1 pass: 1
1214  67.6 pass: 1
1215  57.8 pass: 1
1216  58.4 pass: 1
1217  58 pass: 1
1218  57.6 pass: 1
1219  57.2 pass: 1
1220  56.5 pass: 1
1221  56 pass: 1
1222  55.4 pass: 1
1223  54.6 pass: 1
1224  53.7 pass: 1
1225  52.8 pass: 1
1226  52.1 pass: 1
1227  51.7 pass: 1
1228  51.3 pass: 1


1710  1711  1712  1713  1714  1715  1716  1717  1718  1719  1720  1721  1722  1723  1724  1725  74.5 pass: 1
1726  73.9 pass: 1
1727  73.8 pass: 1
1728  73.5 pass: 1
1729  73.2 pass: 1
1730  72.7 pass: 1
1731  71.6 pass: 1
1732  70.6 pass: 1
1733  70.9 pass: 1
1734  71 pass: 1
1735  71.9 pass: 1
1736  71.9 pass: 1
1737  71.7 pass: 1
1738  71.5 pass: 1
1739  72 pass: 1
1740  82.3 pass: 1
1741  82.1 pass: 1
1742  81.8 pass: 1
1743  81.5 pass: 1
1744  81.4 pass: 1
1745  81.4 pass: 1
1746  81.1 pass: 1
1747  80.6 pass: 1
1748  80.2 pass: 1
1749  80 pass: 1
1750  79.5 pass: 1
1751  79.1 pass: 1
1752  78.7 pass: 1
1753  78.7 pass: 1
1754  78.4 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  65.3 pass: 1
1771  64.9 pass: 1
1772  64.5 pass: 1
1773  64 pass: 1
1774  63.5 pass: 1
1775  62.9 pass: 1
1776  62.4 pass: 1
1777  61.9 pass: 1
1778  61.5 pass: 1
1779  61 pass: 1
1780  60.6 pass: 1
1781  60.2 pass: 1
1782  59.7 pass: 1
1783  59.1 pa

2281  65.2 pass: 1
2282  65 pass: 1
2283  64.8 pass: 1
2284  64.6 pass: 1
2285  64.4 pass: 1
2286  64.2 pass: 1
2287  63.8 pass: 1
2288  63.4 pass: 1
2289  63.1 pass: 1
2290  62.7 pass: 1
2291  62.5 pass: 1
2292  62.3 pass: 1
2293  62.1 pass: 1
2294  61.9 pass: 1
2295  74 pass: 1
2296  73.8 pass: 1
2297  73.7 pass: 1
2298  73.6 pass: 1
2299  73.4 pass: 1
2300  73.1 pass: 1
2301  72.8 pass: 1
2302  72.5 pass: 1
2303  72.3 pass: 1
2304  72.1 pass: 1
2305  71.9 pass: 1
2306  71.7 pass: 1
2307  71.6 pass: 1
2308  71.4 pass: 1
2309  71.1 pass: 1
2310  75.4 pass: 1
2311  75.2 pass: 1
2312  75 pass: 1
2313  74.8 pass: 1
2314  74.6 pass: 1
2315  74.3 pass: 1
2316  74.1 pass: 1
2317  73.8 pass: 1
2318  73.5 pass: 1
2319  73.2 pass: 1
2320  72.9 pass: 1
2321  72.5 pass: 1
2322  72.1 pass: 1
2323  71.7 pass: 1
2324  71.3 pass: 1
2325  69 pass: 1
2326  68.7 pass: 1
2327  68.6 pass: 1
2328  68.5 pass: 1
2329  68.3 pass: 1
2330  67.9 pass: 1
2331  67.9 pass: 1
2332  67.8 pass: 1
2333  67.3 pass: 1
2

2804  67.7 pass: 1
2805  82.3 pass: 1
2806  82.1 pass: 1
2807  81.8 pass: 1
2808  81.8 pass: 1
2809  81.5 pass: 1
2810  81.5 pass: 1
2811  81.2 pass: 1
2812  81 pass: 1
2813  80.9 pass: 1
2814  80.6 pass: 1
2815  80.4 pass: 1
2816  80.3 pass: 1
2817  80.1 pass: 1
2818  80 pass: 1
2819  79.7 pass: 1
2820  83.3 pass: 1
2821  82.9 pass: 1
2822  82.8 pass: 1
2823  82.7 pass: 1
2824  82.4 pass: 1
2825  82.1 pass: 1
2826  82.1 pass: 1
2827  81.8 pass: 1
2828  81.6 pass: 1
2829  81.2 pass: 1
2830  81.1 pass: 1
2831  80.6 pass: 1
2832  80.5 pass: 1
2833  80.3 pass: 1
2834  79.8 pass: 1
2835  60 pass: 1
2836  61.6 pass: 1
2837  65 pass: 1
2838  72.7 pass: 1
2839  73.8 pass: 1
2840  73.8 pass: 1
2841  73.7 pass: 1
2842  73.6 pass: 1
2843  73.5 pass: 1
2844  73.4 pass: 1
2845  73.3 pass: 1
2846  73.2 pass: 1
2847  73.2 pass: 1
2848  73.1 pass: 1
2849  73 pass: 1
2850  70.4 pass: 1
2851  70.3 pass: 1
2852  70.1 pass: 1
2853  70 pass: 1
2854  69.7 pass: 1
2855  69.7 pass: 1
2856  69 pass: 1
2857  6

In [98]:
#main_data[['Country','Year','Life_Expectancy']].head()

## Percentage Expenditure

In [99]:
per_exp = pd.read_csv("Data/New/Percent_Expenditure/Percent_Exp_Internet.csv")

In [100]:
count = 0
per_exp_data = pd.DataFrame(columns=['Country', 'Year', 'Percentage_Expenditure'])
for i in range(0, len(per_exp['Country'].unique())):
    for j in range(1, len(per_exp.columns)):
        #print(per_exp.loc[i,'Country'], end='')
        per_exp_data.at[count, 'Country'] = per_exp.loc[i,'Country']
        per_exp_data.at[count, 'Year'] = per_exp.columns[j]
       # print(per_exp.columns[j])
        per_exp_data.at[count, 'Percentage_Expenditure'] = per_exp[per_exp['Country'] == per_exp['Country'][i]].T[1:].loc[per_exp.columns[j]].values[0]
        count+=1

In [101]:
per_exp_data['Year'] = per_exp_data['Year'].astype(np.int64)

In [102]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(per_exp_data[per_exp_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            per_exp_other_data = per_exp_data[per_exp_data['Country'] == main_data['Country'][val]][per_exp_data['Year'] == main_data['Year'][val]]['Percentage_Expenditure'].values[0]
            print(per_exp_other_data, "pass: 1")
            main_data.at[val, 'Percentage_Expenditure'] = per_exp_other_data
        except IndexError:
            pass
    else:
        try:
            per_exp_other_data = per_exp_data[per_exp_data['Country'].str.startswith(main_data['Country'][val])][per_exp_data['Year'] == main_data['Year'][val]]['Percentage_Expenditure'].values[0]
            print(per_exp_other_data, "pass: 2")
            main_data.at[val, 'Percentage_Expenditure'] = per_exp_other_data
        except IndexError:
            try:
                per_exp_other_data = per_exp_data[per_exp_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][per_exp_data['Year'] == main_data['Year'][val]]['Percentage_Expenditure'].values[0]
                print(per_exp_other_data, "pass: 3")
                main_data.at[val, 'Percentage_Expenditure'] = per_exp_other_data
            except IndexError:
                pass

0  9.7 pass: 1
1  8.8 pass: 1
2  7.9 pass: 1
3  8.6 pass: 1
4  8.6 pass: 1
5  9.8 pass: 1
6  10.3 pass: 1
7  9.9 pass: 1
8  10.6 pass: 1
9  9.9 pass: 1
10  9.8 pass: 1
11  8.9 pass: 1
12  9.4 pass: 1
13  No data pass: 1
14  No data pass: 1
15  7 pass: 1
16  6.3 pass: 1
17  5.9 pass: 1
18  5.6 pass: 1
19  5 pass: 1
20  5.1 pass: 1
21  5.6 pass: 1
22  6.1 pass: 1
23  5.9 pass: 1
24  6.3 pass: 1
25  6.6 pass: 1
26  6.4 pass: 1
27  6.4 pass: 1
28  6.5 pass: 1
29  6.8 pass: 1
30  6.5 pass: 1
31  6 pass: 1
32  6 pass: 1
33  5.3 pass: 1
34  5.1 pass: 1
35  5.4 pass: 1
36  4.2 pass: 1
37  3.8 pass: 1
38  3.4 pass: 1
39  3.2 pass: 1
40  3.5 pass: 1
41  3.6 pass: 1
42  3.7 pass: 1
43  3.8 pass: 1
44  3.5 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  12 pass: 1
61  14.2 pass: 1
62  12.1 pass: 1
63  11.8 pass: 1
64  11.6 pass: 1
65  10.9 pass: 1
66  10.4 pass: 1
67  9.8

  """
  if sys.path[0] == '':


 pass: 1
68  9.7 pass: 1
69  9.8 pass: 1
70  9.2 pass: 1
71  9.2 pass: 1
72  9.4 pass: 1
73  9.4 pass: 1
74  9.3 pass: 1
75  2.8 pass: 1
76  3 pass: 1
77  2.7 pass: 1
78  2.8 pass: 1
79  2.7 pass: 1
80  3.6 pass: 1
81  3.5 pass: 1
82  3.2 pass: 1
83  3.6 pass: 1
84  4 pass: 1
85  5 pass: 1
86  4.7 pass: 1
87  4.2 pass: 1
88  5.2 pass: 1
89  2.5 pass: 1
90  5.7 pass: 1
91  5.4 pass: 1
92  5.1 pass: 1
93  5.7 pass: 1
94  5.5 pass: 1
95  4.7 pass: 1
96  4.6 pass: 1
97  4.2 pass: 1
98  4.3 pass: 1
99  4.4 pass: 1
100  4.2 pass: 1
101  4.5 pass: 1
102  4.4 pass: 1
103  4.5 pass: 1
104  4.1 pass: 1
105  6.4 pass: 1
106  6.4 pass: 1
107  6.3 pass: 1
108  6.3 pass: 1
109  6.8 pass: 1
110  7 pass: 1
111  6.3 pass: 1
112  6.4 pass: 1
113  6.4 pass: 1
114  6.4 pass: 1
115  5.9 pass: 1
116  5.9 pass: 1
117  4.7 pass: 1
118  5.2 pass: 1
119  5 pass: 1
120  7 pass: 1
121  8.3 pass: 1
122  6.7 pass: 1
123  3.8 pass: 1
124  5.3 pass: 1
125  4.7 pass: 1
126  4.3 pass: 1
127  5.4 pass: 1
128  5.6 pass: 

636  6 pass: 1
637  5.7 pass: 1
638  5.7 pass: 1
639  5.5 pass: 1
640  5.1 pass: 1
641  5.6 pass: 1
642  5.3 pass: 1
643  5.6 pass: 1
644  5.5 pass: 1
645  8 pass: 1
646  8.3 pass: 1
647  8.3 pass: 1
648  9.5 pass: 1
649  8.7 pass: 1
650  8.7 pass: 1
651  9.1 pass: 1
652  9.4 pass: 1
653  9.7 pass: 1
654  10.1 pass: 1
655  10.2 pass: 1
656  10.6 pass: 1
657  11.2 pass: 1
658  10.9 pass: 1
659  12.1 pass: 1
660  2.4 pass: 3
661  2.4 pass: 3
662  2 pass: 3
663  1.9 pass: 3
664  2 pass: 3
665  2.2 pass: 3
666  2.2 pass: 3
667  2 pass: 3
668  1.8 pass: 3
669  1.9 pass: 3
670  2.1 pass: 3
671  2.1 pass: 3
672  1.9 pass: 3
673  2.4 pass: 3
674  1.7 pass: 3
675  2.4 pass: 3
676  2.4 pass: 3
677  2 pass: 3
678  1.9 pass: 3
679  2 pass: 3
680  2.2 pass: 3
681  2.2 pass: 3
682  2 pass: 3
683  1.8 pass: 3
684  1.9 pass: 3
685  2.1 pass: 3
686  2.1 pass: 3
687  1.9 pass: 3
688  2.4 pass: 3
689  1.7 pass: 3
690  8.2 pass: 1
691  8.3 pass: 1
692  8.1 pass: 1
693  8.4 pass: 1
694  8.1 pass: 1
695  7.

1213  6.7 pass: 1
1214  5.2 pass: 1
1215  4.3 pass: 1
1216  4.7 pass: 1
1217  4.6 pass: 1
1218  5.1 pass: 1
1219  4.4 pass: 1
1220  4.3 pass: 1
1221  4.3 pass: 1
1222  4.6 pass: 1
1223  4.3 pass: 1
1224  4.5 pass: 1
1225  4.6 pass: 1
1226  5 pass: 1
1227  6 pass: 1
1228  5.2 pass: 1
1229  5 pass: 1
1230  6.3 pass: 1
1231  4.7 pass: 1
1232  4.8 pass: 1
1233  5.4 pass: 1
1234  6.2 pass: 1
1235  6.6 pass: 1
1236  6.8 pass: 1
1237  6.8 pass: 1
1238  6.4 pass: 1
1239  6.3 pass: 1
1240  6.9 pass: 1
1241  5.7 pass: 1
1242  5.2 pass: 1
1243  6.1 pass: 1
1244  6.3 pass: 1
1245  5.1 pass: 1
1246  5 pass: 1
1247  4.8 pass: 1
1248  4.9 pass: 1
1249  4.6 pass: 1
1250  4.6 pass: 1
1251  4.2 pass: 1
1252  4 pass: 1
1253  4 pass: 1
1254  5.4 pass: 1
1255  5 pass: 1
1256  5.2 pass: 1
1257  4.8 pass: 1
1258  4.5 pass: 1
1259  4.4 pass: 1
1260  7.2 pass: 1
1261  7.2 pass: 1
1262  10.1 pass: 1
1263  10.6 pass: 1
1264  10.2 pass: 1
1265  8.7 pass: 1
1266  7.7 pass: 1
1267  6.8 pass: 1
1268  5.5 pass: 1
126

1787  8.5 pass: 1
1788  7.5 pass: 1
1789  7.2 pass: 1
1790  8.3 pass: 1
1791  8.6 pass: 1
1792  7.7 pass: 1
1793  6.9 pass: 1
1794  6.1 pass: 1
1795  5.7 pass: 1
1796  4.7 pass: 1
1797  3.9 pass: 1
1798  3.7 pass: 1
1799  4.4 pass: 1
1800  3.9 pass: 1
1801  3.7 pass: 1
1802  3.6 pass: 1
1803  3.5 pass: 1
1804  3.3 pass: 1
1805  3.4 pass: 1
1806  3.1 pass: 1
1807  3.3 pass: 1
1808  3.3 pass: 1
1809  2.9 pass: 1
1810  3 pass: 1
1811  3 pass: 1
1812  2.7 pass: 1
1813  2.7 pass: 1
1814  2.4 pass: 1
1815  13 pass: 1
1816  11 pass: 1
1817  8.4 pass: 1
1818  10.2 pass: 1
1819  9.3 pass: 1
1820  10.6 pass: 1
1821  11.6 pass: 1
1822  8.9 pass: 1
1823  8 pass: 1
1824  8.8 pass: 1
1825  7.5 pass: 1
1826  6.4 pass: 1
1827  7.1 pass: 1
1828  8 pass: 1
1829  7.4 pass: 1
1830  5.8 pass: 1
1831  5.4 pass: 1
1832  4.4 pass: 1
1833  4.1 pass: 1
1834  4.4 pass: 1
1835  4.7 pass: 1
1836  4.8 pass: 1
1837  5.2 pass: 1
1838  5.3 pass: 1
1839  5 pass: 1
1840  5.2 pass: 1
1841  4.6 pass: 1
1842  4.4 pass: 1
1

2320  4.8 pass: 1
2321  5 pass: 1
2322  5 pass: 1
2323  4.8 pass: 1
2324  4.4 pass: 1
2325  4.2 pass: 1
2326  4.5 pass: 1
2327  4.4 pass: 1
2328  4.2 pass: 1
2329  4.3 pass: 1
2330  4.4 pass: 1
2331  4 pass: 1
2332  3.9 pass: 1
2333  3.9 pass: 1
2334  3.9 pass: 1
2335  3.2 pass: 1
2336  3.2 pass: 1
2337  2.7 pass: 1
2338  2.9 pass: 1
2339  3.2 pass: 1
2340  6.2 pass: 1
2341  6.4 pass: 1
2342  6.2 pass: 1
2343  6.2 pass: 1
2344  6.4 pass: 1
2345  6.6 pass: 1
2346  6.4 pass: 1
2347  5.9 pass: 1
2348  5.8 pass: 1
2349  5.8 pass: 1
2350  5.9 pass: 1
2351  6 pass: 1
2352  6.1 pass: 1
2353  5.7 pass: 1
2354  5.3 pass: 1
2355  9 pass: 1
2356  9.1 pass: 1
2357  9.3 pass: 1
2358  9.5 pass: 1
2359  9.8 pass: 1
2360  9.9 pass: 1
2361  9.4 pass: 1
2362  9.1 pass: 1
2363  9.1 pass: 1
2364  9.4 pass: 1
2365  9.3 pass: 1
2366  8.9 pass: 1
2367  8.6 pass: 1
2368  8.4 pass: 1
2369  8.4 pass: 1
2370  2371  2372  2373  2374  2375  2376  2377  2378  2379  2380  2381  2382  2383  2384  2385  2.4 pass: 1
23

2854  5.8 pass: 1
2855  5.9 pass: 1
2856  5.9 pass: 1
2857  5.5 pass: 1
2858  5 pass: 1
2859  5.2 pass: 1
2860  4.8 pass: 1
2861  4.7 pass: 1
2862  4.2 pass: 1
2863  4.3 pass: 1
2864  4.3 pass: 1
2865  2866  2867  2868  2869  2870  2871  2872  2873  2874  2875  2876  2877  2878  2879  2880  3.7 pass: 1
2881  3.5 pass: 1
2882  3.5 pass: 1
2883  3.8 pass: 1
2884  3.6 pass: 1
2885  3.9 pass: 1
2886  3.7 pass: 1
2887  3.4 pass: 1
2888  3.3 pass: 1
2889  3.4 pass: 1
2890  3.4 pass: 1
2891  3.5 pass: 1
2892  3.5 pass: 1
2893  3.2 pass: 1
2894  3.2 pass: 1
2895  2.3 pass: 1
2896  1.7 pass: 1
2897  1.2 pass: 1
2898  1.2 pass: 1
2899  1.3 pass: 1
2900  1.6 pass: 1
2901  1 pass: 1
2902  1.1 pass: 1
2903  1 pass: 1
2904  1.3 pass: 1
2905  1.7 pass: 1
2906  2.8 pass: 1
2907  2.4 pass: 1
2908  No data pass: 1
2909  No data pass: 1
2910  6.5 pass: 1
2911  6.6 pass: 1
2912  6.1 pass: 1
2913  6.2 pass: 1
2914  6.3 pass: 1
2915  5.2 pass: 1
2916  4.6 pass: 1
2917  4.6 pass: 1
2918  4.4 pass: 1
2919  4.

In [103]:
#main_data[['Country','Year','Percentage_Expenditure']].head(10)

In [104]:
#per_exp_data.head(10)

## Alcohol

In [105]:
alcohol_2000_2009 = pd.read_csv("Data/New/Alcohol/Alcohol_2000_2009.csv")

In [106]:
#alcohol_2000_2009.tail(10)

In [107]:
count = 0
count_country = 0
alcohol_2000_2009_data = pd.DataFrame(columns=['Country', 'Year', 'Alcohol'])
for i in range(0, len(alcohol_2000_2009['Country'].unique())+1):
    for j in range(2, len(alcohol_2000_2009.columns)):
        print(alcohol_2000_2009.loc[count_country,'Country'], end=' ')
        alcohol_2000_2009_data.at[count, 'Country'] = alcohol_2000_2009.loc[count_country,'Country']
        alcohol_2000_2009_data.at[count, 'Year'] = alcohol_2000_2009.columns[j]
        print(i, count_country)
        alcohol_2000_2009_data.at[count, 'Alcohol'] = alcohol_2000_2009[alcohol_2000_2009['Country'] == alcohol_2000_2009['Country'][count_country]].T[1:].loc[alcohol_2000_2009.columns[j]].values[0]
        count+=1
    count_country += 5

Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30


Dominica 50 250
Dominica 50 250
Dominica 50 250
Dominica 50 250
Dominica 50 250
Dominica 50 250
Dominica 50 250
Dominica 50 250
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Dominican Republic 51 255
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Ecuador 52 260
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
Egypt 53 265
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
El Salvador 54 270
Equatorial Guinea 55 275
Equatorial Guinea 55 275
Equatorial Guinea 55 275
Equatorial Guinea 55 275
Equatorial Guinea 55 275
Equatorial Guinea

Mauritius 108 540
Mauritius 108 540
Mauritius 108 540
Mauritius 108 540
Mauritius 108 540
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Mexico 109 545
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Micronesia (Federated States of) 110 550
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Mongolia 111 555
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegro 112 560
Montenegr

Sierra Leone 152 760
Sierra Leone 152 760
Sierra Leone 152 760
Sierra Leone 152 760
Sierra Leone 152 760
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Singapore 153 765
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovakia 154 770
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Slovenia 155 775
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Solomon Islands 156 780
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia

In [108]:
#alcohol_2000_2009_data[alcohol_2000_2009_data["Country"] == "Zimbabwe"]

In [109]:
alcohol_2010_X = pd.read_csv("Data/New/Alcohol/Alcohol_2010_x.csv")

In [110]:
count = 0
count_country = 0
alcohol_2010_X_data = pd.DataFrame(columns=['Country', 'Year', 'Alcohol'])
for i in range(0, len(alcohol_2010_X['Country'].unique())+1):
    for j in range(2, len(alcohol_2010_X.columns)):
        print(alcohol_2010_X.loc[count_country,'Country'], end=' ')
        alcohol_2010_X_data.at[count, 'Country'] = alcohol_2010_X.loc[count_country,'Country']
        alcohol_2010_X_data.at[count, 'Year'] = alcohol_2010_X.columns[j]
        print(i, count_country)
        alcohol_2010_X_data.at[count, 'Alcohol'] = alcohol_2010_X[alcohol_2010_X['Country'] == alcohol_2010_X['Country'][count_country]].T[1:].loc[alcohol_2010_X.columns[j]].values[0]
        count+=1
    count_country += 5

Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Afghanistan 0 0
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Albania 1 5
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Algeria 2 10
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Andorra 3 15
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Angola 4 20
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Antigua and Barbuda 5 25
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30
Argentina 6 30
Armenia 7 35
Armenia 7 35
Armenia 7 35
Armenia 7 35
Armenia 7 35
Armenia 7 35
Armenia 7 35
Australia 8 40
Australia 8 40
Australia 8 40
Australia 8 40
Australia 8 40
Australia 8 40
Australia 8 40
Austria 9 45
Austria 9 45
Austria 9 45
Austria 9 45
Austria 9 

Guinea 71 355
Guinea 71 355
Guinea 71 355
Guinea 71 355
Guinea 71 355
Guinea-Bissau 72 360
Guinea-Bissau 72 360
Guinea-Bissau 72 360
Guinea-Bissau 72 360
Guinea-Bissau 72 360
Guinea-Bissau 72 360
Guinea-Bissau 72 360
Guyana 73 365
Guyana 73 365
Guyana 73 365
Guyana 73 365
Guyana 73 365
Guyana 73 365
Guyana 73 365
Haiti 74 370
Haiti 74 370
Haiti 74 370
Haiti 74 370
Haiti 74 370
Haiti 74 370
Haiti 74 370
Honduras 75 375
Honduras 75 375
Honduras 75 375
Honduras 75 375
Honduras 75 375
Honduras 75 375
Honduras 75 375
Hungary 76 380
Hungary 76 380
Hungary 76 380
Hungary 76 380
Hungary 76 380
Hungary 76 380
Hungary 76 380
Iceland 77 385
Iceland 77 385
Iceland 77 385
Iceland 77 385
Iceland 77 385
Iceland 77 385
Iceland 77 385
India 78 390
India 78 390
India 78 390
India 78 390
India 78 390
India 78 390
India 78 390
Indonesia 79 395
Indonesia 79 395
Indonesia 79 395
Indonesia 79 395
Indonesia 79 395
Indonesia 79 395
Indonesia 79 395
Iran (Islamic Republic of) 80 400
Iran (Islamic Republic of) 8

Solomon Islands 156 780
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
Somalia 157 785
South Africa 158 790
South Africa 158 790
South Africa 158 790
South Africa 158 790
South Africa 158 790
South Africa 158 790
South Africa 158 790
Spain 159 795
Spain 159 795
Spain 159 795
Spain 159 795
Spain 159 795
Spain 159 795
Spain 159 795
Sri Lanka 160 800
Sri Lanka 160 800
Sri Lanka 160 800
Sri Lanka 160 800
Sri Lanka 160 800
Sri Lanka 160 800
Sri Lanka 160 800
Sudan 161 805
Sudan 161 805
Sudan 161 805
Sudan 161 805
Sudan 161 805
Sudan 161 805
Sudan 161 805
Suriname 162 810
Suriname 162 810
Suriname 162 810
Suriname 162 810
Suriname 162 810
Suriname 162 810
Suriname 162 810
Sweden 163 815
Sweden 163 815
Sweden 163 815
Sweden 163 815
Sweden 163 815
Sweden 163 815
Sweden 163 815
Switzerland 164 820
Switzerland 164 820
Switzerland 164 820
Switzerland 164 820
Switzerland 164 820
Switzerland 164 820
Switzerland 164 820
Syrian Arab Republic 165 825
Sy

In [111]:
alcohol_2000_2009_data['Year'] = alcohol_2000_2009_data['Year'].astype(np.int64)
alcohol_2010_X_data['Year'] = alcohol_2010_X_data['Year'].astype(np.int64)

In [112]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(per_exp_data[per_exp_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            per_exp_other_data = per_exp_data[per_exp_data['Country'] == main_data['Country'][val]][per_exp_data['Year'] == main_data['Year'][val]]['Percentage_Expenditure'].values[0]
            print(per_exp_other_data, "pass: 1")
            main_data.at[val, 'Percentage_Expenditure'] = per_exp_other_data
        except IndexError:
            pass
    else:
        try:
            per_exp_other_data = per_exp_data[per_exp_data['Country'].str.startswith(main_data['Country'][val])][per_exp_data['Year'] == main_data['Year'][val]]['Percentage_Expenditure'].values[0]
            print(per_exp_other_data, "pass: 2")
            main_data.at[val, 'Percentage_Expenditure'] = per_exp_other_data
        except IndexError:
            try:
                per_exp_other_data = per_exp_data[per_exp_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][per_exp_data['Year'] == main_data['Year'][val]]['Percentage_Expenditure'].values[0]
                print(per_exp_other_data, "pass: 3")
                main_data.at[val, 'Percentage_Expenditure'] = per_exp_other_data
            except IndexError:
                pass

0  9.7 pass: 1
1  8.8 pass: 1
2  7.9 pass: 1
3  8.6 pass: 1
4  8.6 pass: 1
5  9.8 pass: 1
6  10.3 pass: 1
7  9.9 pass: 1
8  10.6 pass: 1
9  9.9 pass: 1
10  9.8 pass: 1
11  8.9 pass: 1
12  9.4 pass: 1
13  No data pass: 1
14  No data pass: 1
15  7 pass: 1
16  6.3 pass: 1
17  5.9 pass: 1
18  5.6 pass: 1
19  5 pass: 1
20  5.1 pass: 1
21  5.6 pass: 1
22  6.1 pass: 1
23  5.9 pass: 1
24  6.3 pass: 1
25  6.6 pass: 1
26  6.4 pass: 1
27  6.4 pass: 1
28  6.5 pass: 1
29  6.8 pass: 1
30  6.5 pass: 1
31  6 pass: 1
32  6 pass: 1
33  5.3 pass: 1
34  5.1 pass: 1
35  5.4 pass: 1
36  4.2 pass: 1
37  3.8 pass: 1
38  3.4 pass: 1
39  3.2 pass: 1
40  3.5 pass: 1
41  3.6 pass: 1
42  3.7 pass: 1
43  3.8 pass: 1
44  3.5 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  58  59  60  12 pass: 1
61  14.2 pass: 1
62  12.1 pass: 1
63  11.8 pass: 1
64  11.6 pass: 1
65  10.9 pass: 1
66  10.4 pass: 1
67  9.8 pass: 1
68  9.7 pass: 1
69  9.8 pass: 1
70  9.2 pass: 1
71  

  """
  if sys.path[0] == '':


9.2 pass: 1
72  9.4 pass: 1
73  9.4 pass: 1
74  9.3 pass: 1
75  2.8 pass: 1
76  3 pass: 1
77  2.7 pass: 1
78  2.8 pass: 1
79  2.7 pass: 1
80  3.6 pass: 1
81  3.5 pass: 1
82  3.2 pass: 1
83  3.6 pass: 1
84  4 pass: 1
85  5 pass: 1
86  4.7 pass: 1
87  4.2 pass: 1
88  5.2 pass: 1
89  2.5 pass: 1
90  5.7 pass: 1
91  5.4 pass: 1
92  5.1 pass: 1
93  5.7 pass: 1
94  5.5 pass: 1
95  4.7 pass: 1
96  4.6 pass: 1
97  4.2 pass: 1
98  4.3 pass: 1
99  4.4 pass: 1
100  4.2 pass: 1
101  4.5 pass: 1
102  4.4 pass: 1
103  4.5 pass: 1
104  4.1 pass: 1
105  6.4 pass: 1
106  6.4 pass: 1
107  6.3 pass: 1
108  6.3 pass: 1
109  6.8 pass: 1
110  7 pass: 1
111  6.3 pass: 1
112  6.4 pass: 1
113  6.4 pass: 1
114  6.4 pass: 1
115  5.9 pass: 1
116  5.9 pass: 1
117  4.7 pass: 1
118  5.2 pass: 1
119  5 pass: 1
120  7 pass: 1
121  8.3 pass: 1
122  6.7 pass: 1
123  3.8 pass: 1
124  5.3 pass: 1
125  4.7 pass: 1
126  4.3 pass: 1
127  5.4 pass: 1
128  5.6 pass: 1
129  7 pass: 1
130  8.2 pass: 1
131  5.6 pass: 1
132  5.7 p

611  7.3 pass: 1
612  7.3 pass: 1
613  7.2 pass: 1
614  7 pass: 1
615  5 pass: 1
616  4.9 pass: 1
617  4.8 pass: 1
618  4.6 pass: 1
619  4.5 pass: 1
620  4.6 pass: 1
621  4.3 pass: 1
622  4 pass: 1
623  4.2 pass: 1
624  4.3 pass: 1
625  4.4 pass: 1
626  4.6 pass: 1
627  4.5 pass: 1
628  4.4 pass: 1
629  4.5 pass: 1
630  6.4 pass: 1
631  6 pass: 1
632  6.1 pass: 1
633  5.9 pass: 1
634  6.1 pass: 1
635  6.4 pass: 1
636  6 pass: 1
637  5.7 pass: 1
638  5.7 pass: 1
639  5.5 pass: 1
640  5.1 pass: 1
641  5.6 pass: 1
642  5.3 pass: 1
643  5.6 pass: 1
644  5.5 pass: 1
645  8 pass: 1
646  8.3 pass: 1
647  8.3 pass: 1
648  9.5 pass: 1
649  8.7 pass: 1
650  8.7 pass: 1
651  9.1 pass: 1
652  9.4 pass: 1
653  9.7 pass: 1
654  10.1 pass: 1
655  10.2 pass: 1
656  10.6 pass: 1
657  11.2 pass: 1
658  10.9 pass: 1
659  12.1 pass: 1
660  2.4 pass: 3
661  2.4 pass: 3
662  2 pass: 3
663  1.9 pass: 3
664  2 pass: 3
665  2.2 pass: 3
666  2.2 pass: 3
667  2 pass: 3
668  1.8 pass: 3
669  1.9 pass: 3
670  2.1 

1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  5.3 pass: 1
1171  5.6 pass: 1
1172  5.8 pass: 1
1173  6.1 pass: 1
1174  6.1 pass: 1
1175  6 pass: 1
1176  5.7 pass: 1
1177  5.7 pass: 1
1178  5.8 pass: 1
1179  5.3 pass: 1
1180  5.1 pass: 1
1181  5.2 pass: 1
1182  5.8 pass: 1
1183  5.4 pass: 1
1184  5.1 pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  6.2 pass: 1
1201  6.2 pass: 1
1202  6.3 pass: 1
1203  6.2 pass: 1
1204  6.4 pass: 1
1205  6.6 pass: 1
1206  6.5 pass: 1
1207  6.7 pass: 1
1208  6.9 pass: 1
1209  6.6 pass: 1
1210  6.7 pass: 1
1211  6.8 pass: 1
1212  6.7 pass: 1
1213  6.7 pass: 1
1214  5.2 pass: 1
1215  4.3 pass: 1
1216  4.7 pass: 1
1217  4.6 pass: 1
1218  5.1 pass: 1
1219  4.4 pass: 1
1220  4.3 pass: 1
1221  4.3 pass: 1
1222  4.6 pass: 1
1223  4.3 pass: 1
1224  4.5 pass: 1
1225  4.6 pass: 1
1226  5 pass: 1
1227  6 pass: 1
1228  5.2 pass: 1
1229  5 pass: 1
1230  6.3 pass: 1


1749  7.2 pass: 1
1750  7.3 pass: 1
1751  7 pass: 1
1752  6.7 pass: 1
1753  6.4 pass: 1
1754  5.9 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  4.9 pass: 1
1771  4 pass: 1
1772  3.8 pass: 1
1773  5 pass: 1
1774  5.4 pass: 1
1775  5.1 pass: 1
1776  4.6 pass: 1
1777  5.3 pass: 1
1778  5.6 pass: 1
1779  5.5 pass: 1
1780  5.5 pass: 1
1781  4.8 pass: 1
1782  5.9 pass: 1
1783  5.7 pass: 1
1784  5.3 pass: 1
1785  9.7 pass: 1
1786  11.6 pass: 1
1787  8.5 pass: 1
1788  7.5 pass: 1
1789  7.2 pass: 1
1790  8.3 pass: 1
1791  8.6 pass: 1
1792  7.7 pass: 1
1793  6.9 pass: 1
1794  6.1 pass: 1
1795  5.7 pass: 1
1796  4.7 pass: 1
1797  3.9 pass: 1
1798  3.7 pass: 1
1799  4.4 pass: 1
1800  3.9 pass: 1
1801  3.7 pass: 1
1802  3.6 pass: 1
1803  3.5 pass: 1
1804  3.3 pass: 1
1805  3.4 pass: 1
1806  3.1 pass: 1
1807  3.3 pass: 1
1808  3.3 pass: 1
1809  2.9 pass: 1
1810  3 pass: 1
1811  3 pass: 1
1812  2.7 pass: 1
1813  2.7 pass: 1
1814  2.4 pass: 1
1

2286  3.1 pass: 1
2287  3.6 pass: 1
2288  3.7 pass: 1
2289  3.7 pass: 1
2290  4.1 pass: 1
2291  3.8 pass: 1
2292  3.5 pass: 1
2293  3.2 pass: 1
2294  3 pass: 1
2295  7.6 pass: 1
2296  7 pass: 1
2297  7.6 pass: 1
2298  6.7 pass: 1
2299  6.2 pass: 1
2300  6.2 pass: 1
2301  5.5 pass: 1
2302  5.4 pass: 1
2303  5.3 pass: 1
2304  5 pass: 1
2305  5 pass: 1
2306  4.9 pass: 1
2307  4.7 pass: 1
2308  5.5 pass: 1
2309  5.8 pass: 1
2310  5.1 pass: 1
2311  4.8 pass: 1
2312  4.7 pass: 1
2313  4.6 pass: 1
2314  4.7 pass: 1
2315  4.9 pass: 1
2316  4.4 pass: 1
2317  4.4 pass: 1
2318  4.5 pass: 1
2319  4.6 pass: 1
2320  4.8 pass: 1
2321  5 pass: 1
2322  5 pass: 1
2323  4.8 pass: 1
2324  4.4 pass: 1
2325  4.2 pass: 1
2326  4.5 pass: 1
2327  4.4 pass: 1
2328  4.2 pass: 1
2329  4.3 pass: 1
2330  4.4 pass: 1
2331  4 pass: 1
2332  3.9 pass: 1
2333  3.9 pass: 1
2334  3.9 pass: 1
2335  3.2 pass: 1
2336  3.2 pass: 1
2337  2.7 pass: 1
2338  2.9 pass: 1
2339  3.2 pass: 1
2340  6.2 pass: 1
2341  6.4 pass: 1
2342  

2854  5.8 pass: 1
2855  5.9 pass: 1
2856  5.9 pass: 1
2857  5.5 pass: 1
2858  5 pass: 1
2859  5.2 pass: 1
2860  4.8 pass: 1
2861  4.7 pass: 1
2862  4.2 pass: 1
2863  4.3 pass: 1
2864  4.3 pass: 1
2865  2866  2867  2868  2869  2870  2871  2872  2873  2874  2875  2876  2877  2878  2879  2880  3.7 pass: 1
2881  3.5 pass: 1
2882  3.5 pass: 1
2883  3.8 pass: 1
2884  3.6 pass: 1
2885  3.9 pass: 1
2886  3.7 pass: 1
2887  3.4 pass: 1
2888  3.3 pass: 1
2889  3.4 pass: 1
2890  3.4 pass: 1
2891  3.5 pass: 1
2892  3.5 pass: 1
2893  3.2 pass: 1
2894  3.2 pass: 1
2895  2.3 pass: 1
2896  1.7 pass: 1
2897  1.2 pass: 1
2898  1.2 pass: 1
2899  1.3 pass: 1
2900  1.6 pass: 1
2901  1 pass: 1
2902  1.1 pass: 1
2903  1 pass: 1
2904  1.3 pass: 1
2905  1.7 pass: 1
2906  2.8 pass: 1
2907  2.4 pass: 1
2908  No data pass: 1
2909  No data pass: 1
2910  6.5 pass: 1
2911  6.6 pass: 1
2912  6.1 pass: 1
2913  6.2 pass: 1
2914  6.3 pass: 1
2915  5.2 pass: 1
2916  4.6 pass: 1
2917  4.6 pass: 1
2918  4.4 pass: 1
2919  4.

In [113]:
alcohol_appended = alcohol_2010_X_data.append(alcohol_2000_2009_data)

In [114]:
alcohol_data = alcohol_appended.reset_index(drop=True)

In [115]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(alcohol_data[alcohol_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            alcohol_other_data = alcohol_data[alcohol_data['Country'] == main_data['Country'][val]][alcohol_data['Year'] == main_data['Year'][val]]['Alcohol'].values[0]
            print(alcohol_other_data, "pass: 1")
            main_data.at[val, 'Alcohol'] = alcohol_other_data
        except IndexError:
            pass
    else:
        try:
            alcohol_other_data = alcohol_data[alcohol_data['Country'].str.startswith(main_data['Country'][val])][alcohol_data['Year'] == main_data['Year'][val]]['Alcohol'].values[0]
            print(alcohol_other_data, "pass: 2")
            main_data.at[val, 'Alcohol'] = alcohol_other_data
        except IndexError:
            try:
                alcohol_other_data = alcohol_data[alcohol_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][alcohol_data['Year'] == main_data['Year'][val]]['Alcohol'].values[0]
                print(alcohol_other_data, "pass: 3")
                main_data.at[val, 'Alcohol'] = alcohol_other_data
            except IndexError:
                pass

0  0.03 pass: 1
1  0.03 pass: 1
2  0.04 pass: 1
3  0.04 pass: 1
4  0.03 pass: 1
5  0.03 pass: 1
6  0.03 pass: 1
7  0.03 pass: 1
8  0.03 pass: 1
9  0.02 pass: 1
10  0.02 pass: 1
11  0.01 pass: 1
12  0.01 pass: 1
13  0.0 pass: 1
14  0.0 pass: 1
15  4.81 pass: 1
16  5.06 pass: 1
17  5.43 pass: 1
18  5.65 pass: 1
19  5.53 pass: 1
20  6.04 pass: 1
21  5.82 pass: 1
22  5.76 pass: 1
23  5.46 pass: 1
24  5.3 pass: 1
25  4.67 pass: 1
26  4.43 pass: 1
27  4.01 pass: 1
28  4.71 pass: 1
29  3.98 pass: 1
30  0.56 pass: 1
31  0.54 pass: 1
32  0.49 pass: 1
33  0.44 pass: 1
34  0.39 pass: 1
35  0.48 pass: 1
36  0.43 pass: 1
37  0.39 pass: 1
38  0.43 pass: 1
39  0.55 pass: 1
40  0.52 pass: 1
41  0.39 pass: 1
42  0.43 pass: 1
43  0.27 pass: 1
44  0.32 pass: 1
45  46  47  48  49  50  51  52  53  54  55

  """
  if sys.path[0] == '':


  56  57  58  59  60  9.95 pass: 1
61  9.78 pass: 1
62  10.06 pass: 1
63  10.31 pass: 1
64  10.64 pass: 1
65  10.8 pass: 1
66  10.97 pass: 1
67  11.53 pass: 1
68  12.03 pass: 1
69  11.96 pass: 1
70  10.8 pass: 1
71  10.97 pass: 1
72  11.53 pass: 1
73  12.03 pass: 1
74  11.96 pass: 1
75  9.0 pass: 1
76  8.02 pass: 1
77  8.14 pass: 1
78  7.86 pass: 1
79  7.67 pass: 1
80  6.89 pass: 1
81  6.9 pass: 1
82  6.22 pass: 1
83  5.44 pass: 1
84  4.68 pass: 1
85  3.39 pass: 1
86  2.88 pass: 1
87  2.62 pass: 1
88  2.45 pass: 1
89  1.77 pass: 1
90  8.45 pass: 1
91  8.5 pass: 1
92  8.3 pass: 1
93  7.91 pass: 1
94  7.81 pass: 1
95  7.9 pass: 1
96  8.24 pass: 1
97  8.19 pass: 1
98  8.34 pass: 1
99  8.81 pass: 1
100  7.27 pass: 1
101  7.11 pass: 1
102  7.14 pass: 1
103  7.43 pass: 1
104  7.46 pass: 1
105  7.93 pass: 1
106  8.2 pass: 1
107  8.35 pass: 1
108  8.11 pass: 1
109  8.15 pass: 1
110  8.33 pass: 1
111  8.41 pass: 1
112  8.16 pass: 1
113  7.75 pass: 1
114  7.53 pass: 1
115  7.63 pass: 1
116  7.62

604  7.55 pass: 1
605  7.67 pass: 1
606  7.31 pass: 1
607  7.39 pass: 1
608  7.33 pass: 1
609  7.57 pass: 1
610  6.98 pass: 1
611  7.25 pass: 1
612  6.88 pass: 1
613  6.94 pass: 1
614  7.09 pass: 1
615  5.81 pass: 1
616  5.81 pass: 1
617  5.74 pass: 1
618  5.65 pass: 1
619  5.75 pass: 1
620  4.88 pass: 1
621  4.27 pass: 1
622  3.88 pass: 1
623  3.28 pass: 1
624  2.92 pass: 1
625  3.05 pass: 1
626  2.98 pass: 1
627  2.98 pass: 1
628  2.91 pass: 1
629  3.11 pass: 1
630  4.3 pass: 1
631  4.33 pass: 1
632  4.35 pass: 1
633  4.29 pass: 1
634  4.21 pass: 1
635  4.26 pass: 1
636  4.36 pass: 1
637  4.56 pass: 1
638  4.44 pass: 1
639  4.27 pass: 1
640  4.16 pass: 1
641  4.15 pass: 1
642  4.33 pass: 1
643  4.3 pass: 1
644  4.52 pass: 1
645  nan pass: 1
646  0.25 pass: 1
647  0.11 pass: 1
648  0.12 pass: 1
649  0.15 pass: 1
650  0.17 pass: 1
651  0.12 pass: 1
652  0.16 pass: 1
653  0.25 pass: 1
654  0.24 pass: 1
655  0.35 pass: 1
656  0.33 pass: 1
657  0.1 pass: 1
658  0.11 pass: 1
659  0.11 pass

1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  8.47 pass: 1
1171  8.37 pass: 1
1172  8.28 pass: 1
1173  8.11 pass: 1
1174  8.18 pass: 1
1175  8.42 pass: 1
1176  8.92 pass: 1
1177  9.04 pass: 1
1178  9.05 pass: 1
1179  8.79 pass: 1
1180  8.38 pass: 1
1181  9.76 pass: 1
1182  10.75 pass: 1
1183  9.64 pass: 1
1184  9.4 pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  1.65 pass: 1
1201  1.81 pass: 1
1202  1.9 pass: 1
1203  2.02 pass: 1
1204  1.99 pass: 1
1205  2.0 pass: 1
1206  2.06 pass: 1
1207  2.24 pass: 1
1208  2.22 pass: 1
1209  2.2 pass: 1
1210  2.25 pass: 1
1211  2.29 pass: 1
1212  2.26 pass: 1
1213  2.37 pass: 1
1214  2.48 pass: 1
1215  0.28 pass: 1
1216  0.22 pass: 1
1217  0.22 pass: 1
1218  0.22 pass: 1
1219  0.2 pass: 1
1220  0.18 pass: 1
1221  0.2 pass: 1
1222  0.19 pass: 1
1223  0.16 pass: 1
1224  0.2 pass: 1
1225  0.34 pass: 1
1226  0.18 pass: 1
1227  0.2 pass: 1
1228  0.17

1688  4.05 pass: 1
1689  4.19 pass: 1
1690  4.24 pass: 1
1691  4.22 pass: 1
1692  4.28 pass: 1
1693  4.41 pass: 1
1694  4.46 pass: 1
1695  nan pass: 1
1696  0.0 pass: 1
1697  0.01 pass: 1
1698  0.0 pass: 1
1699  0.0 pass: 1
1700  0.01 pass: 1
1701  0.01 pass: 1
1702  0.01 pass: 1
1703  0.01 pass: 1
1704  0.0 pass: 1
1705  0.01 pass: 1
1706  0.01 pass: 1
1707  0.01 pass: 1
1708  0.0 pass: 1
1709  0.01 pass: 1
1710  1711  1712  1713  1714  1715  1716  1717  1718  1719  1720  1721  1722  1723  1724  1725  14.82 pass: 1
1726  15.14 pass: 1
1727  15.15 pass: 1
1728  14.88 pass: 1
1729  13.61 pass: 1
1730  12.4 pass: 1
1731  13.3 pass: 1
1732  13.4 pass: 1
1733  12.7 pass: 1
1734  12.3 pass: 1
1735  12.1 pass: 1
1736  11.29 pass: 1
1737  11.0 pass: 1
1738  10.2 pass: 1
1739  9.87 pass: 1
1740  11.69 pass: 1
1741  11.55 pass: 1
1742  11.89 pass: 1
1743  12.01 pass: 1
1744  11.72 pass: 1
1745  11.6 pass: 1
1746  11.72 pass: 1
1747  11.94 pass: 1
1748  12.17 pass: 1
1749  12.02 pass: 1
1750  12

2250  2251  2252  2253  2254  2255  2256  2257  2258  2259  2260  2261  2262  2263  2264  2265  7.29 pass: 1
2266  7.35 pass: 1
2267  7.11 pass: 1
2268  7.05 pass: 1
2269  6.9 pass: 1
2270  6.9 pass: 1
2271  6.74 pass: 1
2272  6.15 pass: 1
2273  5.73 pass: 1
2274  5.55 pass: 1
2275  5.72 pass: 1
2276  5.55 pass: 1
2277  5.55 pass: 1
2278  5.47 pass: 1
2279  5.61 pass: 1
2280  0.76 pass: 1
2281  0.83 pass: 1
2282  0.87 pass: 1
2283  0.88 pass: 1
2284  0.79 pass: 1
2285  0.82 pass: 1
2286  0.81 pass: 1
2287  0.71 pass: 1
2288  0.64 pass: 1
2289  0.84 pass: 1
2290  0.58 pass: 1
2291  0.59 pass: 1
2292  0.61 pass: 1
2293  0.68 pass: 1
2294  0.74 pass: 1
2295  6.07 pass: 1
2296  6.14 pass: 1
2297  6.17 pass: 1
2298  6.6 pass: 1
2299  6.81 pass: 1
2300  6.64 pass: 1
2301  7.69 pass: 1
2302  6.66 pass: 1
2303  6.51 pass: 1
2304  5.98 pass: 1
2305  5.62 pass: 1
2306  4.76 pass: 1
2307  5.02 pass: 1
2308  5.82 pass: 1
2309  6.18 pass: 1
2310  5.14 pass: 1
2311  5.06 pass: 1
2312  5.38 pass: 1
2

2832  10.85 pass: 1
2833  11.12 pass: 1
2834  11.26 pass: 1
2835  0.2 pass: 1
2836  0.15 pass: 1
2837  0.21 pass: 1
2838  0.6 pass: 1
2839  0.76 pass: 1
2840  0.75 pass: 1
2841  0.74 pass: 1
2842  0.74 pass: 1
2843  0.75 pass: 1
2844  0.78 pass: 1
2845  0.6 pass: 1
2846  0.86 pass: 1
2847  0.9 pass: 1
2848  0.94 pass: 1
2849  0.92 pass: 1
2850  0.87 pass: 1
2851  0.79 pass: 1
2852  0.76 pass: 1
2853  0.7 pass: 1
2854  0.67 pass: 1
2855  0.68 pass: 1
2856  0.59 pass: 1
2857  0.59 pass: 1
2858  0.63 pass: 1
2859  0.76 pass: 1
2860  0.82 pass: 1
2861  0.88 pass: 1
2862  0.94 pass: 1
2863  0.94 pass: 1
2864  0.91 pass: 1
2865  2866  2867  2868  2869  2870  2871  2872  2873  2874  2875  2876  2877  2878  2879  2880  6.9 pass: 1
2881  6.79 pass: 1
2882  7.09 pass: 1
2883  7.14 pass: 1
2884  6.7 pass: 1
2885  6.74 pass: 1
2886  7.54 pass: 1
2887  6.14 pass: 1
2888  6.12 pass: 1
2889  6.21 pass: 1
2890  5.8 pass: 1
2891  5.95 pass: 1
2892  5.72 pass: 1
2893  5.75 pass: 1
2894  5.4 pass: 1
2895

## BMI 5-19 Years

In [116]:
bmi_5_19 = pd.read_csv("Data/New/BMI_5-19/BMI_5-19_Internet.csv")

In [117]:
bmi_5_19.rename(columns = {bmi_5_19.columns[0]: "Country"}, inplace=True)
bmi_5_19.head()

Unnamed: 0,Country,2016,2016.1,2016.2,2015,2015.1,2015.2,2014,2014.1,2014.2,...,1978.2,1977,1977.1,1977.2,1976,1976.1,1976.2,1975,1975.1,1975.2
0,Country,Both sexes,Male,Female,Both sexes,Male,Female,Both sexes,Male,Female,...,Female,Both sexes,Male,Female,Both sexes,Male,Female,Both sexes,Male,Female
1,Afghanistan,17.4 [16.2-18.7],16.7 [14.5-19.1],18.1 [17.4-18.8],17.3 [16.1-18.5],16.6 [14.4-18.9],18.0 [17.4-18.6],17.2 [16.1-18.4],16.5 [14.4-18.8],17.9 [17.3-18.5],...,15.9 [13.7-17.9],15.3 [13.7-16.9],14.8 [12.4-17.2],15.8 [13.6-17.9],15.3 [13.6-16.9],14.8 [12.3-17.3],15.8 [13.5-18.0],15.2 [13.5-16.9],14.7 [12.2-17.3],15.7 [13.3-18.0]
2,Albania,19.8 [19.3-20.4],20.0 [19.1-20.8],19.7 [19.0-20.3],19.9 [19.4-20.3],20.0 [19.3-20.7],19.7 [19.1-20.2],19.9 [19.5-20.3],20.1 [19.5-20.6],19.6 [19.2-20.1],...,17.8 [15.6-20.0],18.3 [16.8-19.8],18.8 [16.9-20.9],17.7 [15.5-20.1],18.2 [16.7-19.8],18.8 [16.7-21.0],17.7 [15.3-20.1],18.2 [16.5-19.8],18.7 [16.4-21.0],17.7 [15.2-20.2]
3,Algeria,19.7 [18.2-21.3],19.7 [17.6-21.9],19.7 [17.6-21.9],19.7 [18.2-21.2],19.7 [17.6-21.8],19.8 [17.7-21.8],19.8 [18.3-21.2],19.7 [17.7-21.8],19.8 [17.8-21.8],...,17.8 [15.4-20.1],17.4 [15.6-19.1],17.0 [14.7-19.5],17.7 [15.3-20.1],17.3 [15.5-19.1],17.0 [14.5-19.5],17.7 [15.2-20.2],17.3 [15.4-19.1],16.9 [14.3-19.5],17.6 [15.0-20.2]
4,Andorra,20.2 [18.6-21.7],20.3 [18.1-22.5],20.0 [17.9-22.2],20.2 [18.7-21.7],20.3 [18.2-22.5],20.0 [18.0-22.1],20.2 [18.7-21.6],20.3 [18.3-22.4],20.0 [18.0-22.0],...,19.0 [16.7-21.3],19.0 [17.4-20.7],19.0 [16.9-21.4],19.0 [16.6-21.3],18.9 [17.3-20.7],19.0 [16.7-21.4],18.9 [16.5-21.3],18.9 [17.1-20.7],18.9 [16.6-21.4],18.8 [16.3-21.3]


In [118]:
count = 0
bmi_5_19_data = pd.DataFrame(columns=['Country', 'Year', 'BMI_5-19_years'])
for i in range(1, len(bmi_5_19['Country'].unique())):
    j = 1
    while j < len(bmi_5_19.columns):
        #print(bmi_5_19.loc[i,'Country'], end='')
        bmi_5_19_data.at[count, 'Country'] = bmi_5_19.loc[i,'Country']
        bmi_5_19_data.at[count, 'Year'] = bmi_5_19.columns[j]
       # print(bmi_5_19.columns[j])
        bmi_5_19_data.at[count, 'BMI_5-19_years'] = bmi_5_19[bmi_5_19['Country'] == bmi_5_19['Country'][i]].T[1:].loc[bmi_5_19.columns[j]].values[0].split(' [')[0]
        count+=1
        j += 3

In [119]:
bmi_5_19_data.head()

Unnamed: 0,Country,Year,BMI_5-19_years
0,Afghanistan,2016,17.4
1,Afghanistan,2015,17.3
2,Afghanistan,2014,17.2
3,Afghanistan,2013,17.1
4,Afghanistan,2012,17.0


In [120]:
bmi_5_19_data['Year'] = bmi_5_19_data['Year'].astype(np.int64)

In [121]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(bmi_5_19_data[bmi_5_19_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            bmi_5_19_other_data = bmi_5_19_data[bmi_5_19_data['Country'] == main_data['Country'][val]][bmi_5_19_data['Year'] == main_data['Year'][val]]['BMI_5-19_years'].values[0]
            print(bmi_5_19_other_data, "pass: 1")
            main_data.at[val, 'BMI_5-19_years'] = bmi_5_19_other_data
        except IndexError:
            pass
    else:
        try:
            bmi_5_19_other_data = bmi_5_19_data[bmi_5_19_data['Country'].str.startswith(main_data['Country'][val])][bmi_5_19_data['Year'] == main_data['Year'][val]]['BMI_5-19_years'].values[0]
            print(bmi_5_19_other_data, "pass: 2")
            main_data.at[val, 'BMI_5-19_years'] = bmi_5_19_other_data
        except IndexError:
            try:
                bmi_5_19_other_data = bmi_5_19_data[bmi_5_19_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][bmi_5_19_data['Year'] == main_data['Year'][val]]['BMI_5-19_years'].values[0]
                print(bmi_5_19_other_data, "pass: 3")
                main_data.at[val, 'BMI_5-19_years'] = bmi_5_19_other_data
            except IndexError:
                pass

0  17.2 pass: 1
1  17.1 pass: 1
2  17.0 pass: 1
3  16.9 pass: 1
4  16.8 pass: 1
5  16.7 pass: 1
6  16.7 pass: 1
7  16.6 pass: 1
8  16.5 pass: 1
9  16.5 pass: 1
10  16.4 pass: 1
11  16.4 pass: 1
12  16.4 pass: 1
13  16.3 pass: 1
14  16.3 pass: 1
15  19.9 pass: 1
16  19.9 pass: 1
17  19.9 pass: 1
18  19.8 pass: 1
19  19.8 pass: 1
20  19.8 pass: 1
21  19.7 pass: 1
22  19.7 pass: 1
23  19.6 pass: 1
24  19.5 pass: 1
25  19.5 pass: 1
26  19.5 pass: 1
27  19.4 pass: 1
28  19.4 pass: 1
29  19.3 pass: 1
30  19.8 pass: 1
31  19.8 pass: 1
32  19.9 pass: 1
33  19.9 pass: 1
34  19.9 pass: 1
35  19.9 pass: 1
36  19.9 pass: 1
37  19.8 pass: 1
38  19.8 pass: 1
39  19.7 pass: 1
40  19.6 pass: 1
41  19.6 pass: 1
42  19.5 pass: 1
43  19.4 pass: 1
44  19.3 pass: 1
45  46  47  48  49  50  51  52  53  54  55  

  """
  if sys.path[0] == '':


56  57  58  59  60  20.2 pass: 1
61  20.2 pass: 1
62  20.2 pass: 1
63  20.3 pass: 1
64  20.3 pass: 1
65  20.4 pass: 1
66  20.4 pass: 1
67  20.4 pass: 1
68  20.4 pass: 1
69  20.4 pass: 1
70  20.4 pass: 1
71  20.4 pass: 1
72  20.4 pass: 1
73  20.4 pass: 1
74  20.4 pass: 1
75  17.6 pass: 1
76  17.5 pass: 1
77  17.5 pass: 1
78  17.5 pass: 1
79  17.4 pass: 1
80  17.4 pass: 1
81  17.4 pass: 1
82  17.3 pass: 1
83  17.3 pass: 1
84  17.3 pass: 1
85  17.2 pass: 1
86  17.2 pass: 1
87  17.2 pass: 1
88  17.1 pass: 1
89  17.1 pass: 1
90  21.3 pass: 1
91  21.2 pass: 1
92  21.1 pass: 1
93  21.0 pass: 1
94  20.9 pass: 1
95  20.8 pass: 1
96  20.7 pass: 1
97  20.6 pass: 1
98  20.5 pass: 1
99  20.4 pass: 1
100  20.3 pass: 1
101  20.3 pass: 1
102  20.2 pass: 1
103  20.1 pass: 1
104  20.0 pass: 1
105  20.6 pass: 1
106  20.5 pass: 1
107  20.5 pass: 1
108  20.4 pass: 1
109  20.4 pass: 1
110  20.3 pass: 1
111  20.3 pass: 1
112  20.2 pass: 1
113  20.1 pass: 1
114  20.1 pass: 1
115  20.0 pass: 1
116  20.0 pass: 

602  21.7 pass: 1
603  21.6 pass: 1
604  21.5 pass: 1
605  21.4 pass: 1
606  21.3 pass: 1
607  21.2 pass: 1
608  21.1 pass: 1
609  21.0 pass: 1
610  20.9 pass: 1
611  20.7 pass: 1
612  20.6 pass: 1
613  20.5 pass: 1
614  20.4 pass: 1
615  19.3 pass: 1
616  19.2 pass: 1
617  19.1 pass: 1
618  19.1 pass: 1
619  19.0 pass: 1
620  18.9 pass: 1
621  18.8 pass: 1
622  18.8 pass: 1
623  18.7 pass: 1
624  18.6 pass: 1
625  18.4 pass: 1
626  18.3 pass: 1
627  18.1 pass: 1
628  18.0 pass: 1
629  17.9 pass: 1
630  19.2 pass: 1
631  19.1 pass: 1
632  19.1 pass: 1
633  19.0 pass: 1
634  19.0 pass: 1
635  18.9 pass: 1
636  18.9 pass: 1
637  18.8 pass: 1
638  18.7 pass: 1
639  18.7 pass: 1
640  18.6 pass: 1
641  18.6 pass: 1
642  18.5 pass: 1
643  18.5 pass: 1
644  18.4 pass: 1
645  18.0 pass: 1
646  18.0 pass: 1
647  17.9 pass: 1
648  17.8 pass: 1
649  17.8 pass: 1
650  17.8 pass: 1
651  17.8 pass: 1
652  17.7 pass: 1
653  17.7 pass: 1
654  17.7 pass: 1
655  17.7 pass: 1
656  17.7 pass: 1
657  17.7 

1113  17.5 pass: 1
1114  17.5 pass: 1
1115  17.5 pass: 1
1116  17.4 pass: 1
1117  17.4 pass: 1
1118  17.4 pass: 1
1119  17.3 pass: 1
1120  17.3 pass: 1
1121  17.2 pass: 1
1122  17.2 pass: 1
1123  17.1 pass: 1
1124  17.1 pass: 1
1125  1126  1127  1128  1129  1130  1131  1132  1133  1134  1135  1136  1137  1138  1139  1140  21.0 pass: 1
1141  21.0 pass: 1
1142  20.9 pass: 1
1143  20.9 pass: 1
1144  20.9 pass: 1
1145  20.8 pass: 1
1146  20.8 pass: 1
1147  20.7 pass: 1
1148  20.6 pass: 1
1149  20.6 pass: 1
1150  20.5 pass: 1
1151  20.4 pass: 1
1152  20.4 pass: 1
1153  20.3 pass: 1
1154  20.3 pass: 1
1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  20.1 pass: 1
1171  20.0 pass: 1
1172  20.0 pass: 1
1173  19.9 pass: 1
1174  19.9 pass: 1
1175  19.8 pass: 1
1176  19.8 pass: 1
1177  19.7 pass: 1
1178  19.6 pass: 1
1179  19.5 pass: 1
1180  19.4 pass: 1
1181  19.3 pass: 1
1182  19.2 pass: 1
1183  19.1 pass: 1
1184  19.0 pass: 1
1185  1186  1187  1188

1701  19.8 pass: 1
1702  19.8 pass: 1
1703  19.8 pass: 1
1704  19.8 pass: 1
1705  19.8 pass: 1
1706  19.7 pass: 1
1707  19.7 pass: 1
1708  19.6 pass: 1
1709  19.5 pass: 1
1710  1711  1712  1713  1714  1715  1716  1717  1718  1719  1720  1721  1722  1723  1724  1725  19.4 pass: 1
1726  19.4 pass: 1
1727  19.5 pass: 1
1728  19.5 pass: 1
1729  19.5 pass: 1
1730  19.5 pass: 1
1731  19.5 pass: 1
1732  19.5 pass: 1
1733  19.4 pass: 1
1734  19.4 pass: 1
1735  19.3 pass: 1
1736  19.2 pass: 1
1737  19.1 pass: 1
1738  19.1 pass: 1
1739  19.0 pass: 1
1740  19.5 pass: 1
1741  19.5 pass: 1
1742  19.5 pass: 1
1743  19.4 pass: 1
1744  19.4 pass: 1
1745  19.4 pass: 1
1746  19.4 pass: 1
1747  19.4 pass: 1
1748  19.3 pass: 1
1749  19.3 pass: 1
1750  19.3 pass: 1
1751  19.3 pass: 1
1752  19.2 pass: 1
1753  19.2 pass: 1
1754  19.2 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  17.3 pass: 1
1771  17.3 pass: 1
1772  17.3 pass: 1
1773  17.2 pass: 1
177

2222  20.1 pass: 1
2223  20.0 pass: 1
2224  20.0 pass: 1
2225  19.9 pass: 1
2226  19.8 pass: 1
2227  19.7 pass: 1
2228  19.6 pass: 1
2229  19.5 pass: 1
2230  19.4 pass: 1
2231  19.4 pass: 1
2232  19.3 pass: 1
2233  19.2 pass: 1
2234  19.1 pass: 1
2235  17.2 pass: 1
2236  17.2 pass: 1
2237  17.1 pass: 1
2238  17.1 pass: 1
2239  17.0 pass: 1
2240  17.0 pass: 1
2241  17.0 pass: 1
2242  16.9 pass: 1
2243  16.9 pass: 1
2244  16.8 pass: 1
2245  16.7 pass: 1
2246  16.7 pass: 1
2247  16.6 pass: 1
2248  16.6 pass: 1
2249  16.5 pass: 1
2250  23.1 pass: 1
2251  22.9 pass: 1
2252  22.8 pass: 1
2253  22.6 pass: 1
2254  22.5 pass: 1
2255  22.4 pass: 1
2256  22.2 pass: 1
2257  22.1 pass: 1
2258  22.0 pass: 1
2259  21.9 pass: 1
2260  21.8 pass: 1
2261  21.7 pass: 1
2262  21.6 pass: 1
2263  21.5 pass: 1
2264  21.4 pass: 1
2265  19.8 pass: 1
2266  19.8 pass: 1
2267  19.7 pass: 1
2268  19.7 pass: 1
2269  19.6 pass: 1
2270  19.6 pass: 1
2271  19.6 pass: 1
2272  19.5 pass: 1
2273  19.5 pass: 1
2274  19.5 p

2715  2716  2717  2718  2719  2720  2721  2722  2723  2724  2725  2726  2727  2728  2729  2730  2731  2732  2733  2734  2735  2736  2737  2738  2739  2740  2741  2742  2743  2744  2745  2746  2747  2748  2749  2750  2751  2752  2753  2754  2755  2756  2757  2758  2759  2760  2761  2762  2763  2764  2765  2766  2767  2768  2769  2770  2771  2772  2773  2774  2775  No data pass: 1
2776  No data pass: 1
2777  No data pass: 1
2778  No data pass: 1
2779  No data pass: 1
2780  No data pass: 1
2781  No data pass: 1
2782  No data pass: 1
2783  No data pass: 1
2784  No data pass: 1
2785  No data pass: 1
2786  No data pass: 1
2787  No data pass: 1
2788  No data pass: 1
2789  No data pass: 1
2790  19.9 pass: 1
2791  19.8 pass: 1
2792  19.7 pass: 1
2793  19.6 pass: 1
2794  19.5 pass: 1
2795  19.4 pass: 1
2796  19.3 pass: 1
2797  19.2 pass: 1
2798  19.2 pass: 1
2799  19.1 pass: 1
2800  19.1 pass: 1
2801  19.1 pass: 1
2802  19.0 pass: 1
2803  19.0 pass: 1
2804  18.9 pass: 1
2805  19.3 pass: 1
2806  

## BMI 18+ Years

In [122]:
bmi_18 = pd.read_csv("Data/New/BMI_18+/BMI_18+_Internet.csv")

In [123]:
bmi_18.rename(columns = {bmi_18.columns[0]: "Country"}, inplace=True)
bmi_18.head()

Unnamed: 0,Country,2016,2016.1,2016.2,2015,2015.1,2015.2,2014,2014.1,2014.2,...,1978.2,1977,1977.1,1977.2,1976,1976.1,1976.2,1975,1975.1,1975.2
0,Country,Both sexes,Male,Female,Both sexes,Male,Female,Both sexes,Male,Female,...,Female,Both sexes,Male,Female,Both sexes,Male,Female,Both sexes,Male,Female
1,Afghanistan,23.0 [21.6-24.4],22.3 [19.8-24.9],23.7 [22.8-24.6],22.9 [21.6-24.3],22.3 [19.8-24.8],23.6 [22.7-24.5],22.8 [21.5-24.2],22.2 [19.7-24.7],23.5 [22.7-24.3],...,19.3 [16.6-21.9],19.2 [17.3-21.0],19.2 [16.6-21.8],19.2 [16.4-21.8],19.1 [17.2-21.0],19.1 [16.5-21.8],19.1 [16.2-21.8],18.9 [17.0-20.9],19.0 [16.3-21.7],18.9 [16.0-21.8]
2,Albania,26.8 [25.9-27.6],27.0 [25.9-28.2],26.5 [25.2-27.9],26.7 [25.9-27.5],26.9 [25.8-28.0],26.4 [25.2-27.7],26.6 [25.8-27.3],26.8 [25.8-27.8],26.3 [25.2-27.5],...,23.5 [21.1-25.9],23.6 [22.1-25.2],23.7 [21.9-25.6],23.5 [21.0-26.0],23.6 [21.9-25.2],23.7 [21.7-25.7],23.5 [20.9-26.0],23.5 [21.8-25.2],23.6 [21.6-25.7],23.4 [20.7-26.1]
3,Algeria,25.6 [24.6-26.5],24.7 [23.3-26.0],26.5 [25.0-27.9],25.5 [24.5-26.4],24.6 [23.3-25.8],26.4 [25.0-27.7],25.3 [24.5-26.2],24.4 [23.3-25.5],26.3 [25.0-27.5],...,22.7 [20.4-25.0],21.9 [20.4-23.5],21.2 [19.3-23.1],22.6 [20.2-25.1],21.8 [20.2-23.5],21.1 [19.1-23.2],22.6 [20.0-25.1],21.8 [20.1-23.5],21.0 [19.0-23.2],22.5 [19.8-25.1]
4,Andorra,27.0 [24.9-29.1],27.6 [25.1-30.3],26.4 [23.0-29.8],27.0 [25.0-29.1],27.6 [25.2-30.1],26.5 [23.1-29.8],27.0 [25.0-29.1],27.6 [25.2-30.0],26.5 [23.2-29.7],...,26.1 [22.6-29.5],25.6 [23.5-27.8],25.2 [22.7-27.8],26.0 [22.5-29.5],25.6 [23.4-27.7],25.1 [22.5-27.8],25.9 [22.3-29.5],25.5 [23.2-27.7],25.0 [22.4-27.7],25.9 [22.2-29.4]


In [124]:
count = 0
bmi_18_data = pd.DataFrame(columns=['Country', 'Year', 'BMI_18+_years'])
for i in range(1, len(bmi_18['Country'].unique())):
    j = 1
    while j < len(bmi_18.columns):
        #print(bmi_18.loc[i,'Country'], end='')
        bmi_18_data.at[count, 'Country'] = bmi_18.loc[i,'Country']
        bmi_18_data.at[count, 'Year'] = bmi_18.columns[j]
       # print(bmi_18.columns[j])
        bmi_18_data.at[count, 'BMI_18+_years'] = bmi_18[bmi_18['Country'] == bmi_18['Country'][i]].T[1:].loc[bmi_18.columns[j]].values[0].split(' [')[0]
        count+=1
        j += 3

In [125]:
bmi_18_data.head()

Unnamed: 0,Country,Year,BMI_18+_years
0,Afghanistan,2016,23.0
1,Afghanistan,2015,22.9
2,Afghanistan,2014,22.8
3,Afghanistan,2013,22.8
4,Afghanistan,2012,22.7


In [126]:
bmi_18_data['Year'] = bmi_18_data['Year'].astype(np.int64)

In [127]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(bmi_18_data[bmi_18_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            bmi_18_other_data = bmi_18_data[bmi_18_data['Country'] == main_data['Country'][val]][bmi_18_data['Year'] == main_data['Year'][val]]['BMI_18+_years'].values[0]
            print(bmi_18_other_data, "pass: 1")
            main_data.at[val, 'BMI_18+_years'] = bmi_18_other_data
        except IndexError:
            pass
    else:
        try:
            bmi_18_other_data = bmi_18_data[bmi_18_data['Country'].str.startswith(main_data['Country'][val])][bmi_18_data['Year'] == main_data['Year'][val]]['BMI_18+_years'].values[0]
            print(bmi_18_other_data, "pass: 2")
            main_data.at[val, 'BMI_18+_years'] = bmi_18_other_data
        except IndexError:
            try:
                bmi_18_other_data = bmi_18_data[bmi_18_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][bmi_18_data['Year'] == main_data['Year'][val]]['BMI_18+_years'].values[0]
                print(bmi_18_other_data, "pass: 3")
                main_data.at[val, 'BMI_18+_years'] = bmi_18_other_data
            except IndexError:
                pass

0  22.8 pass: 1
1  22.8 pass: 1
2  22.7 pass: 1
3  22.6 pass: 1
4  22.5 pass: 1
5  22.4 pass: 1
6  22.3 pass: 1
7  22.2 pass: 1
8  22.1 pass: 1
9  22.0 pass: 1
10  21.9 pass: 1
11  21.8 pass: 1
12  21.7 pass: 1
13  21.6 pass: 1
14  21.5 pass: 1
15  26.6 pass: 1
16  26.5 pass: 1
17  26.4 pass: 1
18  26.3 pass: 1
19  26.2 pass: 1
20  26.1 pass: 1
21  26.0 pass: 1
22  25.9 pass: 1
23  25.8 pass: 1
24  25.6 pass: 1
25  25.5 pass: 1
26  25.4 pass: 1
27  25.3 pass: 1
28  25.2 pass: 1
29  25.1 pass: 1
30  25.3 pass: 1
31  25.2 pass: 1
32  25.1 pass: 1
33  25.0 pass: 1
34  24.9 pass: 1
35  24.8 pass: 1
36  24.7 pass: 1
37  24.6 pass: 1
38  24.6 pass: 1
39  24.5 pass: 1
40  24.4 pass: 1
41  24.3 pass: 1
42  24.2 pass: 1
43  24.1 pass: 1
44  24.0 pass: 1
45  46  47  48  49  50  51  52  53  54  55  56  57  

  """
  if sys.path[0] == '':


58  59  60  27.0 pass: 1
61  27.0 pass: 1
62  27.0 pass: 1
63  27.0 pass: 1
64  27.0 pass: 1
65  27.0 pass: 1
66  27.0 pass: 1
67  27.0 pass: 1
68  27.0 pass: 1
69  26.9 pass: 1
70  26.9 pass: 1
71  26.9 pass: 1
72  26.8 pass: 1
73  26.8 pass: 1
74  26.8 pass: 1
75  22.8 pass: 1
76  22.8 pass: 1
77  22.7 pass: 1
78  22.6 pass: 1
79  22.5 pass: 1
80  22.4 pass: 1
81  22.3 pass: 1
82  22.2 pass: 1
83  22.1 pass: 1
84  22.0 pass: 1
85  21.9 pass: 1
86  21.8 pass: 1
87  21.7 pass: 1
88  21.6 pass: 1
89  21.5 pass: 1
90  26.5 pass: 1
91  26.4 pass: 1
92  26.3 pass: 1
93  26.2 pass: 1
94  26.1 pass: 1
95  26.0 pass: 1
96  25.9 pass: 1
97  25.8 pass: 1
98  25.7 pass: 1
99  25.6 pass: 1
100  25.5 pass: 1
101  25.4 pass: 1
102  25.2 pass: 1
103  25.1 pass: 1
104  25.0 pass: 1
105  27.5 pass: 1
106  27.4 pass: 1
107  27.3 pass: 1
108  27.2 pass: 1
109  27.1 pass: 1
110  27.0 pass: 1
111  26.9 pass: 1
112  26.8 pass: 1
113  26.7 pass: 1
114  26.6 pass: 1
115  26.5 pass: 1
116  26.4 pass: 1
117  2

602  27.7 pass: 1
603  27.6 pass: 1
604  27.5 pass: 1
605  27.4 pass: 1
606  27.3 pass: 1
607  27.2 pass: 1
608  27.1 pass: 1
609  27.0 pass: 1
610  26.9 pass: 1
611  26.9 pass: 1
612  26.8 pass: 1
613  26.7 pass: 1
614  26.6 pass: 1
615  23.7 pass: 1
616  23.6 pass: 1
617  23.5 pass: 1
618  23.4 pass: 1
619  23.3 pass: 1
620  23.2 pass: 1
621  23.1 pass: 1
622  23.0 pass: 1
623  22.9 pass: 1
624  22.8 pass: 1
625  22.7 pass: 1
626  22.6 pass: 1
627  22.5 pass: 1
628  22.5 pass: 1
629  22.4 pass: 1
630  26.0 pass: 1
631  25.9 pass: 1
632  25.8 pass: 1
633  25.7 pass: 1
634  25.6 pass: 1
635  25.5 pass: 1
636  25.4 pass: 1
637  25.3 pass: 1
638  25.2 pass: 1
639  25.1 pass: 1
640  25.0 pass: 1
641  24.9 pass: 1
642  24.8 pass: 1
643  24.7 pass: 1
644  24.6 pass: 1
645  24.2 pass: 1
646  24.1 pass: 1
647  24.0 pass: 1
648  23.9 pass: 1
649  23.8 pass: 1
650  23.7 pass: 1
651  23.5 pass: 1
652  23.4 pass: 1
653  23.3 pass: 1
654  23.2 pass: 1
655  23.1 pass: 1
656  23.0 pass: 1
657  22.9 

1125  1126  1127  1128  1129  1130  1131  1132  1133  1134  1135  1136  1137  1138  1139  1140  27.7 pass: 1
1141  27.7 pass: 1
1142  27.6 pass: 1
1143  27.6 pass: 1
1144  27.6 pass: 1
1145  27.5 pass: 1
1146  27.5 pass: 1
1147  27.4 pass: 1
1148  27.4 pass: 1
1149  27.3 pass: 1
1150  27.3 pass: 1
1151  27.2 pass: 1
1152  27.1 pass: 1
1153  27.1 pass: 1
1154  27.0 pass: 1
1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  26.6 pass: 1
1171  26.5 pass: 1
1172  26.3 pass: 1
1173  26.2 pass: 1
1174  26.1 pass: 1
1175  26.0 pass: 1
1176  25.9 pass: 1
1177  25.8 pass: 1
1178  25.7 pass: 1
1179  25.6 pass: 1
1180  25.5 pass: 1
1181  25.4 pass: 1
1182  25.3 pass: 1
1183  25.2 pass: 1
1184  25.1 pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  26.1 pass: 1
1201  26.0 pass: 1
1202  25.9 pass: 1
1203  25.8 pass: 1
1204  25.7 pass: 1
1205  25.6 pass: 1
1206  25.5 pass: 1
1207  25.4 pass: 1
1208  25

1710  1711  1712  1713  1714  1715  1716  1717  1718  1719  1720  1721  1722  1723  1724  1725  26.9 pass: 1
1726  26.9 pass: 1
1727  26.8 pass: 1
1728  26.8 pass: 1
1729  26.8 pass: 1
1730  26.7 pass: 1
1731  26.7 pass: 1
1732  26.7 pass: 1
1733  26.6 pass: 1
1734  26.6 pass: 1
1735  26.6 pass: 1
1736  26.5 pass: 1
1737  26.5 pass: 1
1738  26.4 pass: 1
1739  26.4 pass: 1
1740  26.7 pass: 1
1741  26.7 pass: 1
1742  26.6 pass: 1
1743  26.6 pass: 1
1744  26.6 pass: 1
1745  26.5 pass: 1
1746  26.5 pass: 1
1747  26.4 pass: 1
1748  26.4 pass: 1
1749  26.3 pass: 1
1750  26.3 pass: 1
1751  26.2 pass: 1
1752  26.1 pass: 1
1753  26.0 pass: 1
1754  25.9 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  21.2 pass: 1
1771  21.1 pass: 1
1772  21.1 pass: 1
1773  21.1 pass: 1
1774  21.0 pass: 1
1775  21.0 pass: 1
1776  20.9 pass: 1
1777  20.9 pass: 1
1778  20.9 pass: 1
1779  20.8 pass: 1
1780  20.8 pass: 1
1781  20.7 pass: 1
1782  20.7 pass: 1
178

2175  2176  2177  2178  2179  2180  2181  2182  2183  2184  2185  2186  2187  2188  2189  2190  2191  2192  2193  2194  2195  2196  2197  2198  2199  2200  2201  2202  2203  2204  2205  27.0 pass: 1
2206  26.9 pass: 1
2207  26.8 pass: 1
2208  26.8 pass: 1
2209  26.7 pass: 1
2210  26.7 pass: 1
2211  26.6 pass: 1
2212  26.5 pass: 1
2213  26.5 pass: 1
2214  26.4 pass: 1
2215  26.3 pass: 1
2216  26.2 pass: 1
2217  26.1 pass: 1
2218  26.0 pass: 1
2219  25.9 pass: 1
2220  25.9 pass: 1
2221  25.8 pass: 1
2222  25.8 pass: 1
2223  25.7 pass: 1
2224  25.7 pass: 1
2225  25.6 pass: 1
2226  25.6 pass: 1
2227  25.6 pass: 1
2228  25.5 pass: 1
2229  25.5 pass: 1
2230  25.4 pass: 1
2231  25.4 pass: 1
2232  25.3 pass: 1
2233  25.2 pass: 1
2234  25.2 pass: 1
2235  23.6 pass: 1
2236  23.5 pass: 1
2237  23.4 pass: 1
2238  23.3 pass: 1
2239  23.2 pass: 1
2240  23.1 pass: 1
2241  23.0 pass: 1
2242  22.9 pass: 1
2243  22.9 pass: 1
2244  22.8 pass: 1
2245  22.7 pass: 1
2246  22.6 pass: 1
2247  22.5 pass: 1
224

2687  26.6 pass: 1
2688  26.6 pass: 1
2689  26.6 pass: 1
2690  26.6 pass: 1
2691  26.6 pass: 1
2692  26.6 pass: 1
2693  26.6 pass: 1
2694  26.6 pass: 1
2695  26.6 pass: 1
2696  26.5 pass: 1
2697  26.5 pass: 1
2698  26.5 pass: 1
2699  26.4 pass: 1
2700  23.0 pass: 1
2701  22.9 pass: 1
2702  22.7 pass: 1
2703  22.6 pass: 1
2704  22.5 pass: 1
2705  22.4 pass: 1
2706  22.3 pass: 1
2707  22.2 pass: 1
2708  22.1 pass: 1
2709  22.0 pass: 1
2710  21.9 pass: 1
2711  21.8 pass: 1
2712  21.7 pass: 1
2713  21.6 pass: 1
2714  21.5 pass: 1
2715  2716  2717  2718  2719  2720  2721  2722  2723  2724  2725  2726  2727  2728  2729  2730  2731  2732  2733  2734  2735  2736  2737  2738  2739  2740  2741  2742  2743  2744  2745  2746  2747  2748  2749  2750  2751  2752  2753  2754  2755  2756  2757  2758  2759  2760  2761  2762  2763  2764  2765  2766  2767  2768  2769  2770  2771  2772  2773  2774  2775  No data pass: 1
2776  No data pass: 1
2777  No data pass: 1
2778  No data pass: 1
2779  No data pass: 

3165  3166  3167  3168  3169  3170  3171  3172  3173  3174  3175  3176  3177  3178  3179  3180  3181  3182  3183  3184  3185  3186  3187  3188  3189  3190  3191  3192  3193  3194  3195  3196  3197  3198  3199  3200  3201  3202  3203  3204  3205  3206  3207  3208  3209  3210  23.2 pass: 3
3211  23.1 pass: 3
3212  23.0 pass: 3
3213  22.9 pass: 3
3214  22.8 pass: 3
3215  22.7 pass: 3
3216  22.7 pass: 3
3217  22.6 pass: 3
3218  22.5 pass: 3
3219  22.4 pass: 3
3220  22.4 pass: 3
3221  22.3 pass: 3
3222  22.2 pass: 3
3223  22.1 pass: 3
3224  22.1 pass: 3
3225  22.1 pass: 1
3226  22.0 pass: 1
3227  21.9 pass: 1
3228  21.9 pass: 1
3229  21.8 pass: 1
3230  21.7 pass: 1
3231  21.7 pass: 1
3232  21.6 pass: 1
3233  21.5 pass: 1
3234  21.5 pass: 1
3235  21.4 pass: 1
3236  21.4 pass: 1
3237  21.3 pass: 1
3238  21.3 pass: 1
3239  21.2 pass: 1
3240  23.3 pass: 1
3241  23.2 pass: 1
3242  23.2 pass: 1
3243  23.2 pass: 1
3244  23.2 pass: 1
3245  23.1 pass: 1
3246  23.1 pass: 1
3247  23.1 pass: 1
3248  23

In [128]:
main_data.head()

Unnamed: 0,Country,Year,Status,Life_Expectancy,Adult_Mortality,Infant_Deaths,Alcohol,Percentage_Expenditure,Measles,BMI_5-19_years,...,Under-Five_Deaths,Polio,Total_Expenditure,Diphtheria,GDP,Population,Thinness_10-19_years,Thinness_5-9_years,Income_Composition_Of_Resources,Schooling
0,Afghanistan,2014,Low income,63.0,234,64,0.03,9.7,492,17.2,...,86,58,12.0,62,625.34,32758020.0,17.7,17.7,0.441,
1,Afghanistan,2013,Low income,62.7,235,66,0.03,8.8,430,17.1,...,89,62,10.59,64,647.966,31731688.0,17.9,18.0,0.443,
2,Afghanistan,2012,Low income,62.2,242,69,0.04,7.9,2787,17.0,...,93,67,11.67,67,648.511,30696958.0,18.2,18.2,0.442,
3,Afghanistan,2011,Low income,61.7,248,71,0.04,8.6,3013,16.9,...,97,68,10.17,68,599.298,29708599.0,18.4,18.4,0.426,
4,Afghanistan,2010,Low income,61.2,255,74,0.03,8.6,1989,16.8,...,101,66,14.4,66,550.515,28803167.0,18.6,18.7,0.421,


## SCHOOLING

In [129]:
school = pd.read_csv("Data/New/Education/Education_Internet.csv")

In [130]:
count = 0
school_data = pd.DataFrame(columns=['Country', 'Year', 'Schooling'])
for i in range(0, len(school['Country'].unique())):
    for j in range(1, len(school.columns)):
        #print(school.loc[i,'Country'], end='')
        # Space before a word by default in the dataset
        school_data.at[count, 'Country'] = school.loc[i,'Country'].split(' ',1)[1]
        school_data.at[count, 'Year'] = school.columns[j]
        #print(school.columns[j])
        school_data.at[count, 'Schooling'] = school[school['Country'] == school['Country'][i]].T[1:].loc[school.columns[j]].values[0]
        count+=1

In [131]:
school_data['Year'] = school_data['Year'].astype(np.int64)

In [132]:
for val in main_data['Country'].index:
    print(val,' ',end='')
    if len(school_data[school_data['Country'] == main_data['Country'][val]].values) != 0:
        try:
            school_other_data = school_data[school_data['Country'] == main_data['Country'][val]][school_data['Year'] == main_data['Year'][val]]['Schooling'].values[0]
            print(school_other_data, "pass: 1")
            main_data.at[val, 'Schooling'] = school_other_data
        except IndexError:
            pass
    else:
        try:
            school_other_data = school_data[school_data['Country'].str.startswith(main_data['Country'][val])][school_data['Year'] == main_data['Year'][val]]['Schooling'].values[0]
            print(school_other_data, "pass: 2")
            main_data.at[val, 'Schooling'] = school_other_data
        except IndexError:
            try:
                school_other_data = school_data[school_data['Country'].str.startswith(main_data['Country'][val].split(',')[0])][school_data['Year'] == main_data['Year'][val]]['Schooling'].values[0]
                print(school_other_data, "pass: 3")
                main_data.at[val, 'Schooling'] = school_other_data
            except IndexError:
                pass

0  3.5 pass: 1
1  3.5 pass: 1
2  3.4 pass: 1
3  3.3 pass: 1
4  3.2 pass: 1
5  3.1 pass: 1
6  3.0 pass: 1
7  2.9 pass: 1
8  2.7 pass: 1
9  2.6 pass: 1
10  2.5 pass: 1
11  2.4 pass: 1
12  2.3 pass: 1
13  2.2 pass: 1
14  2.2 pass: 1
15  9.7 pass: 1
16  9.7 pass: 1
17  9.6 pass: 1
18  9.3 pass: 1
19  9.3 pass: 1
20  9.3 pass: 1
21  9.2 pass: 1
22  9.2 pass: 1
23  9.2 pass: 1
24  9.1 pass: 1
25  9.1 pass: 1
26  9.0 pass: 1
27  9.0 pass: 1
28  8.7 pass: 1
29  8.8 pass: 1
30  7.9 pass: 1
31  7.8 pass: 1
32  7.6 pass: 1
33  7.4 pass: 1
34  7.1 pass: 1
35  6.9 pass: 1
36  6.7 pass: 1
37  7.2 pass: 1
38  7.0 pass: 1
39  6.9 pass: 1
40  6.7 pass: 1
41  6.5 pass: 1
42  6.3 pass: 1
43  6.1 pass: 1
44  5.9 pass: 1
45  46  47  48  49  

  """
  if sys.path[0] == '':


50  51  52  53  54  55  56  57  58  59  60  10.2 pass: 1
61  10.2 pass: 1
62  10.2 pass: 1
63  10.2 pass: 1
64  10.1 pass: 1
65  10.1 pass: 1
66  10.1 pass: 1
67  10.1 pass: 1
68  10.1 pass: 1
69  9.8 pass: 1
70  10.5 pass: 1
71  10.1 pass: 1
72  7.6 pass: 1
73  7.1 pass: 1
74  6.7 pass: 1
75  4.9 pass: 1
76  4.9 pass: 1
77  4.8 pass: 1
78  4.7 pass: 1
79  4.7 pass: 1
80  4.7 pass: 1
81  4.6 pass: 1
82  4.5 pass: 1
83  4.5 pass: 1
84  4.4 pass: 1
85  4.4 pass: 1
86  4.4 pass: 1
87  4.4 pass: 1
88  4.4 pass: 1
89  4.4 pass: 1
90  9.2 pass: 1
91  9.2 pass: 1
92  9.2 pass: 1
93  9.2 pass: 1
94  9.2 pass: 1
95  9.3 pass: 1
96  9.3 pass: 1
97  9.2 pass: 1
98  9.2 pass: 1
99  9.1 pass: 1
100  9.1 pass: 1
101  9.0 pass: 1
102  9.0 pass: 1
103  8.9 pass: 1
104  7.0 pass: 1
105  9.8 pass: 1
106  9.8 pass: 1
107  9.8 pass: 1
108  9.8 pass: 1
109  9.8 pass: 1
110  9.3 pass: 1
111  8.9 pass: 1
112  8.9 pass: 1
113  9.0 pass: 1
114  9.1 pass: 1
115  9.2 pass: 1
116  9.3 pass: 1
117  9.2 pass: 1
118

585  586  587  588  589  590  591  592  593  594  595  596  597  598  599  600  10.1 pass: 1
601  9.9 pass: 1
602  9.9 pass: 1
603  9.8 pass: 1
604  9.8 pass: 1
605  9.9 pass: 1
606  9.9 pass: 1
607  9.4 pass: 1
608  9.5 pass: 1
609  9.5 pass: 1
610  9.6 pass: 1
611  9.4 pass: 1
612  9.2 pass: 1
613  9.0 pass: 1
614  8.8 pass: 1
615  7.6 pass: 1
616  7.5 pass: 1
617  7.5 pass: 1
618  7.4 pass: 1
619  7.3 pass: 1
620  7.1 pass: 1
621  7.0 pass: 1
622  7.0 pass: 1
623  6.9 pass: 1
624  6.9 pass: 1
625  6.8 pass: 1
626  6.7 pass: 1
627  6.6 pass: 1
628  6.5 pass: 1
629  6.5 pass: 1
630  8.0 pass: 1
631  7.8 pass: 1
632  7.6 pass: 1
633  7.5 pass: 1
634  7.4 pass: 1
635  7.3 pass: 1
636  7.3 pass: 1
637  7.2 pass: 1
638  6.7 pass: 1
639  6.8 pass: 1
640  6.6 pass: 1
641  6.5 pass: 1
642  6.5 pass: 1
643  6.5 pass: 1
644  6.5 pass: 1
645  4.8 pass: 1
646  4.7 pass: 1
647  4.6 pass: 1
648  4.4 pass: 1
649  4.2 pass: 1
650  3.9 pass: 1
651  3.7 pass: 1
652  3.5 pass: 1
653  3.3 pass: 1
654  3

1155  1156  1157  1158  1159  1160  1161  1162  1163  1164  1165  1166  1167  1168  1169  1170  8.6 pass: 1
1171  8.5 pass: 1
1172  8.4 pass: 1
1173  8.4 pass: 1
1174  8.3 pass: 1
1175  8.2 pass: 1
1176  8.1 pass: 1
1177  8.0 pass: 1
1178  7.9 pass: 1
1179  7.8 pass: 1
1180  7.7 pass: 1
1181  7.6 pass: 1
1182  7.4 pass: 1
1183  nan pass: 1
1184  nan pass: 1
1185  1186  1187  1188  1189  1190  1191  1192  1193  1194  1195  1196  1197  1198  1199  1200  6.4 pass: 1
1201  4.7 pass: 1
1202  4.6 pass: 1
1203  5.3 pass: 1
1204  4.9 pass: 1
1205  4.6 pass: 1
1206  4.3 pass: 1
1207  3.9 pass: 1
1208  3.7 pass: 1
1209  3.5 pass: 1
1210  3.6 pass: 1
1211  3.7 pass: 1
1212  3.8 pass: 1
1213  3.8 pass: 1
1214  3.7 pass: 1
1215  2.6 pass: 1
1216  2.6 pass: 1
1217  2.4 pass: 1
1218  2.0 pass: 1
1219  1.6 pass: 1
1220  1.6 pass: 1
1221  1.6 pass: 1
1222  1.6 pass: 1
1223  1.6 pass: 1
1224  1.6 pass: 1
1225  1.6 pass: 1
1226  1.5 pass: 1
1227  1.5 pass: 1
1228  1.5 pass: 1
1229  1.5 pass: 1
1230  2.9 

1729  11.6 pass: 1
1730  11.5 pass: 1
1731  12.2 pass: 1
1732  12.1 pass: 1
1733  12.0 pass: 1
1734  11.8 pass: 1
1735  11.5 pass: 1
1736  11.3 pass: 1
1737  11.1 pass: 1
1738  10.9 pass: 1
1739  10.7 pass: 1
1740  12.0 pass: 1
1741  11.8 pass: 1
1742  11.8 pass: 1
1743  11.8 pass: 1
1744  11.8 pass: 1
1745  11.8 pass: 1
1746  11.7 pass: 1
1747  11.7 pass: 1
1748  11.5 pass: 1
1749  11.3 pass: 1
1750  11.1 pass: 1
1751  10.9 pass: 1
1752  10.7 pass: 1
1753  10.5 pass: 1
1754  10.3 pass: 1
1755  1756  1757  1758  1759  1760  1761  1762  1763  1764  1765  1766  1767  1768  1769  1770  6.1 pass: 1
1771  6.1 pass: 1
1772  6.1 pass: 1
1773  6.1 pass: 1
1774  6.0 pass: 1
1775  5.9 pass: 1
1776  5.9 pass: 1
1777  5.8 pass: 1
1778  5.7 pass: 1
1779  5.6 pass: 1
1780  5.5 pass: 1
1781  5.4 pass: 1
1782  5.3 pass: 1
1783  5.2 pass: 1
1784  5.2 pass: 1
1785  4.4 pass: 1
1786  4.4 pass: 1
1787  4.3 pass: 1
1788  4.3 pass: 1
1789  4.3 pass: 1
1790  4.1 pass: 1
1791  3.9 pass: 1
1792  3.8 pass: 1
17

2259  11.4 pass: 1
2260  11.4 pass: 1
2261  11.4 pass: 1
2262  11.4 pass: 1
2263  11.4 pass: 1
2264  11.4 pass: 1
2265  9.9 pass: 1
2266  9.7 pass: 1
2267  9.5 pass: 1
2268  9.3 pass: 1
2269  9.3 pass: 1
2270  9.3 pass: 1
2271  9.2 pass: 1
2272  9.2 pass: 1
2273  9.1 pass: 1
2274  9.0 pass: 1
2275  8.9 pass: 1
2276  8.8 pass: 1
2277  8.7 pass: 1
2278  8.6 pass: 1
2279  8.5 pass: 1
2280  4.3 pass: 1
2281  4.3 pass: 1
2282  4.2 pass: 1
2283  4.1 pass: 1
2284  4.0 pass: 1
2285  3.9 pass: 1
2286  3.8 pass: 1
2287  3.7 pass: 1
2288  3.6 pass: 1
2289  3.5 pass: 1
2290  3.5 pass: 1
2291  3.4 pass: 1
2292  3.4 pass: 1
2293  3.3 pass: 1
2294  3.3 pass: 1
2295  8.2 pass: 1
2296  8.3 pass: 1
2297  7.8 pass: 1
2298  7.8 pass: 1
2299  7.7 pass: 1
2300  7.0 pass: 1
2301  7.4 pass: 1
2302  7.1 pass: 1
2303  7.1 pass: 1
2304  7.3 pass: 1
2305  7.1 pass: 1
2306  7.0 pass: 1
2307  6.5 pass: 1
2308  6.2 pass: 1
2309  5.9 pass: 1
2310  9.4 pass: 1
2311  8.8 pass: 1
2312  8.6 pass: 1
2313  9.1 pass: 1
2314

2791  8.1 pass: 1
2792  7.9 pass: 1
2793  7.8 pass: 1
2794  7.7 pass: 1
2795  7.7 pass: 1
2796  7.7 pass: 1
2797  7.7 pass: 1
2798  7.7 pass: 1
2799  7.7 pass: 1
2800  7.7 pass: 1
2801  nan pass: 1
2802  nan pass: 1
2803  nan pass: 1
2804  nan pass: 1
2805  12.3 pass: 1
2806  12.2 pass: 1
2807  12.4 pass: 1
2808  12.4 pass: 1
2809  12.3 pass: 1
2810  12.2 pass: 1
2811  12.2 pass: 1
2812  12.5 pass: 1
2813  12.4 pass: 1
2814  12.4 pass: 1
2815  12.3 pass: 1
2816  11.8 pass: 1
2817  11.6 pass: 1
2818  11.5 pass: 1
2819  11.4 pass: 1
2820  13.4 pass: 1
2821  13.4 pass: 1
2822  13.4 pass: 1
2823  13.3 pass: 1
2824  13.3 pass: 1
2825  13.3 pass: 1
2826  12.9 pass: 1
2827  12.6 pass: 1
2828  12.3 pass: 1
2829  12.0 pass: 1
2830  11.9 pass: 1
2831  11.8 pass: 1
2832  11.7 pass: 1
2833  11.6 pass: 1
2834  11.4 pass: 1
2835  5.6 pass: 1
2836  6.3 pass: 1
2837  6.3 pass: 1
2838  6.3 pass: 1
2839  6.3 pass: 1
2840  6.6 pass: 1
2841  6.3 pass: 1
2842  6.5 pass: 1
2843  6.2 pass: 1
2844  5.8 pass: 

In [133]:
#school_data[school_data['Country'] == "Zimbabwe"]

In [134]:
#main_data[['Country','Year','Schooling']]

## Changing "No Data" to "NaNs"

In [135]:
# Replace "No Data" with "NaNs"
for i in range(0, len(main_data.columns)):
    for j in range(0, len(main_data)):
        value = main_data[main_data.columns[i]].tolist()[j]
        if value == "No data" or value == "No Data":
                main_data.at[j, main_data.columns[i]] = np.nan

## SAVING MAIN_DATA AS PICKLE and CSV DATASET

In [136]:
# Final save
pd.to_pickle(main_data, "Data/New/Main_Data/Dataset.pkl")

In [137]:
# Final save
main_data.to_csv("Data/New/Main_Data/Dataset.csv",index=False)

In [138]:
main_data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 3255 entries, 0 to 3254
Data columns (total 21 columns):
Country                            3255 non-null object
Year                               3255 non-null int64
Status                             3180 non-null object
Life_Expectancy                    2565 non-null object
Adult_Mortality                    2565 non-null object
Infant_Deaths                      2670 non-null object
Alcohol                            2581 non-null object
Percentage_Expenditure             2621 non-null object
Measles                            2494 non-null object
BMI_5-19_years                     2610 non-null object
BMI_18+_years                      2610 non-null object
Under-Five_Deaths                  2670 non-null object
Polio                              2651 non-null object
Total_Expenditure                  2633 non-null object
Diphtheria                         2651 non-null object
GDP                                3045 non-null objec