In [1]:
import pandas as pd
import os
import matplotlib.pyplot as plt
import scipy.stats as st
import numpy as np
from geopy.geocoders import Nominatim

In [2]:
!pip install geopy



In [3]:
# Initialize Nominatim API
geolocator = Nominatim(user_agent="MyApp")

In [4]:
df_mh_subst_use = pd.read_csv("Resources/mental-and-substance-use-as-share-of-disease.csv")

In [5]:
df_mh_subst_use["Entity"].unique()

array(['Afghanistan', 'African Region (WHO)', 'Albania', 'Algeria',
       'American Samoa', 'Andorra', 'Angola', 'Antigua and Barbuda',
       'Argentina', 'Armenia', 'Australia', 'Austria', 'Azerbaijan',
       'Bahamas', 'Bahrain', 'Bangladesh', 'Barbados', 'Belarus',
       'Belgium', 'Belize', 'Benin', 'Bermuda', 'Bhutan', 'Bolivia',
       'Bosnia and Herzegovina', 'Botswana', 'Brazil', 'Brunei',
       'Bulgaria', 'Burkina Faso', 'Burundi', 'Cambodia', 'Cameroon',
       'Canada', 'Cape Verde', 'Central African Republic', 'Chad',
       'Chile', 'China', 'Colombia', 'Comoros', 'Congo', 'Cook Islands',
       'Costa Rica', "Cote d'Ivoire", 'Croatia', 'Cuba', 'Cyprus',
       'Czechia', 'Democratic Republic of Congo', 'Denmark', 'Djibouti',
       'Dominica', 'Dominican Republic', 'East Asia & Pacific (WB)',
       'Eastern Mediterranean Region (WHO)', 'Ecuador', 'Egypt',
       'El Salvador', 'England', 'Equatorial Guinea', 'Eritrea',
       'Estonia', 'Eswatini', 'Ethiopia', 'Eu

In [6]:
df_mh_subst_use.head()

Unnamed: 0,Entity,Code,Year,DALYs (Disability-Adjusted Life Years) - Mental disorders - Sex: Both - Age: All Ages (Percent)
0,Afghanistan,AFG,1990,1.69667
1,Afghanistan,AFG,1991,1.734281
2,Afghanistan,AFG,1992,1.791189
3,Afghanistan,AFG,1993,1.776779
4,Afghanistan,AFG,1994,1.712986


In [7]:
df_mh_subst_use.shape

(6840, 4)

In [8]:
def get_lat_lon(country):
    
    try:
        location = geolocator.geocode(country)
        return location.latitude, location.longitude
    except:
        return np.nan

In [9]:
countries = df_mh_subst_use["Entity"].unique()

In [10]:
countries_lat_lon = {}

for c in countries:
    print("country: ", c)
    countries_lat_lon[c] = get_lat_lon(c)

country:  Afghanistan
country:  African Region (WHO)
country:  Albania
country:  Algeria
country:  American Samoa
country:  Andorra
country:  Angola
country:  Antigua and Barbuda
country:  Argentina
country:  Armenia
country:  Australia
country:  Austria
country:  Azerbaijan
country:  Bahamas
country:  Bahrain
country:  Bangladesh
country:  Barbados
country:  Belarus
country:  Belgium
country:  Belize
country:  Benin
country:  Bermuda
country:  Bhutan
country:  Bolivia
country:  Bosnia and Herzegovina
country:  Botswana
country:  Brazil
country:  Brunei
country:  Bulgaria
country:  Burkina Faso
country:  Burundi
country:  Cambodia
country:  Cameroon
country:  Canada
country:  Cape Verde
country:  Central African Republic
country:  Chad
country:  Chile
country:  China
country:  Colombia
country:  Comoros
country:  Congo
country:  Cook Islands
country:  Costa Rica
country:  Cote d'Ivoire
country:  Croatia
country:  Cuba
country:  Cyprus
country:  Czechia
country:  Democratic Republic of 

In [11]:
countries_lat_lon

{'Afghanistan': (33.7680065, 66.2385139),
 'African Region (WHO)': nan,
 'Albania': (41.000028, 19.9999619),
 'Algeria': (28.0000272, 2.9999825),
 'American Samoa': (-14.297124, -170.7131481),
 'Andorra': (42.5407167, 1.5732033),
 'Angola': (-11.8775768, 17.5691241),
 'Antigua and Barbuda': (17.2234721, -61.9554608),
 'Argentina': (-34.9964963, -64.9672817),
 'Armenia': (40.7696272, 44.6736646),
 'Australia': (-24.7761086, 134.755),
 'Austria': (47.59397, 14.12456),
 'Azerbaijan': (40.3936294, 47.7872508),
 'Bahamas': (24.7736546, -78.0000547),
 'Bahrain': (26.1551249, 50.5344606),
 'Bangladesh': (24.4769288, 90.2934413),
 'Barbados': (13.1500331, -59.5250305),
 'Belarus': (53.4250605, 27.6971358),
 'Belgium': (50.6402809, 4.6667145),
 'Belize': (16.8259793, -88.7600927),
 'Benin': (9.5293472, 2.2584408),
 'Bermuda': (32.30382, -64.7561647),
 'Bhutan': (27.549511, 90.5119273),
 'Bolivia': (-17.0568696, -64.9912286),
 'Bosnia and Herzegovina': (44.3053476, 17.5961467),
 'Botswana': (-23

In [12]:
df_mh_subst_use.head()

Unnamed: 0,Entity,Code,Year,DALYs (Disability-Adjusted Life Years) - Mental disorders - Sex: Both - Age: All Ages (Percent)
0,Afghanistan,AFG,1990,1.69667
1,Afghanistan,AFG,1991,1.734281
2,Afghanistan,AFG,1992,1.791189
3,Afghanistan,AFG,1993,1.776779
4,Afghanistan,AFG,1994,1.712986


In [13]:
df_mh_subst_use["lat_lon"] = df_mh_subst_use["Entity"].map(countries_lat_lon)

In [14]:
df_mh_subst_use

Unnamed: 0,Entity,Code,Year,DALYs (Disability-Adjusted Life Years) - Mental disorders - Sex: Both - Age: All Ages (Percent),lat_lon
0,Afghanistan,AFG,1990,1.696670,"(33.7680065, 66.2385139)"
1,Afghanistan,AFG,1991,1.734281,"(33.7680065, 66.2385139)"
2,Afghanistan,AFG,1992,1.791189,"(33.7680065, 66.2385139)"
3,Afghanistan,AFG,1993,1.776779,"(33.7680065, 66.2385139)"
4,Afghanistan,AFG,1994,1.712986,"(33.7680065, 66.2385139)"
...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,2.193166,"(-18.4554963, 29.7468414)"
6836,Zimbabwe,ZWE,2016,2.279813,"(-18.4554963, 29.7468414)"
6837,Zimbabwe,ZWE,2017,2.364265,"(-18.4554963, 29.7468414)"
6838,Zimbabwe,ZWE,2018,2.472949,"(-18.4554963, 29.7468414)"


In [15]:
discard_indexes = df_mh_subst_use[df_mh_subst_use["lat_lon"].isnull()].index
df_mh_subst_use = df_mh_subst_use.drop(discard_indexes)

In [16]:
df_mh_subst_use

Unnamed: 0,Entity,Code,Year,DALYs (Disability-Adjusted Life Years) - Mental disorders - Sex: Both - Age: All Ages (Percent),lat_lon
0,Afghanistan,AFG,1990,1.696670,"(33.7680065, 66.2385139)"
1,Afghanistan,AFG,1991,1.734281,"(33.7680065, 66.2385139)"
2,Afghanistan,AFG,1992,1.791189,"(33.7680065, 66.2385139)"
3,Afghanistan,AFG,1993,1.776779,"(33.7680065, 66.2385139)"
4,Afghanistan,AFG,1994,1.712986,"(33.7680065, 66.2385139)"
...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,2.193166,"(-18.4554963, 29.7468414)"
6836,Zimbabwe,ZWE,2016,2.279813,"(-18.4554963, 29.7468414)"
6837,Zimbabwe,ZWE,2017,2.364265,"(-18.4554963, 29.7468414)"
6838,Zimbabwe,ZWE,2018,2.472949,"(-18.4554963, 29.7468414)"


In [17]:
df_mh_subst_use["latitude"] = df_mh_subst_use["lat_lon"].map(lambda x: x[0])
df_mh_subst_use["longitude"] = df_mh_subst_use["lat_lon"].map(lambda x: x[1])

In [18]:
df_mh_subst_use

Unnamed: 0,Entity,Code,Year,DALYs (Disability-Adjusted Life Years) - Mental disorders - Sex: Both - Age: All Ages (Percent),lat_lon,latitude,longitude
0,Afghanistan,AFG,1990,1.696670,"(33.7680065, 66.2385139)",33.768006,66.238514
1,Afghanistan,AFG,1991,1.734281,"(33.7680065, 66.2385139)",33.768006,66.238514
2,Afghanistan,AFG,1992,1.791189,"(33.7680065, 66.2385139)",33.768006,66.238514
3,Afghanistan,AFG,1993,1.776779,"(33.7680065, 66.2385139)",33.768006,66.238514
4,Afghanistan,AFG,1994,1.712986,"(33.7680065, 66.2385139)",33.768006,66.238514
...,...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,2.193166,"(-18.4554963, 29.7468414)",-18.455496,29.746841
6836,Zimbabwe,ZWE,2016,2.279813,"(-18.4554963, 29.7468414)",-18.455496,29.746841
6837,Zimbabwe,ZWE,2017,2.364265,"(-18.4554963, 29.7468414)",-18.455496,29.746841
6838,Zimbabwe,ZWE,2018,2.472949,"(-18.4554963, 29.7468414)",-18.455496,29.746841


In [19]:
df_mh_subst_use = df_mh_subst_use.drop('lat_lon', axis=1)
df_mh_subst_use

Unnamed: 0,Entity,Code,Year,DALYs (Disability-Adjusted Life Years) - Mental disorders - Sex: Both - Age: All Ages (Percent),latitude,longitude
0,Afghanistan,AFG,1990,1.696670,33.768006,66.238514
1,Afghanistan,AFG,1991,1.734281,33.768006,66.238514
2,Afghanistan,AFG,1992,1.791189,33.768006,66.238514
3,Afghanistan,AFG,1993,1.776779,33.768006,66.238514
4,Afghanistan,AFG,1994,1.712986,33.768006,66.238514
...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,2.193166,-18.455496,29.746841
6836,Zimbabwe,ZWE,2016,2.279813,-18.455496,29.746841
6837,Zimbabwe,ZWE,2017,2.364265,-18.455496,29.746841
6838,Zimbabwe,ZWE,2018,2.472949,-18.455496,29.746841


In [20]:
df_mh_subst_use.to_csv('Clean_data/cleaned-Disability-Adjusted-Life-Years.csv', index=False)

# Third csv file

In [21]:
df_depression_m_vs_f = pd.read_csv("Resources/prevalence-of-depression-males-vs-females.csv")

In [22]:
df_depression_m_vs_f.head()


Unnamed: 0,Entity,Code,Year,Prevalence - Depressive disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent
0,Abkhazia,OWID_ABK,2015,,,,Asia
1,Afghanistan,AFG,1990,4.291054,5.859656,12412311.0,
2,Afghanistan,AFG,1991,4.293268,5.853078,13299016.0,
3,Afghanistan,AFG,1992,4.298265,5.85002,14485543.0,
4,Afghanistan,AFG,1993,4.303087,5.844987,15816601.0,


In [23]:
df_depression_m_vs_f = df_depression_m_vs_f.dropna()
df_depression_m_vs_f

Unnamed: 0,Entity,Code,Year,Prevalence - Depressive disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent
26,Afghanistan,AFG,2015,4.384594,5.837310,34413603.0,Asia
575,Albania,ALB,2015,1.768626,3.410732,2890524.0,Europe
834,Algeria,DZA,2015,3.443441,5.172573,39728020.0,Africa
1093,American Samoa,ASM,2015,2.317518,3.199010,55806.0,Oceania
1207,Andorra,AND,2015,3.143566,4.713564,77993.0,Europe
...,...,...,...,...,...,...,...
54494,Venezuela,VEN,2015,2.798923,3.849009,30081827.0,South America
54753,Vietnam,VNM,2015,1.949282,3.137088,92677082.0,Asia
55638,Yemen,YEM,2015,3.993781,6.056418,26497881.0,Asia
55900,Zambia,ZMB,2015,3.658321,4.848113,15879370.0,Africa


In [24]:
df_depression_m_vs_f["lat_lon"] = df_depression_m_vs_f["Entity"].map(countries_lat_lon)

In [25]:
df_depression_m_vs_f

Unnamed: 0,Entity,Code,Year,Prevalence - Depressive disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,lat_lon
26,Afghanistan,AFG,2015,4.384594,5.837310,34413603.0,Asia,"(33.7680065, 66.2385139)"
575,Albania,ALB,2015,1.768626,3.410732,2890524.0,Europe,"(41.000028, 19.9999619)"
834,Algeria,DZA,2015,3.443441,5.172573,39728020.0,Africa,"(28.0000272, 2.9999825)"
1093,American Samoa,ASM,2015,2.317518,3.199010,55806.0,Oceania,"(-14.297124, -170.7131481)"
1207,Andorra,AND,2015,3.143566,4.713564,77993.0,Europe,"(42.5407167, 1.5732033)"
...,...,...,...,...,...,...,...,...
54494,Venezuela,VEN,2015,2.798923,3.849009,30081827.0,South America,"(8.0018709, -66.1109318)"
54753,Vietnam,VNM,2015,1.949282,3.137088,92677082.0,Asia,"(15.9266657, 107.9650855)"
55638,Yemen,YEM,2015,3.993781,6.056418,26497881.0,Asia,"(16.3471243, 47.8915271)"
55900,Zambia,ZMB,2015,3.658321,4.848113,15879370.0,Africa,"(-14.5189121, 27.5589884)"


In [26]:
discard_indexes = df_depression_m_vs_f[df_depression_m_vs_f["lat_lon"].isnull()].index
df_depression_m_vs_f = df_depression_m_vs_f.drop(discard_indexes)

In [27]:
df_depression_m_vs_f

Unnamed: 0,Entity,Code,Year,Prevalence - Depressive disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,lat_lon
26,Afghanistan,AFG,2015,4.384594,5.837310,34413603.0,Asia,"(33.7680065, 66.2385139)"
575,Albania,ALB,2015,1.768626,3.410732,2890524.0,Europe,"(41.000028, 19.9999619)"
834,Algeria,DZA,2015,3.443441,5.172573,39728020.0,Africa,"(28.0000272, 2.9999825)"
1093,American Samoa,ASM,2015,2.317518,3.199010,55806.0,Oceania,"(-14.297124, -170.7131481)"
1207,Andorra,AND,2015,3.143566,4.713564,77993.0,Europe,"(42.5407167, 1.5732033)"
...,...,...,...,...,...,...,...,...
54494,Venezuela,VEN,2015,2.798923,3.849009,30081827.0,South America,"(8.0018709, -66.1109318)"
54753,Vietnam,VNM,2015,1.949282,3.137088,92677082.0,Asia,"(15.9266657, 107.9650855)"
55638,Yemen,YEM,2015,3.993781,6.056418,26497881.0,Asia,"(16.3471243, 47.8915271)"
55900,Zambia,ZMB,2015,3.658321,4.848113,15879370.0,Africa,"(-14.5189121, 27.5589884)"


In [28]:
df_depression_m_vs_f["latitude"] = df_depression_m_vs_f["lat_lon"].map(lambda x: x[0])
df_depression_m_vs_f["longitude"] = df_depression_m_vs_f["lat_lon"].map(lambda x: x[1])

In [29]:
df_depression_m_vs_f

Unnamed: 0,Entity,Code,Year,Prevalence - Depressive disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,lat_lon,latitude,longitude
26,Afghanistan,AFG,2015,4.384594,5.837310,34413603.0,Asia,"(33.7680065, 66.2385139)",33.768006,66.238514
575,Albania,ALB,2015,1.768626,3.410732,2890524.0,Europe,"(41.000028, 19.9999619)",41.000028,19.999962
834,Algeria,DZA,2015,3.443441,5.172573,39728020.0,Africa,"(28.0000272, 2.9999825)",28.000027,2.999983
1093,American Samoa,ASM,2015,2.317518,3.199010,55806.0,Oceania,"(-14.297124, -170.7131481)",-14.297124,-170.713148
1207,Andorra,AND,2015,3.143566,4.713564,77993.0,Europe,"(42.5407167, 1.5732033)",42.540717,1.573203
...,...,...,...,...,...,...,...,...,...,...
54494,Venezuela,VEN,2015,2.798923,3.849009,30081827.0,South America,"(8.0018709, -66.1109318)",8.001871,-66.110932
54753,Vietnam,VNM,2015,1.949282,3.137088,92677082.0,Asia,"(15.9266657, 107.9650855)",15.926666,107.965086
55638,Yemen,YEM,2015,3.993781,6.056418,26497881.0,Asia,"(16.3471243, 47.8915271)",16.347124,47.891527
55900,Zambia,ZMB,2015,3.658321,4.848113,15879370.0,Africa,"(-14.5189121, 27.5589884)",-14.518912,27.558988


In [30]:
df_depression_m_vs_f = df_depression_m_vs_f.drop('lat_lon', axis=1)
df_depression_m_vs_f

Unnamed: 0,Entity,Code,Year,Prevalence - Depressive disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,latitude,longitude
26,Afghanistan,AFG,2015,4.384594,5.837310,34413603.0,Asia,33.768006,66.238514
575,Albania,ALB,2015,1.768626,3.410732,2890524.0,Europe,41.000028,19.999962
834,Algeria,DZA,2015,3.443441,5.172573,39728020.0,Africa,28.000027,2.999983
1093,American Samoa,ASM,2015,2.317518,3.199010,55806.0,Oceania,-14.297124,-170.713148
1207,Andorra,AND,2015,3.143566,4.713564,77993.0,Europe,42.540717,1.573203
...,...,...,...,...,...,...,...,...,...
54494,Venezuela,VEN,2015,2.798923,3.849009,30081827.0,South America,8.001871,-66.110932
54753,Vietnam,VNM,2015,1.949282,3.137088,92677082.0,Asia,15.926666,107.965086
55638,Yemen,YEM,2015,3.993781,6.056418,26497881.0,Asia,16.347124,47.891527
55900,Zambia,ZMB,2015,3.658321,4.848113,15879370.0,Africa,-14.518912,27.558988


In [31]:
df_depression_m_vs_f.to_csv('Clean_data/cleaned-prevalence-of-depression-males-vs-females.csv', index=False)

# 5th csv file

In [32]:
df_share_mental_substance_by_sex = pd.read_csv("Resources/share-with-mental-or-substance-disorders-by-sex.csv")

In [33]:
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent
0,Abkhazia,OWID_ABK,2015,,,,Asia
1,Afghanistan,AFG,1990,17.448695,17.634233,12412311.0,
2,Afghanistan,AFG,1991,17.771263,17.873184,13299016.0,
3,Afghanistan,AFG,1992,18.051575,18.092318,14485543.0,
4,Afghanistan,AFG,1993,18.275848,18.265196,15816601.0,
...,...,...,...,...,...,...,...
56624,Zimbabwe,ZWE,2018,,,14438812.0,
56625,Zimbabwe,ZWE,2019,,,14645473.0,
56626,Zimbabwe,ZWE,2020,,,14862927.0,
56627,Zimbabwe,ZWE,2021,,,15092171.0,


In [34]:
df_share_mental_substance_by_sex = df_share_mental_substance_by_sex.dropna()
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe
...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa


In [35]:
df_share_mental_substance_by_sex["lat_lon"] = df_share_mental_substance_by_sex["Entity"].map(countries_lat_lon)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_share_mental_substance_by_sex["lat_lon"] = df_share_mental_substance_by_sex["Entity"].map(countries_lat_lon)


In [36]:
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,lat_lon
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia,"(33.7680065, 66.2385139)"
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe,"(41.000028, 19.9999619)"
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa,"(28.0000272, 2.9999825)"
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania,"(-14.297124, -170.7131481)"
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe,"(42.5407167, 1.5732033)"
...,...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America,"(8.0018709, -66.1109318)"
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia,"(15.9266657, 107.9650855)"
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia,"(16.3471243, 47.8915271)"
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa,"(-14.5189121, 27.5589884)"


In [37]:
discard_indexes = df_share_mental_substance_by_sex[df_share_mental_substance_by_sex["lat_lon"].isnull()].index
df_share_mental_substance_by_sex = df_share_mental_substance_by_sex.drop(discard_indexes)

In [38]:
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,lat_lon
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia,"(33.7680065, 66.2385139)"
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe,"(41.000028, 19.9999619)"
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa,"(28.0000272, 2.9999825)"
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania,"(-14.297124, -170.7131481)"
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe,"(42.5407167, 1.5732033)"
...,...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America,"(8.0018709, -66.1109318)"
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia,"(15.9266657, 107.9650855)"
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia,"(16.3471243, 47.8915271)"
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa,"(-14.5189121, 27.5589884)"


In [39]:
df_share_mental_substance_by_sex["latitude"] = df_share_mental_substance_by_sex["lat_lon"].map(lambda x: x[0])
df_share_mental_substance_by_sex["longitude"] = df_share_mental_substance_by_sex["lat_lon"].map(lambda x: x[1])

In [40]:
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,lat_lon,latitude,longitude
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia,"(33.7680065, 66.2385139)",33.768006,66.238514
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe,"(41.000028, 19.9999619)",41.000028,19.999962
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa,"(28.0000272, 2.9999825)",28.000027,2.999983
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania,"(-14.297124, -170.7131481)",-14.297124,-170.713148
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe,"(42.5407167, 1.5732033)",42.540717,1.573203
...,...,...,...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America,"(8.0018709, -66.1109318)",8.001871,-66.110932
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia,"(15.9266657, 107.9650855)",15.926666,107.965086
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia,"(16.3471243, 47.8915271)",16.347124,47.891527
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa,"(-14.5189121, 27.5589884)",-14.518912,27.558988


In [41]:
df_share_mental_substance_by_sex = df_share_mental_substance_by_sex.drop('lat_lon', axis=1)
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,latitude,longitude
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia,33.768006,66.238514
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe,41.000028,19.999962
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa,28.000027,2.999983
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania,-14.297124,-170.713148
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe,42.540717,1.573203
...,...,...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America,8.001871,-66.110932
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia,15.926666,107.965086
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia,16.347124,47.891527
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa,-14.518912,27.558988


In [42]:
df_share_mental_substance_by_sex['Number of women with mental and substance use disorder']=(df_share_mental_substance_by_sex['Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent)']*df_share_mental_substance_by_sex['Population (historical estimates)'])/100

In [43]:
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,latitude,longitude,Number of women with mental and substance use disorder
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia,33.768006,66.238514,5.864502e+06
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe,41.000028,19.999962,3.196627e+05
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa,28.000027,2.999983,5.953962e+06
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania,-14.297124,-170.713148,6.142726e+03
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe,42.540717,1.573203,1.236261e+04
...,...,...,...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America,8.001871,-66.110932,3.309849e+06
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia,15.926666,107.965086,9.625256e+06
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia,16.347124,47.891527,4.305250e+06
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa,-14.518912,27.558988,1.976897e+06


In [44]:
df_share_mental_substance_by_sex.dtypes

Entity                                                                                              object
Code                                                                                                object
Year                                                                                                 int64
Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent)      float64
Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent)    float64
Population (historical estimates)                                                                  float64
Continent                                                                                           object
latitude                                                                                           float64
longitude                                                                                          float64
Number of women with mental and subst

In [45]:
df_share_mental_substance_by_sex['Number of men with mental and substance use disorder']=(df_share_mental_substance_by_sex['Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent)']*df_share_mental_substance_by_sex['Population (historical estimates)'])/100

In [46]:
df_share_mental_substance_by_sex

Unnamed: 0,Entity,Code,Year,Prevalence - Mental and substance use disorders - Sex: Male - Age: Age-standardized (Percent),Prevalence - Mental and substance use disorders - Sex: Female - Age: Age-standardized (Percent),Population (historical estimates),Continent,latitude,longitude,Number of women with mental and substance use disorder,Number of men with mental and substance use disorder
26,Afghanistan,AFG,2015,16.753068,17.041232,34413603.0,Asia,33.768006,66.238514,5.864502e+06,5.765334e+06
545,Albania,ALB,2015,10.648345,11.058989,2890524.0,Europe,41.000028,19.999962,3.196627e+05,3.077930e+05
804,Algeria,DZA,2015,14.040733,14.986809,39728020.0,Africa,28.000027,2.999983,5.953962e+06,5.578105e+06
1063,American Samoa,ASM,2015,10.692175,11.007287,55806.0,Oceania,-14.297124,-170.713148,6.142726e+03,5.966875e+03
1205,Andorra,AND,2015,13.604457,15.850925,77993.0,Europe,42.540717,1.573203,1.236261e+04,1.061052e+04
...,...,...,...,...,...,...,...,...,...,...,...
54824,Venezuela,VEN,2015,11.186214,11.002820,30081827.0,South America,8.001871,-66.110932,3.309849e+06,3.365018e+06
55083,Vietnam,VNM,2015,8.966948,10.385800,92677082.0,Asia,15.926666,107.965086,9.625256e+06,8.310306e+06
55872,Yemen,YEM,2015,15.410116,16.247524,26497881.0,Asia,16.347124,47.891527,4.305250e+06,4.083354e+06
56134,Zambia,ZMB,2015,11.994085,12.449468,15879370.0,Africa,-14.518912,27.558988,1.976897e+06,1.904585e+06


In [47]:
df_share_mental_substance_by_sex.to_csv('Clean_data/cleaned-share-with-mental-or-substance-disorders-by-sex.csv', index=False)

# 4th csv file

In [48]:
df_share_mental_substance = pd.read_csv("Resources/share-with-mental-and-substance-disorders.csv")

In [49]:
df_share_mental_substance

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent)
0,Afghanistan,AFG,1990,16.659229
1,Afghanistan,AFG,1991,16.765052
2,Afghanistan,AFG,1992,16.874469
3,Afghanistan,AFG,1993,16.990720
4,Afghanistan,AFG,1994,17.112730
...,...,...,...,...
6775,Zimbabwe,ZWE,2015,11.156429
6776,Zimbabwe,ZWE,2016,11.164133
6777,Zimbabwe,ZWE,2017,11.170427
6778,Zimbabwe,ZWE,2018,11.158765


In [50]:
df_share_mental_substance = df_share_mental_substance.dropna()
df_share_mental_substance

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent)
0,Afghanistan,AFG,1990,16.659229
1,Afghanistan,AFG,1991,16.765052
2,Afghanistan,AFG,1992,16.874469
3,Afghanistan,AFG,1993,16.990720
4,Afghanistan,AFG,1994,17.112730
...,...,...,...,...
6775,Zimbabwe,ZWE,2015,11.156429
6776,Zimbabwe,ZWE,2016,11.164133
6777,Zimbabwe,ZWE,2017,11.170427
6778,Zimbabwe,ZWE,2018,11.158765


In [51]:
df_share_mental_substance["lat_lon"] = df_share_mental_substance["Entity"].map(countries_lat_lon)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_share_mental_substance["lat_lon"] = df_share_mental_substance["Entity"].map(countries_lat_lon)


In [52]:
df_share_mental_substance

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent),lat_lon
0,Afghanistan,AFG,1990,16.659229,"(33.7680065, 66.2385139)"
1,Afghanistan,AFG,1991,16.765052,"(33.7680065, 66.2385139)"
2,Afghanistan,AFG,1992,16.874469,"(33.7680065, 66.2385139)"
3,Afghanistan,AFG,1993,16.990720,"(33.7680065, 66.2385139)"
4,Afghanistan,AFG,1994,17.112730,"(33.7680065, 66.2385139)"
...,...,...,...,...,...
6775,Zimbabwe,ZWE,2015,11.156429,"(-18.4554963, 29.7468414)"
6776,Zimbabwe,ZWE,2016,11.164133,"(-18.4554963, 29.7468414)"
6777,Zimbabwe,ZWE,2017,11.170427,"(-18.4554963, 29.7468414)"
6778,Zimbabwe,ZWE,2018,11.158765,"(-18.4554963, 29.7468414)"


In [53]:
discard_indexes = df_share_mental_substance[df_share_mental_substance["lat_lon"].isnull()].index
df_share_mental_substance = df_share_mental_substance.drop(discard_indexes)

In [54]:
df_share_mental_substance

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent),lat_lon
0,Afghanistan,AFG,1990,16.659229,"(33.7680065, 66.2385139)"
1,Afghanistan,AFG,1991,16.765052,"(33.7680065, 66.2385139)"
2,Afghanistan,AFG,1992,16.874469,"(33.7680065, 66.2385139)"
3,Afghanistan,AFG,1993,16.990720,"(33.7680065, 66.2385139)"
4,Afghanistan,AFG,1994,17.112730,"(33.7680065, 66.2385139)"
...,...,...,...,...,...
6775,Zimbabwe,ZWE,2015,11.156429,"(-18.4554963, 29.7468414)"
6776,Zimbabwe,ZWE,2016,11.164133,"(-18.4554963, 29.7468414)"
6777,Zimbabwe,ZWE,2017,11.170427,"(-18.4554963, 29.7468414)"
6778,Zimbabwe,ZWE,2018,11.158765,"(-18.4554963, 29.7468414)"


In [55]:
df_share_mental_substance["latitude"] = df_share_mental_substance["lat_lon"].map(lambda x: x[0])
df_share_mental_substance["longitude"] = df_share_mental_substance["lat_lon"].map(lambda x: x[1])

In [56]:
df_share_mental_substance.head()

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent),lat_lon,latitude,longitude
0,Afghanistan,AFG,1990,16.659229,"(33.7680065, 66.2385139)",33.768006,66.238514
1,Afghanistan,AFG,1991,16.765052,"(33.7680065, 66.2385139)",33.768006,66.238514
2,Afghanistan,AFG,1992,16.874469,"(33.7680065, 66.2385139)",33.768006,66.238514
3,Afghanistan,AFG,1993,16.99072,"(33.7680065, 66.2385139)",33.768006,66.238514
4,Afghanistan,AFG,1994,17.11273,"(33.7680065, 66.2385139)",33.768006,66.238514


In [57]:
df_share_mental_substance = df_share_mental_substance.drop('lat_lon', axis=1)
df_share_mental_substance

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent),latitude,longitude
0,Afghanistan,AFG,1990,16.659229,33.768006,66.238514
1,Afghanistan,AFG,1991,16.765052,33.768006,66.238514
2,Afghanistan,AFG,1992,16.874469,33.768006,66.238514
3,Afghanistan,AFG,1993,16.990720,33.768006,66.238514
4,Afghanistan,AFG,1994,17.112730,33.768006,66.238514
...,...,...,...,...,...,...
6775,Zimbabwe,ZWE,2015,11.156429,-18.455496,29.746841
6776,Zimbabwe,ZWE,2016,11.164133,-18.455496,29.746841
6777,Zimbabwe,ZWE,2017,11.170427,-18.455496,29.746841
6778,Zimbabwe,ZWE,2018,11.158765,-18.455496,29.746841


In [58]:
df_share_mental_substance.head()

Unnamed: 0,Entity,Code,Year,Prevalence - Mental disorders - Sex: Both - Age: Age-standardized (Percent),latitude,longitude
0,Afghanistan,AFG,1990,16.659229,33.768006,66.238514
1,Afghanistan,AFG,1991,16.765052,33.768006,66.238514
2,Afghanistan,AFG,1992,16.874469,33.768006,66.238514
3,Afghanistan,AFG,1993,16.99072,33.768006,66.238514
4,Afghanistan,AFG,1994,17.11273,33.768006,66.238514


In [59]:
df_share_mental_substance.to_csv('Clean_data/cleaned-share-with-mental-and-substance-disorders.csv', index=False)

# 2nd CSV file

In [60]:
df_diffdisorders = df_mh_subst_use = pd.read_csv("Resources/prevalence-by-mental-and-substance-use-disorder.csv")

In [61]:
df_diffdisorders.head(2)

Unnamed: 0,Entity,Code,Year,Prevalence - Schizophrenia - Sex: Both - Age: Age-standardized (Percent),Prevalence - Bipolar disorder - Sex: Both - Age: Age-standardized (Percent),Prevalence - Eating disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Anxiety disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Drug use disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Alcohol use disorders - Sex: Both - Age: Age-standardized (Percent)
0,Afghanistan,AFG,1990,0.228979,0.721207,0.131001,4.835127,0.454202,5.125291,0.444036
1,Afghanistan,AFG,1991,0.22812,0.719952,0.126395,4.821765,0.447112,5.116306,0.44425


In [62]:
df_diffdisorders.dropna()

Unnamed: 0,Entity,Code,Year,Prevalence - Schizophrenia - Sex: Both - Age: Age-standardized (Percent),Prevalence - Bipolar disorder - Sex: Both - Age: Age-standardized (Percent),Prevalence - Eating disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Anxiety disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Drug use disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Alcohol use disorders - Sex: Both - Age: Age-standardized (Percent)
0,Afghanistan,AFG,1990,0.228979,0.721207,0.131001,4.835127,0.454202,5.125291,0.444036
1,Afghanistan,AFG,1991,0.228120,0.719952,0.126395,4.821765,0.447112,5.116306,0.444250
2,Afghanistan,AFG,1992,0.227328,0.718418,0.121832,4.801434,0.441190,5.106558,0.445501
3,Afghanistan,AFG,1993,0.226468,0.717452,0.117942,4.789363,0.435581,5.100328,0.445958
4,Afghanistan,AFG,1994,0.225567,0.717012,0.114547,4.784923,0.431822,5.099424,0.445779
...,...,...,...,...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,0.209359,0.560882,0.099610,3.315701,0.599604,3.548613,1.734969
6836,Zimbabwe,ZWE,2016,0.209979,0.561768,0.100821,3.324230,0.603658,3.557508,1.689281
6837,Zimbabwe,ZWE,2017,0.210631,0.562612,0.101671,3.330569,0.608096,3.564138,1.651805
6838,Zimbabwe,ZWE,2018,0.211237,0.563283,0.102398,3.317500,0.609065,3.563141,1.686711


In [63]:
df_diffdisorders["lat_lon"] = df_diffdisorders["Entity"].map(countries_lat_lon)

In [64]:
df_diffdisorders

Unnamed: 0,Entity,Code,Year,Prevalence - Schizophrenia - Sex: Both - Age: Age-standardized (Percent),Prevalence - Bipolar disorder - Sex: Both - Age: Age-standardized (Percent),Prevalence - Eating disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Anxiety disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Drug use disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Alcohol use disorders - Sex: Both - Age: Age-standardized (Percent),lat_lon
0,Afghanistan,AFG,1990,0.228979,0.721207,0.131001,4.835127,0.454202,5.125291,0.444036,"(33.7680065, 66.2385139)"
1,Afghanistan,AFG,1991,0.228120,0.719952,0.126395,4.821765,0.447112,5.116306,0.444250,"(33.7680065, 66.2385139)"
2,Afghanistan,AFG,1992,0.227328,0.718418,0.121832,4.801434,0.441190,5.106558,0.445501,"(33.7680065, 66.2385139)"
3,Afghanistan,AFG,1993,0.226468,0.717452,0.117942,4.789363,0.435581,5.100328,0.445958,"(33.7680065, 66.2385139)"
4,Afghanistan,AFG,1994,0.225567,0.717012,0.114547,4.784923,0.431822,5.099424,0.445779,"(33.7680065, 66.2385139)"
...,...,...,...,...,...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,0.209359,0.560882,0.099610,3.315701,0.599604,3.548613,1.734969,"(-18.4554963, 29.7468414)"
6836,Zimbabwe,ZWE,2016,0.209979,0.561768,0.100821,3.324230,0.603658,3.557508,1.689281,"(-18.4554963, 29.7468414)"
6837,Zimbabwe,ZWE,2017,0.210631,0.562612,0.101671,3.330569,0.608096,3.564138,1.651805,"(-18.4554963, 29.7468414)"
6838,Zimbabwe,ZWE,2018,0.211237,0.563283,0.102398,3.317500,0.609065,3.563141,1.686711,"(-18.4554963, 29.7468414)"


In [65]:
discard_indexes = df_diffdisorders[df_diffdisorders["lat_lon"].isnull()].index
df_diffdisorders = df_diffdisorders.drop(discard_indexes)

In [66]:
df_diffdisorders

Unnamed: 0,Entity,Code,Year,Prevalence - Schizophrenia - Sex: Both - Age: Age-standardized (Percent),Prevalence - Bipolar disorder - Sex: Both - Age: Age-standardized (Percent),Prevalence - Eating disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Anxiety disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Drug use disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Alcohol use disorders - Sex: Both - Age: Age-standardized (Percent),lat_lon
0,Afghanistan,AFG,1990,0.228979,0.721207,0.131001,4.835127,0.454202,5.125291,0.444036,"(33.7680065, 66.2385139)"
1,Afghanistan,AFG,1991,0.228120,0.719952,0.126395,4.821765,0.447112,5.116306,0.444250,"(33.7680065, 66.2385139)"
2,Afghanistan,AFG,1992,0.227328,0.718418,0.121832,4.801434,0.441190,5.106558,0.445501,"(33.7680065, 66.2385139)"
3,Afghanistan,AFG,1993,0.226468,0.717452,0.117942,4.789363,0.435581,5.100328,0.445958,"(33.7680065, 66.2385139)"
4,Afghanistan,AFG,1994,0.225567,0.717012,0.114547,4.784923,0.431822,5.099424,0.445779,"(33.7680065, 66.2385139)"
...,...,...,...,...,...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,0.209359,0.560882,0.099610,3.315701,0.599604,3.548613,1.734969,"(-18.4554963, 29.7468414)"
6836,Zimbabwe,ZWE,2016,0.209979,0.561768,0.100821,3.324230,0.603658,3.557508,1.689281,"(-18.4554963, 29.7468414)"
6837,Zimbabwe,ZWE,2017,0.210631,0.562612,0.101671,3.330569,0.608096,3.564138,1.651805,"(-18.4554963, 29.7468414)"
6838,Zimbabwe,ZWE,2018,0.211237,0.563283,0.102398,3.317500,0.609065,3.563141,1.686711,"(-18.4554963, 29.7468414)"


In [67]:
df_diffdisorders["latitude"] = df_diffdisorders["lat_lon"].map(lambda x: x[0])
df_diffdisorders["longitude"] = df_diffdisorders["lat_lon"].map(lambda x: x[1])

In [68]:
df_diffdisorders

Unnamed: 0,Entity,Code,Year,Prevalence - Schizophrenia - Sex: Both - Age: Age-standardized (Percent),Prevalence - Bipolar disorder - Sex: Both - Age: Age-standardized (Percent),Prevalence - Eating disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Anxiety disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Drug use disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Alcohol use disorders - Sex: Both - Age: Age-standardized (Percent),lat_lon,latitude,longitude
0,Afghanistan,AFG,1990,0.228979,0.721207,0.131001,4.835127,0.454202,5.125291,0.444036,"(33.7680065, 66.2385139)",33.768006,66.238514
1,Afghanistan,AFG,1991,0.228120,0.719952,0.126395,4.821765,0.447112,5.116306,0.444250,"(33.7680065, 66.2385139)",33.768006,66.238514
2,Afghanistan,AFG,1992,0.227328,0.718418,0.121832,4.801434,0.441190,5.106558,0.445501,"(33.7680065, 66.2385139)",33.768006,66.238514
3,Afghanistan,AFG,1993,0.226468,0.717452,0.117942,4.789363,0.435581,5.100328,0.445958,"(33.7680065, 66.2385139)",33.768006,66.238514
4,Afghanistan,AFG,1994,0.225567,0.717012,0.114547,4.784923,0.431822,5.099424,0.445779,"(33.7680065, 66.2385139)",33.768006,66.238514
...,...,...,...,...,...,...,...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,0.209359,0.560882,0.099610,3.315701,0.599604,3.548613,1.734969,"(-18.4554963, 29.7468414)",-18.455496,29.746841
6836,Zimbabwe,ZWE,2016,0.209979,0.561768,0.100821,3.324230,0.603658,3.557508,1.689281,"(-18.4554963, 29.7468414)",-18.455496,29.746841
6837,Zimbabwe,ZWE,2017,0.210631,0.562612,0.101671,3.330569,0.608096,3.564138,1.651805,"(-18.4554963, 29.7468414)",-18.455496,29.746841
6838,Zimbabwe,ZWE,2018,0.211237,0.563283,0.102398,3.317500,0.609065,3.563141,1.686711,"(-18.4554963, 29.7468414)",-18.455496,29.746841


In [69]:
df_diffdisorders = df_diffdisorders.drop('lat_lon', axis=1)

In [70]:
df_diffdisorders

Unnamed: 0,Entity,Code,Year,Prevalence - Schizophrenia - Sex: Both - Age: Age-standardized (Percent),Prevalence - Bipolar disorder - Sex: Both - Age: Age-standardized (Percent),Prevalence - Eating disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Anxiety disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Drug use disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Depressive disorders - Sex: Both - Age: Age-standardized (Percent),Prevalence - Alcohol use disorders - Sex: Both - Age: Age-standardized (Percent),latitude,longitude
0,Afghanistan,AFG,1990,0.228979,0.721207,0.131001,4.835127,0.454202,5.125291,0.444036,33.768006,66.238514
1,Afghanistan,AFG,1991,0.228120,0.719952,0.126395,4.821765,0.447112,5.116306,0.444250,33.768006,66.238514
2,Afghanistan,AFG,1992,0.227328,0.718418,0.121832,4.801434,0.441190,5.106558,0.445501,33.768006,66.238514
3,Afghanistan,AFG,1993,0.226468,0.717452,0.117942,4.789363,0.435581,5.100328,0.445958,33.768006,66.238514
4,Afghanistan,AFG,1994,0.225567,0.717012,0.114547,4.784923,0.431822,5.099424,0.445779,33.768006,66.238514
...,...,...,...,...,...,...,...,...,...,...,...,...
6835,Zimbabwe,ZWE,2015,0.209359,0.560882,0.099610,3.315701,0.599604,3.548613,1.734969,-18.455496,29.746841
6836,Zimbabwe,ZWE,2016,0.209979,0.561768,0.100821,3.324230,0.603658,3.557508,1.689281,-18.455496,29.746841
6837,Zimbabwe,ZWE,2017,0.210631,0.562612,0.101671,3.330569,0.608096,3.564138,1.651805,-18.455496,29.746841
6838,Zimbabwe,ZWE,2018,0.211237,0.563283,0.102398,3.317500,0.609065,3.563141,1.686711,-18.455496,29.746841


In [72]:
df_diffdisorders.to_csv('Clean_data/df_diffdisorders.csv', index=False)