In [None]:
import pandas as pd
import json
import folium

## European unemployment

We obtained the data from [this Eurostat page](http://ec.europa.eu/eurostat/data/database) by navigating through the following directory hierarchy:

 - Tables by theme
 - Population and social conditions
 - Labour market
 - Employment and unemployment (Labour force survey)
 - LFS Main indicators
 - Unemployment - LFS adjusted series
 - Total unemployment rate

[Statistical description of the dataset](http://ec.europa.eu/eurostat/cache/metadata/en/tsdec450_esmsip.htm)

In [None]:
# Load only the composite key column and the 2016 values from the Eurostat
# TSV. The year column is addressed as '2016 ' (with a trailing space).
wanted_columns = ['age,unit,sex,geo\\time', '2016 ']
euro = pd.read_csv(
    'Homework3-data/european_unemployment.tsv',
    sep='\t',
    usecols=wanted_columns,
)
euro.head()

In [None]:
# Break the composite key into its comma-separated parts, one column each
# (expand=True already yields a DataFrame with integer column labels).
composite_key = euro['age,unit,sex,geo\\time']
countries = composite_key.str.split(',', expand=True)
countries.head()

In [None]:
# Distinct values of the first key component ('age' in the column header).
countries.loc[:, 0].unique()

In [None]:
# Distinct values of the second key component ('unit' in the column header).
countries.loc[:, 1].unique()

As indicated [here](https://www.google.ch/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&ved=0ahUKEwiFm4i2-pzXAhUGZlAKHRd_BmQQFggmMAA&url=http%3A%2F%2Fec.europa.eu%2Feurostat%2Fdocuments%2F10186%2F6246844%2FChanges%2Bto%2Bthe%2Bunemployment%2Bdata%2Btables.pdf&usg=AOvVaw10j2p5RgC8vFvpEuvBX2Jn), we only keep the rows whose unit is `PC_ACT` (percentage of the active population).

In [None]:
# Keep the last key component (column 3, 'geo') for rows whose unit is
# 'PC_ACT', and label it 'country'.
# NOTE(review): only the unit is filtered; if the file holds several age/sex
# breakdowns per country, a country would appear more than once - confirm.
is_pc_act = countries[1] == 'PC_ACT'
countries = countries.loc[is_pc_act, [3]].rename(columns={3: 'country'})

In [None]:
# Attach the 2016 values to the retained country rows (inner join on the
# shared row index) and strip the trailing space from the year label.
# This cell overwrites `euro`, so it can only be run once per load.
euro = (
    countries
    .join(euro[['2016 ']], how='inner')
    .rename(columns={'2016 ': '2016'})
)

In [None]:
# Preview the first five rows of the country / 2016 table.
euro.head(n=5)

In [None]:
# Summary statistics of the 2016 column.
euro.loc[:, '2016'].describe()

In [None]:
# Coordinates used as the map centre (passed to folium as `location`).
KIEV = [50.45, 30.5234]

In [None]:
# Base map centred on KIEV at zoom level 4.
euromap = folium.Map(
    location=KIEV,
    zoom_start=4,
)

In [None]:
# Build a TopoJson layer from the Europe file and add it to the base map.
# The file is opened in a `with` block so the handle is closed as soon as
# folium has read it; the original left the handle open. JSON is read as
# UTF-8 explicitly rather than relying on the platform default encoding.
with open('Homework3-data/topojson/europe.topojson.json',
          encoding='utf-8') as topo_file:
    geo_data = folium.TopoJson(topo_file, 'objects.europe')
geo_data.add_to(euromap)

In [None]:
# Display the map as the cell output.
euromap

In [None]:
# Colour each country by its 2016 value from `euro`.
#
# Map.choropleth expects the raw geometry (a dict / path / URL), not a folium
# layer object, and needs `topojson=` to know which object inside a TopoJSON
# file to draw. The original passed the TopoJson layer `geo_data` without
# `topojson=`, so folium tried to interpret a layer object as GeoJSON.
# The geometry is therefore loaded here as a plain dict.
# NOTE(review): assumes the TopoJSON feature ids use the same country codes
# as the 'country' column of `euro` - confirm, unmatched countries get no value.
# NOTE(review): recent folium releases replace Map.choropleth with
# folium.Choropleth(...).add_to(map) - switch if the installed version lacks it.
with open('Homework3-data/topojson/europe.topojson.json',
          encoding='utf-8') as topo_file:
    europe_topo = json.load(topo_file)

euromap.choropleth(
    geo_data=europe_topo,
    topojson='objects.europe',
    data=euro,
    columns=['country', '2016'],
    key_on='feature.id',
    fill_color='BuPu', fill_opacity=0.7, line_opacity=0.2
)

# Show the map with the choropleth applied.
euromap