# Differences in bad-very bad self-reported health among women aged 18-44 years by highest and lowest equivalised income quintiles in selected EU Member States, 2013

## Setup

In [1]:
from __future__ import unicode_literals, print_function, division

In [2]:
import os

In [3]:
import numpy as np
import pandas as pd

import plotly.plotly as py
from plotly.graph_objs import *
import plotly.tools as tls

  from pkg_resources import resource_stream


## Specific Configuration

In [4]:
# Raw data lives in a `data` folder next to the notebook (relative to the
# current working directory), so no absolute local path is baked in.
DATA_DIR = os.path.join(os.curdir, 'data')
# Workbook read by the data-importation cell below.
RAW_FILE = os.path.join(DATA_DIR, 'raw_data_20150701.xlsx')

In [5]:
SHEET = 'Figure24'

PARSE_COLS = 'A:C,F,G'
SKIPROWS = 14
SKIP_FOOTER = 118-48

title = 'Reports of bad or very bad personal health'
subtitle = 'Self-perceived health by income quintile (% women aged 18-44 years, 2013)'
source = dict(label='Eurostat', 
              link=('http://appsso.eurostat.ec.europa.eu/nui/show.do?',
                    'query=BOOKMARK_DS-051950_QID_-2B10F8F_UID_-3F171EB0&',
                    'layout=TIME,C,X,0;GEO,L,Y,0;INCGRP,L,Z,0;AGE,L,Z,1;SEX,L,Z,2;',
                    'LEVELS,L,Z,3;UNIT,L,Z,4;INDICATORS,C,Z,5;&zSelection=DS-051950INDICATORS,',
                    'OBS_FLAG;DS-051950AGE,Y18-44;DS-051950INCGRP,Q0_20;',
                    'DS-051950LEVELS,B_VB;DS-051950UNIT,PC;DS-051950SEX,F;',
                    '&rankName1=TIME_1_0_0_0&rankName2=UNIT_1_2_-1_2&rankName3=GEO_1_2_0_1&',
                    'rankName4=AGE_1_2_-1_2&rankName5=INDICATORS_1_2_-1_2&rankName6=SEX_1_2_-1_2&',
                    'rankName7=LEVELS_1_2_-1_2&rankName8=INCGRP_1_2_-1_2&',
                    'pprRK=FIRST&pprSO=PROTOCOL&ppcRK=FIRST&ppcSO=ASC&sortC=ASC_-1_FIRST&',
                    'rStp=&cStp=&rDCh=&cDCh=&rDM=true&cDM=true&footnes=false&empty=false&',
                    'wai=true&time_mode=NONE&time_most_recent=false&lang=EN&',
                    'cfo=%23%23%23%2C%23%23%23.%23%23%23'),
              accessed='25 May 2015')

X_LABEL = 'Percentage women rating themselves in bad health'
Y_LABEL = ''

## Data Importation and Munging

In [6]:
# Load only the table region of the configured worksheet: the selected
# columns, minus the rows skipped at the top and bottom of the sheet.
# NOTE(review): `sheetname`, `parse_cols` and `skip_footer` are the older
# pandas keyword spellings (later renamed `sheet_name`, `usecols`,
# `skipfooter`); keep them while the notebook targets the pandas release it
# was written against.
DF = pd.read_excel(
    RAW_FILE,
    sheetname=SHEET, parse_cols=PARSE_COLS,
    skiprows=SKIPROWS, skip_footer=SKIP_FOOTER,
)

# Replace the spreadsheet headers with short names, one per parsed column.
# NOTE(review): the notebook title and notes describe lowest vs. highest
# income quintile, while these names read "bad" / "very bad" - confirm what
# the two value columns actually hold before relying on the names.
DF.columns = 'country bad bad_flags v_bad v_bad_flags'.split()

# Bare last expression so the frame is rendered as the cell output.
DF

Unnamed: 0,country,bad,bad_flags,v_bad,v_bad_flags
0,EU 27,5.1,,1.6,
1,Belgium,10.4,,0.7,
2,Bulgaria,4.3,,0.3,
3,Czech Republic,5.9,u,0.5,u
4,Denmark,3.1,,1.6,
5,Germany,7.1,,2.5,
6,Estonia,9.0,,0.2,
7,Ireland,2.6,,0.8,
8,Greece,1.8,,1.1,
9,Spain,3.0,,1.2,


#### Flags

```
b	break in time series
c	confidential
d	definition differs, see metadata
e	estimated
f	forecast
i	see metadata (phased out)
n	not significant
p	provisional
r	revised
s	Eurostat estimate (phased out)
u	low reliability
z	not applicable
```

####  Notes

Differences in bad-very bad self-reported health among women aged 18-44 years by highest and lowest equivalised income quintiles in selected EU Member States, 2013.

Quintile 1 is the lowest equivalised income group (lowest 20%) and Quintile 5 is the highest equivalised income group (highest 20%). Data for the Czech Republic, Croatia, Serbia and the UK (5th quintile only) are flagged as having low reliability.

## Plotting