Skip to content
Permalink
master
Switch branches/tags

Name already in use

A tag already exists with the provided branch name. Many Git commands accept both tag and branch names, so creating this branch may cause unexpected behavior. Are you sure you want to create this branch?
Go to file
 
 
Cannot retrieve contributors at this time
from collections import OrderedDict
from bokeh.plotting import figure, show, output_file
from bokeh.models import HoverTool, ColumnDataSource, Range1d
from bokeh.embed import components
import pandas as pd
df = pd.read_csv('~/Google Drive/Datasets/OECD_Labour_Stats.csv')
years = Range1d(1994, 2015)
countries = OrderedDict()
for c in df['Country'].values:
countries[c] = True
countries = [key for key, value in countries.items()]
countries = countries[::-1] # reverse the list so the x axis goes in the right direction
colours = [
"#75968f", "#a5bab7", "#c9d9d3", "#e2e2e2", "#dfccce",
"#ddb7b1", "#cc7878", "#933b41", "#550b1d"
]
df['colours'] = [colours[min(int(rate) - 2, 8)] for rate in df['Value'].values]
df = df[['Time', 'Country', 'colours', 'Value']]
#709
#limit to years after 1995
df = df.ix[df['Time'] >= 1995,]
#Adding NA values
for country in countries:
country_df = df.ix[df['Country'] == country,]
if len(country_df) < 20:
for year in range(1995, 2015):
if year not in country_df.Time.values:
new_df = pd.DataFrame({'Time': year,
'Country': country_df['Country'].iloc[0],
'colours': '#fffff4',
'Value': 'NaN'},
index= [(df.index[-1] + 1)]
)
print(new_df)
df = pd.concat([df, new_df])
print('Added values for ', country_df['Country'].iloc[0])
else:
print('Not missing values', country_df['Country'].iloc[0])
source = ColumnDataSource(df)
output_file('oecd_unemployment.html')
p = figure(title='OECD Unemployment (1990 - 2015)',
tools='resize,hover,save', x_range=years, y_range=countries)
p.rect(x='Time', y='Country', width=1, height=1, source=source,
color='colours', line_color=None)
hover = p.select(dict(type=HoverTool))
hover.tooltips = OrderedDict([
('Year', '@Time'),
('Country', '@Country'),
('Unemployment Rate (%)', '@Value')
])
p.toolbar_location = 'right'
p.plot_height = 800
p.plot_width = 1000
#Getting rid of chart junk
p.outline_line_color = None
p.grid.grid_line_color = None
p.axis.axis_line_color = None
p.axis.major_tick_line_color = None
p.axis.minor_tick_line_color = None
script_file = open('oecd_unemployment_script.html', 'w+')
div_file = open('oecd_unemployment_div.html', 'w+')
script, div = components(p)
print(script, file=script_file)
print(div, file=div_file)
show(p)