# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [47]:
import pandas as pd
import plotly.plotly as py
import cufflinks as cf
from ipywidgets import interact

cf.go_offline()

In [48]:
data = pd.read_excel('../data/Online Retail.xlsx')

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [51]:
#Drop UK
data_noUK = data[data['Country'] != 'United Kingdom']
#Filter for April only
graph_data_april = data_noUK[data_noUK['InvoiceDate'].map(lambda x: x.month) == 4]
#Filter for 2011 only
graph_data_april_2011 = graph_data_april[graph_data_april['InvoiceDate'].map(lambda x: x.year) == 2011]
#Group by country and keep only the data we are interested in
graph_data = graph_data_april_2011.groupby('Country').sum()[['Quantity','Revenue']]
#Plot
graph_data.iplot(kind='bar')



## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [52]:
#Drop all countries but France
data_France = data[data['Country'] == 'France']
#Filter only for 2011
data_France_2011 = data_France[data_France['InvoiceDate'].map(lambda x: x.year) == 2011]
#Filter only for up to may
data_France_2011_tillMay = data_France_2011[data_France_2011['InvoiceDate'].map(lambda x: x.month) < 6]
#We keep only the data we need to plot
graph_data = data_France_2011_tillMay[['InvoiceDate','Quantity','Revenue']]
#To order the date and avoid repeated dates
graph_data = graph_data.groupby('InvoiceDate').sum()
#Plot
graph_data.iplot(kind='line')



## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [74]:
#We keep only 'party bunting'
data_party = data[data['Description'] == 'PARTY BUNTING']
#data_party_countries = 
data_party_country = data_party.groupby('Country').mean()[['Quantity','Revenue']].reset_index()
#py.iplot({data='data_party_country', kind='bubbles',x='Quantity', y='Revenue', text='Country')

py.iplot(
    {
        'data': [
            {
                'x': data_party_country['Quantity'],
                'y': data_party_country['Revenue'],
                'name': country, 'mode': 'markers',
            } for country in list(data_party_country['Country'])
        ],
        'layout': {
            'xaxis': {'title': 'Quantity'},
            'yaxis': {'title': "Revenue"}
        }
}, filename='cufflinks/scatter-group-by')


Aw, snap! We didn't get a username with your request.

Don't have an account? https://plot.ly/api_signup

Questions? accounts@plot.ly


PlotlyError: Because you didn't supply a 'file_id' in the call, we're assuming you're trying to snag a figure from a url. You supplied the url, '', we expected it to start with 'https://plot.ly'.
Run help on this function for more information.

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [None]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.