# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [1]:
import pandas as pd
import plotly.plotly as py
import cufflinks as cf
from ipywidgets import interact

# Put cufflinks in offline mode so the `.iplot()` calls below render their
# charts locally in the notebook rather than through the Plotly online service.
cf.go_offline()

In [2]:
# Read the Online Retail workbook into a DataFrame; the path is relative to
# the directory the notebook is run from.
data = pd.read_excel(io='../data/Online Retail.xlsx')

In [3]:
# Preview the first five rows to check the columns that were loaded.
data.head(n=5)

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [4]:
# Keep every invoice line dated within April 2011.
# The window is half-open (start inclusive, end exclusive): InvoiceDate carries
# a time of day, so an upper bound of `<= '2011-04-30'` is compared against
# midnight and would silently drop every sale made during April 30, while
# `> '2011-04-01'` would drop a sale stamped exactly at midnight on April 1.
filtered_date = data[(data['InvoiceDate'] >= '2011-04-01') & (data['InvoiceDate'] < '2011-05-01')]

# Total quantity and total revenue per country, leaving out the United Kingdom.
# `as_index=False` keeps Country as a regular column so it can be used as the
# x-axis of the bar chart.
grouped = (
    filtered_date[filtered_date.Country != "United Kingdom"]
    .groupby('Country', as_index=False)
    .agg({'Quantity': 'sum', 'Revenue': 'sum'})
)


In [5]:
# `grouped` carries both a Quantity and a Revenue column, and both are drawn as
# bars for each country, so the title and y-axis label name both measures
# instead of Quantity alone.
grouped.iplot(kind='bar', x='Country', xTitle='Country',
              yTitle='Total quantity / revenue',
              title='Total Quantity and Revenue by Country (April 2011, excluding United Kingdom)')

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [6]:
# Keep every invoice line dated from 1 January through 31 May 2011.
# The window is half-open (start inclusive, end exclusive): InvoiceDate carries
# a time of day, so `<= '2011-05-31'` is compared against midnight and would
# drop every sale made during May 31.
filtered_date1 = data[(data['InvoiceDate'] >= '2011-01-01') & (data['InvoiceDate'] < '2011-06-01')]

# French invoice lines only, reduced to the columns needed for the line chart
# and ordered chronologically so the line is drawn left to right in time.
france = (
    filtered_date1
    .loc[filtered_date1.Country == "France", ["InvoiceDate", "Quantity", "Revenue"]]
    .sort_values("InvoiceDate")
)

france.head()

Unnamed: 0,InvoiceDate,Quantity,Revenue
62212,2011-01-05 12:42:00,12,7.8
116492,2011-01-05 12:42:00,4,19.8
188781,2011-01-05 12:42:00,6,17.7
34108,2011-01-05 12:42:00,12,17.4
221614,2011-01-05 12:42:00,2,11.9


In [7]:
# `france` holds both Quantity and Revenue, and each is drawn as its own line
# against InvoiceDate, so the title and y-axis label name both measures
# instead of Revenue alone.
france.iplot(kind='line', x='InvoiceDate', xTitle='InvoiceDate',
             yTitle='Quantity / revenue',
             title='Quantity and Revenue Sold to France (1 Jan - 31 May 2011)')

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [11]:
# Per-country averages of Quantity and UnitPrice for the PARTY BUNTING product.
# `as_index=False` keeps Country as a column so it can color-code the points.
scatter = (
    data.loc[data['Description'] == 'PARTY BUNTING']
    .groupby("Country", as_index=False)
    .agg({"Quantity": "mean", "UnitPrice": "mean"})
)
scatter

Unnamed: 0,Country,Quantity,UnitPrice
0,Australia,33.125,4.7125
1,Austria,8.0,4.95
2,Belgium,4.0,4.95
3,Channel Islands,13.333333,4.95
4,Cyprus,2.333333,4.75
5,Denmark,12.0,4.95
6,EIRE,21.210526,4.739474
7,Finland,6.0,4.95
8,France,5.727273,4.922727
9,Germany,6.8,4.89


In [12]:
# Average quantity on the x-axis against average unit price on the y-axis,
# with the points split into one category per Country.
scatter.iplot(
    categories='Country',
    x='Quantity',
    y='UnitPrice',
    xTitle='Quantity',
    yTitle='UnitPrice',
    title='Relationship between average quantity and average unit price',
)

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [54]:
# Build an invoice-by-country table: one row per InvoiceNo, one column per
# selected country, each cell holding the mean Quantity over that invoice's
# lines. Cells are NaN for every country the invoice does not belong to.
# NOTE(review): aggfunc='mean' averages the invoice's line quantities; if
# "quantity per invoice" is meant as the invoice total, confirm whether 'sum'
# is the intended aggregation.
countries = (
    data.loc[data.Country.isin(['EIRE', 'Germany', 'France', 'Netherlands'])]
    .pivot_table(index='InvoiceNo', columns='Country',
                 values='Quantity', aggfunc='mean')
)
countries.head()

Country,EIRE,France,Germany,Netherlands
InvoiceNo,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
536370,,23.473684,,
536403,,,,96.0
536527,,,11.142857,
536540,12.105263,,,
536541,12.0,,,


In [47]:
# One histogram per country column (subplots=True). A histogram bins the
# Quantity values along the x-axis and counts invoices on the y-axis, so the
# axes are labelled with those meanings rather than "Country" / "Quantity".
countries.iplot(kind='hist', subplots=True,
                xTitle='Quantity per invoice', yTitle='Number of invoices',
                title='Quantity per invoice')

## 5. Create an interactive side-by-side bar chart showing revenue for each of the products listed below, with one bar per country listed below.

In [None]:
# Product descriptions to compare in the side-by-side revenue chart.
product_list = [
    'JUMBO BAG RED RETROSPOT',
    'CREAM HANGING HEART T-LIGHT HOLDER',
    'REGENCY CAKESTAND 3 TIER',
]

# Countries whose revenue is shown as a bar for each product.
country_list = [
    'EIRE',
    'Germany',
    'France',
    'Netherlands',
]

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
# Split each invoice timestamp into calendar parts, stored as new columns on
# `data` so they can drive the Year / Month drop-down filters.
invoice_index = pd.DatetimeIndex(data['InvoiceDate'])
data['Year'] = invoice_index.year
data['Month'] = invoice_index.month
data['Day'] = invoice_index.day

# United Kingdom rows only; taken after the columns above are added so that
# `uk` carries Year, Month and Day as well.
uk = data.loc[data['Country'] == 'United Kingdom']

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
# Per-product summary: how each column is collapsed when rows are grouped by
# product description (distinct invoices and customers, total quantity and
# revenue, average unit price).
agg_func = dict(
    InvoiceNo='nunique',
    Quantity='sum',
    UnitPrice='mean',
    Revenue='sum',
    CustomerID='nunique',
)

# One row per product Description, computed over the United Kingdom rows.
products = uk.groupby('Description').agg(agg_func)

## 8. Create an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show only the products whose description contains the entered text.