# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [95]:
import os

import cufflinks as cf
import pandas as pd
# NOTE(review): plotly >= 4 moved `plotly.plotly` to the separate `chart_studio` package.
import plotly.plotly as py
from ipywidgets import interact

# Put cufflinks into offline mode before any chart is drawn.
cf.go_offline()

In [96]:
# Location of the Online Retail workbook. Set the ONLINE_RETAIL_XLSX environment
# variable to point at your own copy; the fallback is the original author's path,
# so behaviour is unchanged when the variable is not set.
DATA_PATH = os.environ.get(
    'ONLINE_RETAIL_XLSX',
    '/Users/johnngai/Desktop/lab-interactive-visualization/data/Online Retail.xlsx',
)

data = pd.read_excel(DATA_PATH)
data.head()

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


In [97]:
# Inspect the column dtypes; the `.dt` date filters used later need InvoiceDate to be datetime.
data.dtypes

InvoiceNo               int64
InvoiceDate    datetime64[ns]
StockCode              object
Description            object
Quantity                int64
UnitPrice             float64
Revenue               float64
CustomerID              int64
Country                object
dtype: object

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [98]:
# Keep only the rows invoiced in April 2011.
invoice_month = data['InvoiceDate'].dt.strftime('%Y-%m')
data_april = data.loc[invoice_month.eq('2011-04')]

# Drop the United Kingdom rows.
data_no_uk = data_april.loc[data_april['Country'].ne('United Kingdom')]

# Total revenue and quantity per remaining country, with Country kept as a column.
dataplot = (
    data_no_uk
    .groupby('Country', as_index=False)
    .agg({"Revenue": "sum", "Quantity": "sum"})
)


In [99]:
import plotly.plotly as py
import plotly.graph_objs as go

# Grouped bar chart built from `dataplot`: one bar per measure for each country.
trace1 = go.Bar(
    x=dataplot['Country'],
    y=dataplot['Quantity'],
    name='Qty'
)
trace2 = go.Bar(
    x=dataplot['Country'],
    y=dataplot['Revenue'],
    name='Rev'
)

plotdata = [trace1, trace2]

# Title and axis titles let the figure stand alone when the notebook is skimmed.
layout = go.Layout(
    title='Total quantity and revenue by country (excl. United Kingdom), April 2011',
    xaxis=dict(title='Country'),
    yaxis=dict(title='Qty / Revenue'),
    barmode='group'
)

fig = go.Figure(data=plotdata, layout=layout)
# fig.iplot(...) is used instead of py.iplot(fig, filename='grouped-bar'),
# which raised an error in this environment.
fig.iplot(filename='grouped-bar')



## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [114]:
# Rows invoiced from January 1st through May 31st 2011
# (half-open range: everything strictly before June 1st).
in_period = (
    (data['InvoiceDate'] >= pd.Timestamp('2011-01-01'))
    & (data['InvoiceDate'] < pd.Timestamp('2011-06-01'))
)
data_jan_to_may = data[in_period]
data_france = data_jan_to_may[data_jan_to_may['Country'] == 'France'].sort_values(by=['InvoiceDate'])

# Sum rows that share an InvoiceDate so each timestamp contributes exactly one
# point per line instead of several stacked y-values. groupby sorts by its key,
# so the result stays in chronological order.
france_totals = data_france.groupby('InvoiceDate', as_index=False)[['Revenue', 'Quantity']].sum()

trace3 = go.Scatter(
    x=france_totals['InvoiceDate'],
    y=france_totals['Revenue'],
    mode='lines',
    name='Rev'
)
trace4 = go.Scatter(
    x=france_totals['InvoiceDate'],
    y=france_totals['Quantity'],
    mode='lines',
    name='Qty'
)

layout1 = dict(title = 'Quantity and Revenue sold to France between January1st to May31st',
              xaxis = dict(title = 'Date'),
              yaxis = dict(title = 'Qty / Dollars'),
              )

plotdata2 = [trace3, trace4]

fig = go.Figure(data=plotdata2, layout=layout1)

fig.iplot(filename='line-mode')



In [85]:
# NOTE(review): leftover cell. Its execution count (85) is lower than the cells above it,
# and it rebinds `fig` to the exercise-1 bar chart (`plotdata` / `layout`) without
# displaying anything. Consider deleting it so `fig` is not silently overwritten on Run All.
fig = go.Figure(data=plotdata, layout=layout)


## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [None]:
# Products whose revenue is compared across countries in exercise 5.
product_list = [
    'JUMBO BAG RED RETROSPOT',
    'CREAM HANGING HEART T-LIGHT HOLDER',
    'REGENCY CAKESTAND 3 TIER',
]

# Countries shown as the side-by-side bars in exercise 5.
country_list = [
    'EIRE',
    'Germany',
    'France',
    'Netherlands',
]

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
# Split InvoiceDate into calendar components, added as new columns on `data`.
invoice_dates = data['InvoiceDate'].dt
data['Year'] = invoice_dates.year
data['Month'] = invoice_dates.month
data['Day'] = invoice_dates.day

# United Kingdom rows only, including the Year / Month / Day columns added above.
uk = data.loc[data['Country'].eq('United Kingdom')]

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
# Per-product aggregations: distinct invoices and customers, summed quantity
# and revenue, and mean unit price.
agg_func = dict(
    InvoiceNo='nunique',
    Quantity='sum',
    UnitPrice='mean',
    Revenue='sum',
    CustomerID='nunique',
)

# One row per product description, computed from the `uk` frame.
by_description = uk.groupby('Description')
products = by_description.agg(agg_func)

## 8. Create an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the products that contain the entered text in their description.