# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [64]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
import ipywidgets as widgets
import plotly.express as px
import plotly.graph_objects as go
import datetime

cf.go_offline()

In [2]:
data = pd.read_excel('../Data/Online Retail.xlsx')

In [3]:
data_UK = data[(data["InvoiceDate"] >= '2011-04-01') & (data["InvoiceDate"] <= '2011-04-30')]
data_UK = data_UK[(data_UK["Country"] != "United Kingdom")]
data_UK = data_UK.groupby("Country").agg({"Revenue": "sum", "Quantity": "sum"})

In [4]:
data

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.30,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.30,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.30,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.20,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.60,13408,United Kingdom
...,...,...,...,...,...,...,...,...,...
396029,580691,2011-12-05 15:48:00,90214W,"LETTER ""W"" BLING KEY RING",12,0.29,3.48,13790,United Kingdom
396030,580691,2011-12-05 15:48:00,90214Z,"LETTER ""Z"" BLING KEY RING",12,0.29,3.48,13790,United Kingdom
396031,580865,2011-12-06 11:58:00,90089,PINK CRYSTAL SKULL PHONE CHARM,12,0.19,2.28,17914,United Kingdom
396032,580865,2011-12-06 11:58:00,90089,PINK CRYSTAL SKULL PHONE CHARM,12,0.19,2.28,17914,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [5]:
fig = px.bar(data_UK, x= data_UK.index, y="Revenue")
fig.show()

In [6]:
fig = go.Figure(data=[
    go.Bar(name='Revenue', x=data_UK.index, y=data_UK.Revenue),
    go.Bar(name='Quantity', x=data_UK.index, y=data_UK.Quantity)
])
# Change the bar mode
fig.update_layout(barmode='group')
fig.show()

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [7]:
data_FR = data[(data["InvoiceDate"] >= '2011-01-01') & (data["InvoiceDate"] <= '2011-05-31')]
data_FR = data_FR[(data_FR["Country"] == "France")]
data_FR = data_FR.groupby("InvoiceDate").agg({"Revenue": "sum", "Quantity": "sum"})

In [8]:
data_FR.head()

Unnamed: 0_level_0,Revenue,Quantity
InvoiceDate,Unnamed: 1_level_1,Unnamed: 2_level_1
2011-01-05 12:42:00,502.07,359
2011-01-05 14:48:00,763.11,369
2011-01-06 14:26:00,283.77,261
2011-01-06 16:12:00,425.25,177
2011-01-07 12:07:00,676.16,488


In [9]:
fig = go.Figure(data=[
    go.Line(name='Revenue', x=data_FR.index, y=data_FR.Revenue),
    go.Line(name='Quantity', x=data_FR.index, y=data_FR.Quantity)
])
fig.show()


plotly.graph_objs.Line is deprecated.
Please replace it with one of the following more specific types
  - plotly.graph_objs.scatter.Line
  - plotly.graph_objs.layout.shape.Line
  - etc.




## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [10]:
data_Party = data[(data["Description"] == "PARTY BUNTING")]
data_Party = data_Party.groupby("Country").mean()

In [11]:
fig = px.scatter(data_Party, x=data_Party.Quantity, y=data_Party.UnitPrice, size='Quantity', color=data_Party.index, hover_data=['Revenue'])
fig.show()

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [20]:
data_count = data[data['Country'].isin(['EIRE', 'Germany', 'France', 'Netherlands'])]
quantityperinvoice = data_count.pivot_table(values='Quantity', columns='Country', 
                      index='InvoiceNo', aggfunc='sum')
quantityperinvoice.iplot(kind='hist', xTitle='Quantity of Invoice', 
           yTitle='Amount of invoices', title='Distribution of invoice quantities')

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [23]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

In [59]:
data_count = data[data['Country'].isin(country_list)]
data_count = data_count.pivot_table(values='Revenue', columns=['Description'], 
                      index=['Country'], aggfunc='sum')
fig = go.Figure(data=[
    go.Bar(name="CREAM HANGING HEART T-LIGHT HOLDER", x=data_count.index, y=data_count["CREAM HANGING HEART T-LIGHT HOLDER"]),
    go.Bar(name='JUMBO BAG RED RETROSPOT', x=data_count.index, y=data_count["JUMBO BAG RED RETROSPOT"]),
    go.Bar(name='REGENCY CAKESTAND 3 TIER', x=data_count.index, y=data_count["REGENCY CAKESTAND 3 TIER"])
])
# Change the bar mode
fig.update_layout(barmode='group')
fig.show()

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

In [67]:

dates = [datetime.date(i, i, 1) for i in range(1, 13)]
options = [(i.strftime('%b'), i) for i in dates]
widgets.SelectionRangeSlider(
    options=options,
    index=(0, 11),
    description='Months (2015)',
    disabled=False
)

SelectionRangeSlider(description='Months (2015)', index=(0, 11), options=(('Jan', datetime.date(1, 1, 1)), ('Fâ€¦

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.