# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [1]:
import pandas as pd
import numpy as np
import plotly.plotly as py
import cufflinks as cf
from ipywidgets import interact

cf.go_offline()

In [2]:
data = pd.read_excel('Online Retail.xlsx')
print(data.shape)
data.head()

(396034, 9)


Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [3]:
lst = []
for i in range(len(data["InvoiceDate"])):
    if "2011-04" in str(data["InvoiceDate"][i]):
        lst.append(i)

In [4]:
data04 = data.loc[lst]

In [5]:
data_no_UK = data04[data["Country"] != "United Kingdom"]
df = data_no_UK.pivot_table(index = "Country", values = ["Quantity", "Revenue"], aggfunc="sum")
df.head()


Boolean Series key will be reindexed to match DataFrame index.



Unnamed: 0_level_0,Quantity,Revenue
Country,Unnamed: 1_level_1,Unnamed: 2_level_1
Australia,224,421.6
Austria,308,584.78
Belgium,1170,1788.48
Brazil,356,1143.6
Channel Islands,96,243.0


In [6]:
df = df.reset_index()

In [7]:
df.iplot(kind='bar', x='Country', xTitle='Country',
           yTitle='Quantity and Revenue', title='Total Quantity and Revenue by Country(excl.UK) in April 2011')

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [8]:
lst1 = []
for i in range(len(data["InvoiceDate"])):
    if "2011-01" in str(data["InvoiceDate"][i]):
        lst1.append(i)
    elif "2011-02" in str(data["InvoiceDate"][i]):
        lst1.append(i)
    elif "2011-03" in str(data["InvoiceDate"][i]):
        lst1.append(i)
    elif "2011-04" in str(data["InvoiceDate"][i]):
        lst1.append(i)   
    elif "2011-05" in str(data["InvoiceDate"][i]):
        lst1.append(i) 

In [9]:
data010511 = data.loc[lst1].reset_index()

In [10]:
data010511["InvoiceDate"] =data010511["InvoiceDate"].dt.date

In [11]:
data_Fr = data010511[data["Country"] == "France"]
df2 = data_Fr.pivot_table(index = "InvoiceDate", values = ["Quantity", "Revenue"], aggfunc="sum")
df2.head()


Boolean Series key will be reindexed to match DataFrame index.



Unnamed: 0_level_0,Quantity,Revenue
InvoiceDate,Unnamed: 1_level_1,Unnamed: 2_level_1
2011-01-04,143,316.05
2011-01-05,327,482.37
2011-01-06,131,328.05
2011-01-07,649,1040.15
2011-01-09,310,729.14


In [12]:
df2 = df2.reset_index()

In [13]:
df2.iplot(kind='line', x='InvoiceDate', xTitle='Date and Time',
           yTitle='Quantity and Revenue', title='France Total Quantity and Revenue January through May 2011')

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [14]:
data3 = data[data["Description"]=="PARTY BUNTING"]

In [15]:
party_bunting = data3.pivot_table(index = "Country", values= ["Quantity", "UnitPrice"], aggfunc="mean")

In [16]:
party_bunting = party_bunting.reset_index()

In [17]:
party_bunting.head()

Unnamed: 0,Country,Quantity,UnitPrice
0,Australia,33.125,4.7125
1,Austria,8.0,4.95
2,Belgium,4.0,4.95
3,Channel Islands,13.333333,4.95
4,Cyprus,2.333333,4.75


In [18]:
party_bunting.iplot(x='Quantity', y='UnitPrice', categories='Country', xTitle='Average Quantity', 
           yTitle='Average Unit Price', title='PARTY BUNTING Average Quantity vs Average Unit Price by Country')

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [30]:
lst4 = ["EIRE","Germany","France","Netherlands"]
data4=data[data['Country'].isin(lst4)]

In [33]:
data4pv = data4.pivot_table(index="InvoiceNo", columns="Country", values="Quantity", aggfunc='sum' )

In [36]:
data4pv.iplot(kind='hist', histnorm='percent', subplots=True, xTitle='Quantity',
yTitle='percent', title='Quantity per invoice')

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [37]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

In [43]:
data5 = data[data["Country"].isin(country_list) & data["Description"].isin(product_list)]

In [51]:
data5pv = data5.pivot_table(index="Country", columns="Description", values="Revenue", aggfunc="sum")
data5pv

Description,CREAM HANGING HEART T-LIGHT HOLDER,JUMBO BAG RED RETROSPOT,REGENCY CAKESTAND 3 TIER
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
EIRE,2740.8,278.72,7388.55
France,131.75,903.37,2816.85
Germany,35.4,1072.76,9061.95
Netherlands,1167.0,3468.0,3166.35


In [52]:
data5pv = data5pv.reset_index()
data5pv

Description,Country,CREAM HANGING HEART T-LIGHT HOLDER,JUMBO BAG RED RETROSPOT,REGENCY CAKESTAND 3 TIER
0,EIRE,2740.8,278.72,7388.55
1,France,131.75,903.37,2816.85
2,Germany,35.4,1072.76,9061.95
3,Netherlands,1167.0,3468.0,3166.35


In [53]:
data5pv.iplot(kind='bar', x='Country', xTitle='Country', 
           yTitle='Revenue', title='Revenue by Product')

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [58]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

In [62]:
data6 =uk.pivot_table(index='Day', values='Quantity', aggfunc='sum')

In [65]:
data6=data6.reset_index()

In [70]:
fig = data6.iplot(kind='line', x='Day', xTitle='Date', color='blue',
           yTitle='Quantiy', title='UK Quantity Sold by Day')

In [88]:
updatemenus = list(
      list(
        y = 0.8,
        buttons = list([

          dict(method = "restyle",
               args = ["Year", 2010],
               label = "2010"),

          dict(method = "restyle",
               args = ["Year", 2011],
               label = "2011")])),

      list(
        y = 0.7,
        buttons = list(
          list(method = "restyle",
               args = list("Month", 1),
               label = "1"),
          list(method = "restyle",
               args = list("Month", 2),
               label = "2"),
          list(method = "restyle",
               args = list("Month", 3),
               label = "3"),
          list(method = "restyle",
               args = list("Month", 4),
               label = "4"),
          list(method = "restyle",
               args = list("Month", 5),
               label = "5"),
          list(method = "restyle",
               args = list("Month", 6),
               label = "6"),
          list(method = "restyle",
               args = list("Month", 7),
               label = "7"),
          list(method = "restyle",
               args = list("Month", 8),
               label = "8"),
          list(method = "restyle",
               args = list("Month", 9),
               label = "9"),
          list(method = "restyle",
               args = list("Month", 10),
               label = "10"),
          list(method = "restyle",
               args = list("Month", 11),
               label = "11"),
          list(method = "restyle",
               args = list("Month", 12),
               label = "12"))),
)

TypeError: list() takes no keyword arguments

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.

In [None]:
from plotly import graph_objs as go
fig = go.Figure(data=go.Bar(x=[1, 2, 3], y=[1, 3, 2]))
button_layer_1_height = 1.08
fig.update_layout(
    updatemenus=[
        go.layout.Updatemenu(
            buttons=list([
                dict(
                    args=["Year", "2010"],
                    label="2010",
                    method="restyle"
                ),
                dict(
                    args=["Year", "2011"],
                    label="2011",
                    method="restyle"
                ),
            ]),
            direction="down",
            pad={"r": 10, "t": 10},
            showactive=True,
            x=0.1,
            xanchor="left",
            y=button_layer_1_height,
            yanchor="top"
        ),
        go.layout.Updatemenu(
            buttons=list([
                dict(
                    args=["Month", 1],
                    label="1",
                    method="restyle"
                ),
                dict(
                    args=["Month", 2],
                    label="2",
                    method="restyle"
                ),
                dict(
                    args=["Month", 3],
                    label="3",
                    method="restyle"
                ),
                dict(
                    args=["Month", 4],
                    label="4",
                    method="restyle"
                ),
                dict(
                    args=["Month", 5],
                    label="5",
                    method="restyle"
                ), 
                dict(
                    args=["Month", 6],
                    label="6",
                    method="restyle"
                ), 
                dict(
                    args=["Month", 7],
                    label="7",
                    method="restyle"
                ), 
                dict(
                    args=["Month", 8],
                    label="8",
                    method="restyle"
                ),
                dict(
                    args=["Month", 9],
                    label="9",
                    method="restyle"
                ),
                dict(
                    args=["Month", 10],
                    label="10",
                    method="restyle"
                ),
                dict(
                    args=["Month", 11],
                    label="11",
                    method="restyle"
                ),
                dict(
                    args=["Month", 12],
                    label="12",
                    method="restyle"
                ),
            ]),
            direction="down",
            pad={"r": 10, "t": 10},
            showactive=True,
            x=0.37,
            xanchor="left",
            y=button_layer_1_height,
            yanchor="top"
        ),
    ]
)

fig.update_layout(
    annotations=[
        go.layout.Annotation(text="colorscale", x=0, xref="paper", y=1.06, yref="paper",
                             align="left", showarrow=False),
        go.layout.Annotation(text="Reverse<br>Colorscale", x=0.25, xref="paper", y=1.07,
                             yref="paper", showarrow=False)
    ])