# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [44]:
import numpy as np
import pandas as pd
import cufflinks as cf
import ipywidgets as widgets
from ipywidgets import interact
import chart_studio.plotly as py
import plotly.graph_objs as go
from IPython.display import display
from plotly.subplots import make_subplots

# Switch cufflinks to plotly's offline mode so the .iplot() calls below render
# inside the notebook (presumably without needing a Chart Studio account -- confirm
# against the installed cufflinks version).
cf.go_offline()

import warnings
# Suppress every Python warning for the rest of the session.
# NOTE(review): this also hides pandas deprecation and SettingWithCopy warnings.
warnings.filterwarnings('ignore')

# IPython magic selecting matplotlib's inline backend; nothing in the cells shown
# here draws with matplotlib directly.
%matplotlib inline

In [3]:
# Read the Online Retail workbook into the DataFrame that every exercise below filters.
df = pd.read_excel(io = '../data/Online Retail.xlsx')

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [21]:
# Keep every non-UK transaction invoiced during April 2011.
# A bare date string compares as midnight of that day, so an inclusive
# `<= '2011-4-30'` would drop any invoice stamped later on 30 April; the upper
# bound is therefore an exclusive "before 1 May".
data = df[df.Country != 'United Kingdom']
data = data.loc[(data.InvoiceDate >= '2011-4-1') & (data.InvoiceDate < '2011-5-1')]

In [38]:
# Sum quantity and revenue per country for the filtered slice and draw the
# two totals as an interactive bar chart.
data.pivot_table(
    index = 'Country',
    values = ['Revenue', 'Quantity'],
    aggfunc = np.sum,
).iplot(
    kind = 'bar',
    title = 'Total Quantity and Revenue',
    xTitle = 'Country',
    color = ['#C24167', '#722C6E'],
)

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [45]:
# French transactions from 1 January through 31 May 2011.
# A bare date string compares as midnight of that day, so an inclusive
# `<= '2011-5-31'` would drop any invoice stamped later on 31 May; the upper
# bound is therefore an exclusive "before 1 June".
data2 = df[df['Country'] == 'France']
data2 = data2.loc[(data2['InvoiceDate'] >= '2011-1-1') & (data2['InvoiceDate'] < '2011-6-1')]

In [47]:
# Sum quantity and revenue per invoice timestamp and draw both series as lines.
pd.pivot_table(data2,
               index = 'InvoiceDate',
               values = ['Revenue', 'Quantity'],
               aggfunc = np.sum
).iplot(kind = 'line',
        xTitle = 'Invoice Date',  # the x axis is the InvoiceDate index, not a country
        color = ['#C24167', '#722C6E'],
        title = 'Total Quantity and Revenue')

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [53]:
# Rows whose product description is exactly PARTY BUNTING.
data3 = df.loc[df['Description'].eq('PARTY BUNTING')]

In [73]:
# Aggregate Quantity and UnitPrice per country (pivot_table's default
# aggregation, the mean) and turn Country back into a regular column so it can
# be used as the plot's category.
data3 = data3.pivot_table(index = 'Country',
                          values = ['Quantity', 'UnitPrice']).reset_index()

In [84]:
# Palette handed to cufflinks for the per-country categories.
colors = [
    '#FF3347', '#FF6347', '#EE824D', '#DF9E53', '#D0B659', '#C2CC5F', '#B5D265',
    '#A8D86B', '#9BE471', '#8DE077', '#7FE67D', '#71E283', '#63DE89', '#55DC8F',
    '#47DA95', '#39D69B', '#2BD2A1', '#1DD8A7', '#0FDDAF', '#FFFFFF',
]

# Average quantity against average unit price, split into categories by country.
data3.iplot(
    title = 'Average by Country',
    x = 'Quantity',
    xTitle = 'Average Quantity',
    y = 'UnitPrice',
    yTitle = 'Average Unit Price',
    categories = 'Country',
    color = colors,
)

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [199]:
# Countries whose per-invoice quantity distributions are compared.
countries = ['EIRE', 'Germany', 'France', 'Netherlands']

# Keep only the transactions from those countries.
data4 = df[df['Country'].isin(countries)]

In [200]:
# Renumber the rows 0..n-1. drop=True discards the old row labels instead of
# inserting them as an extra, unused 'index' column, and reassigning (rather
# than inplace=True) avoids mutating a slice of df and keeps the cell safe to
# run more than once.
data4 = data4.reset_index(drop = True)

In [201]:
# One row per invoice, one column per country, each cell holding the summed
# quantity of that invoice.
data4 = data4.pivot_table(
    index = ['InvoiceNo'],
    columns = ['Country'],
    values = ['Quantity'],
    aggfunc = {'Quantity': np.sum},
)

In [203]:
# Leave the (invoice, country) combinations that do not exist as NaN so they are
# not counted in any histogram. Filling them with the string '0' would turn the
# columns non-numeric and add a spurious pile of zero-quantity invoices to every
# country. Casting to float only makes the column dtype uniform.
data4 = data4.astype('float64')

In [213]:
# One histogram trace per country; title and axis labels added so the figure
# can be read on its own, like the other charts in this notebook.
data4['Quantity'].iplot(kind = 'histogram',
                        title = 'Quantity per Invoice by Country',
                        xTitle = 'Quantity per Invoice',
                        yTitle = 'Number of Invoices')

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [244]:
# Countries (bars) and products (one bar group member each) compared in this exercise.
countries = ['EIRE', 'Germany', 'France', 'Netherlands']

products = [
    'JUMBO BAG RED RETROSPOT',
    'CREAM HANGING HEART T-LIGHT HOLDER',
    'REGENCY CAKESTAND 3 TIER',
]

In [245]:
# Transactions that involve one of the selected products AND one of the
# selected countries, expressed as a single combined row mask.
wanted_product = df.Description.isin(products)
wanted_country = df.Country.isin(countries)
data5 = df.loc[wanted_product & wanted_country]

In [246]:
# Revenue summed per country (rows) and product description (columns).
data5 = data5.pivot_table(
    index = 'Country',
    columns = 'Description',
    values = 'Revenue',
    aggfunc = {'Revenue': np.sum},
)

In [247]:
# Move Country out of the index into a regular column so it can be passed as x below.
data5 = data5.reset_index()

In [248]:
# Bar chart with one group per country and one bar per remaining (product) column.
data5.iplot(
    kind = 'bar',
    title = 'Revenue by Country',
    x = 'Country',
    xTitle = 'Country',
    yTitle = 'Revenue',
)

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. 

In [113]:
# Quantity sold per day in the United Kingdom, drawn as a line chart.
data6 = df[df['Country'] == 'United Kingdom']

# Truncate every invoice timestamp to its calendar day so that all invoices of
# one day fall into the same pivot row; pivoting on the raw timestamps would
# yield one point per distinct timestamp rather than one per day.
data6 = data6.assign(InvoiceDate = pd.to_datetime(data6['InvoiceDate']).dt.normalize())

data6 = pd.pivot_table(data6,
                       index = 'InvoiceDate',
                       values = 'Quantity',
                       aggfunc = np.sum)

# The exercise asks for a line chart (not bars).
data6.iplot(kind = 'line',
            title = 'United Kingdom: Quantity Sold by Day',
            xTitle = 'Invoice Date',
            yTitle = 'Quantity')

### Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [166]:
def plot_uk_quantity(year, month):
    """Draw the United Kingdom quantity line chart for one calendar month.

    Parameters
    ----------
    year : int
        Calendar year chosen in the Year drop-down.
    month : int
        Calendar month (1-12) chosen in the Month drop-down.

    Reads the module-level ``data6`` frame (Quantity indexed by InvoiceDate).
    Prints a short notice instead of plotting when the period has no rows.
    """
    when = pd.to_datetime(data6.index)
    selected = data6[(when.year == year) & (when.month == month)]
    if selected.empty:
        print('No United Kingdom sales recorded for {}-{:02d}.'.format(year, month))
        return
    selected.iplot(kind = 'line',
                   title = 'United Kingdom: Quantity Sold, {}-{:02d}'.format(year, month),
                   xTitle = 'Invoice Date',
                   yTitle = 'Quantity')


# Offer only the years that actually occur in the data; plain ints keep the
# drop-down values comparable with the index's year numbers.
uk_years = sorted({int(y) for y in pd.to_datetime(data6.index).year})

# Trailing semicolon keeps the notebook from echoing interact()'s return value.
interact(plot_uk_quantity,
         year = widgets.Dropdown(options = uk_years, description = 'Year:'),
         month = widgets.Dropdown(options = list(range(1, 13)), description = 'Month:'));

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. 

In [6]:
# Per product description: how many distinct invoices and how many distinct
# customers it appears with. Built as one chain so the cell can be re-run
# without mutating an earlier result in place.
data7 = (df[['InvoiceNo', 'CustomerID', 'Description']]
         .pivot_table(index = 'Description',
                      values = ['InvoiceNo', 'CustomerID'],
                      aggfunc = 'nunique')
         .reset_index())

# After the pivot the InvoiceNo / CustomerID columns hold distinct counts, not
# identifiers, so the axes are labelled explicitly.
data7.iplot(x = 'InvoiceNo',
            y = 'CustomerID',
            categories = 'Description',
            title = 'Invoices vs. Customers by Product',
            xTitle = 'Number of Invoices',
            yTitle = 'Number of Customers')

### Add two sliders that control the x and y axis ranges.

In [77]:
def plot_products(x_range, y_range):
    """Draw the invoices-vs-customers scatter with slider-controlled axis ranges.

    Parameters
    ----------
    x_range : tuple of int
        (lower, upper) bounds for the number-of-invoices axis.
    y_range : tuple of int
        (lower, upper) bounds for the number-of-customers axis.

    Reads the module-level ``data7`` frame (one row per product description).
    """
    # A single marker trace with the description as hover text keeps redraws
    # cheap; asFigure=True asks cufflinks for the figure object instead of
    # rendering it, so the axis ranges can be set before it is shown.
    fig = data7.iplot(kind = 'scatter',
                      mode = 'markers',
                      x = 'InvoiceNo',
                      y = 'CustomerID',
                      text = 'Description',
                      title = 'Invoices vs. Customers by Product',
                      xTitle = 'Number of Invoices',
                      yTitle = 'Number of Customers',
                      asFigure = True)
    fig.update_xaxes(range = list(x_range))
    fig.update_yaxes(range = list(y_range))
    fig.show()


# Slider limits follow the data so the full range is reachable.
max_invoices = int(data7['InvoiceNo'].max())
max_customers = int(data7['CustomerID'].max())

# continuous_update=False redraws only when a slider handle is released.
# Trailing semicolon keeps the notebook from echoing interact()'s return value.
interact(plot_products,
         x_range = widgets.IntRangeSlider(value = [0, max_invoices],
                                          min = 0,
                                          max = max_invoices,
                                          description = 'Invoices:',
                                          continuous_update = False),
         y_range = widgets.IntRangeSlider(value = [0, max_customers],
                                          min = 0,
                                          max = max_customers,
                                          description = 'Customers:',
                                          continuous_update = False));

## 8. Create an interactive bar chart that shows revenue by product description. 

In [17]:
# Total revenue per product description, with Description kept as a regular
# column so it can be used as the x axis and filtered by text later on.
# Built as one chain so the cell can be re-run without in-place mutation.
data8 = (df[['Revenue', 'Description']]
         .pivot_table(index = 'Description',
                      values = 'Revenue',
                      aggfunc = np.sum)
         .reset_index())

# Title and axis labels added so the figure can be read on its own, like the
# other charts in this notebook.
data8.iplot(kind = 'bar',
            x = 'Description',
            y = 'Revenue',
            title = 'Revenue by Product',
            xTitle = 'Description',
            yTitle = 'Revenue')

### Add a text field widget that filters the results to show the product that contain the text entered in their description.

In [161]:
def filter_data(description):
    """Plot revenue for the products whose description contains the given text.

    Parameters
    ----------
    description : str
        Text typed into the widget. It is matched case-insensitively and as a
        literal substring; an empty string matches every product.

    Reads the module-level ``data8`` frame (columns 'Description' and 'Revenue').
    Prints a short notice instead of plotting when nothing matches.
    """
    # regex=False: the text is user input, and partially typed patterns such as
    # '(' or '[' are not valid regular expressions and would raise re.error.
    matches = data8['Description'].str.contains(description,
                                                case = False,
                                                regex = False)
    filtered_data = data8[matches]

    # Nothing to draw: say so rather than handing an empty frame to the plotter.
    if filtered_data.empty:
        print('No product description contains {!r}.'.format(description))
        return

    filtered_data.iplot(kind = 'bar',
                        x = 'Description',
                        y = 'Revenue',
                        title = 'Revenue by Product',
                        xTitle = 'Description',
                        yTitle = 'Revenue')

# Free-text input that starts empty; its current value is passed to
# filter_data as the `description` argument.
text_widget = widgets.Text(description = 'Description:', value = '')

# Bind the text box to filter_data; as the cell's last expression the returned
# interactive container is what the notebook displays.
widgets.interactive(filter_data, description = text_widget)

interactive(children=(Text(value='', description='Description:'), Output()), _dom_classes=('widget-interact',)…