# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [2]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
from ipywidgets import interact

cf.go_offline()

In [3]:
data = pd.read_excel('../data/Online Retail.xlsx')

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [4]:
data.head()

april_data = data.loc[data["Country"] != "United Kingdom"]
april_data.index = april_data['InvoiceDate']
april_data = april_data['2011-4'] 


In [5]:
info = april_data[['Quantity','Revenue']]
info.index = april_data['Country']
info.iplot(kind='bar', xTitle='Countries', yTitle='Amount', 
          title='Total Charges Distribution')

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [6]:
data.index = data['InvoiceDate']
france = data.loc[data['Country'] == "France"]['2011-01-01':'2011-05-31'][['Quantity']][:10]
france.iplot(kind='line', xTitle='Countries',y = 'Quantity', yTitle='Amount', 
          title='Total Charges Distribution')
france

Unnamed: 0_level_0,Quantity
InvoiceDate,Unnamed: 1_level_1
2011-04-26 15:52:00,9
2011-01-12 15:00:00,4
2011-02-28 14:45:00,4
2011-01-31 09:57:00,160
2011-03-31 10:27:00,160
2011-04-26 15:52:00,4
2011-05-08 16:10:00,16
2011-05-11 15:07:00,120
2011-05-17 09:28:00,32
2011-01-14 10:42:00,6


## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [7]:
party = data.loc[data['Description'] == "PARTY BUNTING"].groupby('Country').agg({'Quantity':'mean','UnitPrice':'mean'})
party['Country'] = party.index
party
party.iplot(x='UnitPrice', y='Quantity',
           xTitle='Unit Price', yTitle='Quantity', categories = "Country",
           title='Quantity vs. Unit Price of Bounty Party per Country')

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [34]:
four = data.loc[(data['Country'] == 'EIRE')|(data['Country'] == 'Germany')|(data['Country'] == 'France')|(data['Country'] == 'Netherlands')]
four = four.pivot_table(index = 'Country')
eire = data.loc[data['Country'] == 'EIRE']['Quantity']
eire.iplot(kind = "hist")
eire
[data[data.Country == country]['Quantity'].iplot(kind='hist') for country in ["France","EIRE","Germany","Netherlands"]] 

[None, None, None, None]

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [10]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

In [45]:
import plotly.graph_objs as go 

df = data.loc[data['Country'].isin(country_list) & data['Description'].isin(product_list)]
pd.pivot_table(df, index = ['Description','Country'])['Revenue'].iplot(kind = 'bar')

#info = [data.loc[(data['Country']== country) & (data['Description'].isin(product_list))]['Revenue']  for country in country_list]

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

In [27]:
data.head()

Unnamed: 0_level_0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
InvoiceDate,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
2010-12-01 08:26:00,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2010-12-01 09:02:00,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2010-12-01 09:32:00,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2010-12-01 10:19:00,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
2010-12-01 10:39:00,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.