# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [1]:
import pandas as pd
import plotly.plotly as py
import cufflinks as cf
from ipywidgets import interact

cf.go_offline()

In [2]:
data = pd.read_excel('data/Online Retail.xlsx')

In [3]:
data.columns=[col.lower() for col in data.columns]
data.head()

Unnamed: 0,invoiceno,invoicedate,stockcode,description,quantity,unitprice,revenue,customerid,country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [4]:
# filtering by specific countries and date: 

filtrd_data = data.query('country != "United Kingdom" and (invoicedate >= "2011-4-1" & invoicedate <= "2011-4-30")')
filtrd_data.head()

Unnamed: 0,invoiceno,invoicedate,stockcode,description,quantity,unitprice,revenue,customerid,country
724,549667,2011-04-11 12:20:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.95,17.7,14911,EIRE
807,551163,2011-04-26 15:52:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,9,2.95,26.55,12573,France
3320,550899,2011-04-21 12:07:00,22752,SET 7 BABUSHKA NESTING BOXES,2,8.5,17.0,13505,Switzerland
4880,550527,2011-04-19 10:48:00,84879,ASSORTED COLOUR BIRD ORNAMENT,40,1.69,67.6,12476,Germany
4882,550620,2011-04-19 13:39:00,84879,ASSORTED COLOUR BIRD ORNAMENT,32,1.69,54.08,12585,Germany


In [5]:
# ploting the interactive graph: 

filtrd_data.iplot(kind = 'bar',x='country', y =['quantity', 'revenue'],
                  title='Total Quantity and Revenue by Country (April 2011)' )

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [6]:
# filtering 
month = [1,2,3]
filtrd_data2 = data.query('country == "France" and (invoicedate >= "2011-1-1" & invoicedate <= "2011-3-31")').sort_values(by='invoicedate')
filtrd_data2.head()

Unnamed: 0,invoiceno,invoicedate,stockcode,description,quantity,unitprice,revenue,customerid,country
197951,540178,2011-01-05 12:42:00,21238,RED RETROSPOT CUP,8,0.85,6.8,12681,France
260744,540178,2011-01-05 12:42:00,21224,SET/4 SKULL BADGES,10,1.25,12.5,12681,France
260332,540178,2011-01-05 12:42:00,22348,TEA BAG PLATE RED RETROSPOT,24,0.85,20.4,12681,France
255180,540178,2011-01-05 12:42:00,22892,SET OF SALT AND PEPPER TOADSTOOLS,12,1.25,15.0,12681,France
62505,540178,2011-01-05 12:42:00,21786,POLKADOT RAIN HAT,24,0.42,10.08,12681,France


In [7]:
filtrd_data2.iplot(kind='line',x='invoicedate', y=['quantity', 'revenue'],)

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [None]:
data.groupby()

In [17]:
filter_3 = data.query('description == "PARTY BUNTING"').groupby(by='country', as_index=False).agg({'quantity': 'mean',
                                                                                             'unitprice': 'mean'})

In [25]:
filter_3.iplot(kind='scatter', x='quantity', y='unitprice', categories ='country',
               title = 'PARTY BUNTING quantity X unit price by country',
               xTitle='average quantity', yTitle='average unit price')

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [105]:
country_list = ['EIRE', 'Germany', 'France', 'Netherlands']
filters = [data.query(f'country == "{country}"').groupby(by='invoiceno').agg({'quantity':'sum'}) for country in country_list]

subplot = cf.subplots([filtered.figure(kind='histogram') for filtered in filters], shape=(2,2))
subplot.iplot()

AttributeError: 'dict' object has no attribute 'iplot'

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [None]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.