# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [8]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
from ipywidgets import interact
cf.go_offline()

In [9]:
data = pd.read_excel('Online Retail.xlsx')
data.head()

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


In [10]:
data.columns

Index(['InvoiceNo', 'InvoiceDate', 'StockCode', 'Description', 'Quantity',
       'UnitPrice', 'Revenue', 'CustomerID', 'Country'],
      dtype='object')

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [11]:
data_withouth_april_england = data[(data['InvoiceDate'] < '2011-4-1') | (data['InvoiceDate'] > '2011-4-30') & (data['Country'] != 'United Kingdom')]
data_2 = data_withouth_april_england.groupby("Country")[['Quantity','Revenue']].sum().reset_index()

In [12]:
data_2.iplot(kind='bar', x='Country', xTitle='Country',
           yTitle='Revenue/Quantity', title='Revenue & Quantity by Country')

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [13]:
france = data[(data.Country == 'France') & (data.InvoiceDate.dt.month >= 1) & (data.InvoiceDate.dt.month <= 5) & (data.InvoiceDate.dt.year == 2011)]

france1 = france.groupby(['InvoiceDate'])['Revenue', 'Quantity'].sum()

france2 = france1.reset_index()

france2.iplot(kind='line', x = 'InvoiceDate', xTitle='Date', yTitle='Total', title='Total quantity and revenue for France')


## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [17]:
party_bunting = data[data.Description == 'PARTY BUNTING']

party_bunting = party_bunting.groupby(['Country'])['Quantity', 'UnitPrice'].mean()
party_bunting = party_bunting.reset_index()
party_bunting.iplot(x='Quantity', y='UnitPrice', categories='Country',
          xTitle='Avg Quantity', yTitle='Avg UnitPrice',
           title='Quantity vs. UnitPrice')

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [20]:
countries = data[(data.Country == 'EIRE') | (data.Country == 'Germany') | 
                 (data.Country == 'France') | (data.Country == 'Netherlands')]

countries = countries.pivot_table(values = 'Quantity', columns = 'Country', index = 'InvoiceNo', aggfunc = 'mean')

countries.iplot(kind='hist', xTitle='Countries', yTitle='Invoice', subplots = True,
           title='Total quantity by country')

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [23]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

In [24]:
data = data[(data['Description'].isin(df3['product'])) & (data['Country'].isin(df3['country']))]
df = data[['Description', 'Country','Revenue']]
table = pd.pivot_table(df, index='Country', columns='Description', values='Revenue', aggfunc='sum')
result = table.reset_index()

result.iplot(kind='bar', x='Country')

NameError: name 'df3' is not defined

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.