# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [2]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
from ipywidgets import interact

# Put cufflinks into offline mode before any .iplot() call below.
# NOTE(review): presumably this makes charts render locally in the notebook
# instead of going through Chart Studio - confirm against the cufflinks docs.
cf.go_offline()

In [4]:
# Read the Online Retail workbook into the DataFrame that the cells below use.
data = pd.read_excel(io='../data/Online Retail.xlsx')

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [40]:
# Break the invoice timestamp into calendar parts; later cells filter and
# group on these columns.
data['Date'] = data['InvoiceDate'].dt.date
data['Day'] = data['InvoiceDate'].dt.day
data['Month'] = data['InvoiceDate'].dt.month
data['Year'] = data['InvoiceDate'].dt.year

# April 2011 rows for every country except the United Kingdom.
data_exc_uk = data[
    (data['Country'] != 'United Kingdom')
    & (data['Month'] == 4)
    & (data['Year'] == 2011)
]

# Select the two measures with a list: subscripting a groupby with a bare
# tuple ('Quantity', 'Revenue') is deprecated in older pandas and rejected by
# pandas 2.x.
# NOTE(review): no cell visible in this notebook computes 'Revenue'; this
# assumes the workbook already contains that column - confirm.
agg_data = data_exc_uk.groupby('Country')[['Quantity', 'Revenue']].sum()

agg_data.iplot(kind='bar')

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [53]:
# Rows sold to France during 2011 ...
france_data = data[(data['Country'] == 'France') & (data['Year'] == 2011)]
# ... narrowed to January through May. between() is inclusive on both ends,
# so this matches the original Month == 1 | ... | Month == 5 chain.
france_data = france_data[france_data['Month'].between(1, 5)]

# Daily totals. The columns are selected with a list because a bare tuple
# subscript on a groupby is rejected by pandas 2.x.
france_data.groupby('Date')[['Quantity', 'Revenue']].sum().iplot(kind='line')

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [67]:
# Average quantity and unit price of PARTY BUNTING per country.
party_bunting = data[data['Description'] == 'PARTY BUNTING']
# The columns are selected with a list because a bare tuple subscript on a
# groupby is rejected by pandas 2.x. reset_index() turns 'Country' back into a
# column so it can be passed as `categories` below.
party_bunting = (
    party_bunting
    .groupby('Country')[['Quantity', 'UnitPrice']]
    .mean()
    .reset_index()
)

party_bunting.iplot(
    x='Quantity',
    y='UnitPrice',
    categories='Country',
    kind='scatter',
)

# party_bunting.head()

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [76]:
def _quantity_per_invoice(country):
    """Return the summed Quantity per InvoiceNo for rows of `data` in *country*."""
    country_rows = data[data['Country'] == country]
    return country_rows.groupby('InvoiceNo')['Quantity'].sum()


# One Series of per-invoice quantities for each country of interest.
invoice_quant_eire = _quantity_per_invoice('EIRE')
invoice_quant_de = _quantity_per_invoice('Germany')
invoice_quant_fr = _quantity_per_invoice('France')
invoice_quant_nl = _quantity_per_invoice('Netherlands')

# Draw one histogram per country, in the same order as before.
for chart_title, per_invoice in (
    ('EIRE', invoice_quant_eire),
    ('Germany', invoice_quant_de),
    ('France', invoice_quant_fr),
    ('Netherlands', invoice_quant_nl),
):
    per_invoice.iplot(kind='hist', title=chart_title)


## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [79]:
# Product descriptions compared in exercise 5.
product_list = [
    'JUMBO BAG RED RETROSPOT',
    'CREAM HANGING HEART T-LIGHT HOLDER',
    'REGENCY CAKESTAND 3 TIER',
]

# Countries compared in exercise 5.
country_list = [
    'EIRE',
    'Germany',
    'France',
    'Netherlands',
]

In [88]:

# Build ONE grouped ("side-by-side") chart, as the exercise asks, instead of a
# separate chart per product. The filters reuse product_list and country_list
# rather than repeating the four country names inline.
selected_rows = data[
    data['Description'].isin(product_list) & data['Country'].isin(country_list)
]

# Rows are products and columns are countries, so each product shows one bar
# per country. Cells hold the summed revenue.
revenue_by_product = selected_rows.pivot_table(
    index='Description',
    columns='Country',
    values='Revenue',
    aggfunc='sum',
)

revenue_by_product.iplot(
    kind='bar',
    barmode='group',
    title='Revenue by Country for Selected Products',
)
    

## Bonus Questions

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
# Build the DatetimeIndex once and read the three calendar parts from it.
invoice_index = pd.DatetimeIndex(data['InvoiceDate'])
data['Year'] = invoice_index.year
data['Month'] = invoice_index.month
data['Day'] = invoice_index.day

# United Kingdom rows only; the next cell aggregates from this frame.
is_uk = data['Country'] == 'United Kingdom'
uk = data[is_uk]

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
# Per-column aggregation applied to each product's rows: distinct counts for
# invoices and customers, totals for quantity and revenue, mean unit price.
agg_func = dict(
    InvoiceNo='nunique',
    Quantity='sum',
    UnitPrice='mean',
    Revenue='sum',
    CustomerID='nunique',
)

# One row per product description, built from the UK-only frame.
uk_by_product = uk.groupby('Description')
products = uk_by_product.agg(agg_func)

## 8. Create an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the products that contain the entered text in their description.