# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [21]:
import pandas as pd
import chart_studio.plotly as py 
import cufflinks as cf
from ipywidgets import interact
import datetime as dt

cf.go_offline()

In [2]:
data = pd.read_excel('/Users/sahivygonalez/Documents/Iron-Hack-Sahivy-Repo/data-labs/module-2/lab-interactive-visualization/data/Online Retail.xlsx')


In [3]:
data.head()

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [37]:
data_no_uk_april_2011 = data[(data['InvoiceDate'].dt.year == 2011) 
                             & (data['InvoiceDate'].dt.month == 4) 
                             & (data['Country'] != 'United Kingdom')]

data_no_uk_april_2011.groupby(['Country'])['Quantity', 'Revenue'].sum().iplot(kind = 'bar')


## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [38]:
data_france_2011 = data[(data['InvoiceDate'].dt.year == 2011) 
                        & (data['InvoiceDate'].dt.month >= 1)
                        & (data['InvoiceDate'].dt.month < 6)
                        & (data['Country'] == 'France')]

In [51]:
data_clean_france = data_france_2011[['Quantity', 'Revenue']].set_index(data_france_2011['InvoiceDate'].dt.month).rename_axis('Month')


Unnamed: 0_level_0,Quantity,Revenue
Month,Unnamed: 1_level_1,Unnamed: 2_level_1
4,9,26.55
1,4,15.0
2,4,34.0
1,160,232.0
3,160,232.0


In [55]:
data_france_2011.groupby(['InvoiceDate'])[['Quantity', 'Revenue']].sum().iplot()


In [60]:
import calendar

data_france_2011['Month'] = data_france_2011['InvoiceDate'].dt.month.map(lambda x: calendar.month_name[x])

data_france_2011.groupby(['Month'])[['Quantity', 'Revenue']].sum().iplot()

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [80]:
import plotly.express as px

data_PB_Q_UP = data[data['Description'] == 'PARTY BUNTING'].groupby(['Country'])['Quantity', 'UnitPrice'].mean()

fig = px.scatter(
    data_PB_Q_UP, 
    x="Quantity", 
    y="UnitPrice", 
    color=data_PB_Q_UP.index,
)

fig.update_layout(title='PARTY BUNTING - Unit Price / Quanitty (by Country)')

fig.show()

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [105]:
data_Q_4 = pd.DataFrame(data[data['Country'].isin(['EIRE', 'Germany', 'France', 'Netherlands'])].groupby(['Country','InvoiceNo'])['Quantity'].sum())

data_Q_4.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,Quantity
Country,InvoiceNo,Unnamed: 2_level_1
EIRE,536540,230
EIRE,536541,12
EIRE,536803,6
EIRE,536890,1548
EIRE,536975,827


In [108]:
fig = px.histogram(data_Q_4, x=data_Q_4.index, y="Quantity", histfunc='avg')
fig.show()

TypeError: Argument 'x' is a pandas MultiIndex. pandas MultiIndex is not supported by plotly express at the moment.

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [None]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

## Bonus Question:

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
from ipywidgets import interact
from bokeh.io import push_notebook, show, output_notebook
from bokeh.plotting import figure
output_notebook()

In [None]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.