# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [230]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
from ipywidgets import interact
import plotly.express as px
cf.go_offline()

In [231]:
data = pd.read_excel('../data/Online Retail.xlsx')
data.head()

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [232]:
withoutUK = data[(data['Country'] != 'United Kingdom')]
withoutUK = withoutUK[(withoutUK['InvoiceDate'] >= '2011-04-01') & (withoutUK['InvoiceDate'] <= '2011-04-30')]
withoutUK = withoutUK.groupby('Country').agg({'Revenue':'sum', 'Quantity':'sum'})
withoutUK.head()

Unnamed: 0_level_0,Revenue,Quantity
Country,Unnamed: 1_level_1,Unnamed: 2_level_1
Australia,421.6,224
Austria,584.78,308
Belgium,1788.48,1170
Brazil,1143.6,356
Channel Islands,243.0,96


In [233]:
country.iplot(kind='bar', xTitle='Whithout UK', yTitle='Revenue and Quantity', 
           title='for the month of April 2011.')

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [234]:
france = data[data['Country']=='France']
france = france[(france['InvoiceDate'] >= '2011-01-01') & (france['InvoiceDate'] <= '2011-05-31')]
france = france.groupby('InvoiceDate').agg({'Revenue':'sum', 'Quantity':'sum'})
france.head()

Unnamed: 0_level_0,Revenue,Quantity
InvoiceDate,Unnamed: 1_level_1,Unnamed: 2_level_1
2011-01-05 12:42:00,502.07,359
2011-01-05 14:48:00,763.11,369
2011-01-06 14:26:00,283.77,261
2011-01-06 16:12:00,425.25,177
2011-01-07 12:07:00,676.16,488


In [235]:
france.iplot(kind='line', xTitle='France', yTitle='Revenue and Quantity', 
           title='Quantity and Revenue sold to France in 2011 Jan-May')

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [236]:
partyBunting = data[data['Description']=='PARTY BUNTING']
partyBunting = partyBunting.groupby('Country').mean()
partyBunting.head()

Unnamed: 0_level_0,InvoiceNo,Quantity,UnitPrice,Revenue,CustomerID
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Australia,554329.625,33.125,4.7125,143.78125,12399.25
Austria,552202.0,8.0,4.95,39.6,12414.0
Belgium,557600.0,4.0,4.95,19.8,12363.0
Channel Islands,561821.666667,13.333333,4.95,66.0,14934.0
Cyprus,553141.333333,2.333333,4.75,10.95,12373.333333


In [237]:
#partyBunting.iplot(x='Quantity', y='UnitPrice', categories='Revenue',
#           xTitle='Quantity', yTitle='UnitPrice',
#           title='')
# No logré que salieran los nombres de los países
fig = px.scatter(partyBunting, x='Quantity', y='UnitPrice', color=partyBunting.index, size='Quantity', hover_data=['Revenue'])
fig.show()

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [238]:
EireGerFraNeth = data[data['Country'].isin(['EIRE', 'Germany', 'France', 'Netherlands'])]
EireGerFraNeth.head()

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
179,539320,2010-12-16 19:16:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,24,2.95,70.8,14911,EIRE
198,539722,2010-12-21 13:45:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,24,2.95,70.8,14911,EIRE
304,541570,2011-01-19 12:34:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,256,2.55,652.8,14646,Netherlands
322,541979,2011-01-24 14:54:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.95,17.7,14911,EIRE
367,542777,2011-02-01 08:31:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.95,17.7,14911,EIRE


In [239]:
EireGerFraNeth = EireGerFraNeth.pivot_table(values='Quantity', columns='Country', 
                      index='InvoiceNo', aggfunc='sum')
EireGerFraNeth.iplot(kind='hist', xTitle='Quantity per Invoice', 
           yTitle='Amount per invoices', title='Quantity per Invoice Distribution')

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [240]:
product_list = ['JUMBO BAG RED RETROSPOT', 
                'CREAM HANGING HEART T-LIGHT HOLDER',
                'REGENCY CAKESTAND 3 TIER']

country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

In [255]:
revByCount = data[(data['Country'].isin(country_list)) & (data['Description'].isin(product_list))]
revByCount = revByCount.pivot_table(columns="Country",index="Description",values="Revenue")
revByCount.iplot(kind='bar', xTitle='Description', 
           yTitle='Revenue', title='Quantity per Invoice Distribution')

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [256]:
data['Year'] = pd.DatetimeIndex(data['InvoiceDate']).year
data['Month'] = pd.DatetimeIndex(data['InvoiceDate']).month
data['Day'] = pd.DatetimeIndex(data['InvoiceDate']).day
uk = data[data['Country']=='United Kingdom']

In [257]:
uk = uk.pivot_table(columns=["Year","Month"],index="Day",values="Quantity")
uk.iplot(kind='line', xTitle ='Day', yTitle='Quantity', title='Sold by Day in UK')

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [259]:
agg_func = {'InvoiceNo':'nunique',
            'Quantity':'sum',
            'UnitPrice':'mean',
            'Revenue':'sum',
            'CustomerID':'nunique'}

products = uk.groupby('Description').agg(agg_func)

KeyError: 'Description'

In [250]:
products.iplot(kind='scatter',)
products = products.pivot_table(values='Quantity', columns=['Year','Month'], index='Day')

NameError: name 'products' is not defined

## 8. Creat an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the product that contain the text entered in their description.