# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [77]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
from ipywidgets import interact
import plotly.graph_objects as go
import plotly.express as px
from ipywidgets import interact

# Put cufflinks in offline mode so the .iplot() calls below render inside the notebook.
cf.go_offline()

In [2]:
# Read the Online Retail workbook into the DataFrame used by the exercises below.
data = pd.read_excel(io='../Data/Online Retail.xlsx')

In [3]:
# Preview the first five rows to check the columns that were loaded.
data.head(n=5)

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country
0,536365,2010-12-01 08:26:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
1,536373,2010-12-01 09:02:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
2,536375,2010-12-01 09:32:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.55,15.3,17850,United Kingdom
3,536390,2010-12-01 10:19:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,64,2.55,163.2,17511,United Kingdom
4,536394,2010-12-01 10:39:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,32,2.55,81.6,13408,United Kingdom


## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [4]:
# Exercise 1 data prep: non-UK sales in April 2011, totalled per country.
# Both masks are built from `data` and applied in a single .loc call, so the
# boolean index always has the same index as the frame being filtered.
is_export = data.Country != 'United Kingdom'
in_april_2011 = (data.InvoiceDate >= '2011-04-01 00:00:00') & (data.InvoiceDate < '2011-05-01 00:00:00')
data_april_2011 = data.loc[is_export & in_april_2011]

# Sum only the two measures that get plotted. A blanket .sum() would also try
# to add up InvoiceDate and the text columns, which is meaningless and raises
# TypeError on pandas >= 2.0 (numeric_only now defaults to False).
data_group = (
    data_april_2011
    .groupby('Country')[['Quantity', 'Revenue']]
    .sum()
    .sort_values(by='Revenue', ascending=False)
    .reset_index()
)

In [5]:

# Grouped bars per country: one trace for Quantity, one for Revenue.
countries = data_group.Country
bar_traces = [
    go.Bar(name=measure, x=countries, y=data_group[measure])
    for measure in ('Quantity', 'Revenue')
]

fig = go.Figure(data=bar_traces)
fig.update_layout(barmode='group')
fig.show()

In [6]:
# Same comparison through cufflinks: Revenue and Quantity plotted as bars against Country.
d = data_group.loc[:, ['Revenue', 'Quantity', 'Country']]

d.iplot(
    kind='bar',
    x='Country',
    title='Plot',
    xTitle='Country',
    yTitle='Quantity and Revenue',
)

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [7]:
# Exercise 2 data prep: French sales from 2011-01-01 up to (not including) 2011-06-01.
is_france = data.Country == 'France'
in_jan_to_may = (data.InvoiceDate >= '2011-01-01 00:00:00') & (data.InvoiceDate < '2011-06-01 00:00:00')

# Aggregate only the plotted measures per timestamp. Summing the text columns
# (Description, StockCode, Country) is meaningless and can raise on pandas >= 2.0.
df_france = (
    data.loc[is_france & in_jan_to_may]
    .groupby(by=['InvoiceDate'])[['Revenue', 'Quantity']]
    .sum()
    .reset_index()
)

df_france2 = df_france[['Revenue', 'Quantity', 'InvoiceDate']]

df_france2.iplot(x='InvoiceDate', xTitle='Dates',
                 yTitle='Quantity and Revenue',
                 title='France: Quantity and Revenue, January-May 2011')

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [14]:
# Exercise 3: average quantity vs. average unit price of PARTY BUNTING, one point per country.
d_party = data[data.Description == 'PARTY BUNTING']

# Average only the two plotted measures. A blanket .mean() also hits the text
# columns, which raises TypeError on pandas >= 2.0.
d_partyMean = d_party.groupby(['Country'])[['Quantity', 'UnitPrice']].mean().reset_index()

# mode='markers' requests points rather than connected lines, making the
# scatter-plot intent explicit.
d_partyMean.iplot(x='Quantity', y='UnitPrice', categories='Country', mode='markers',
                  xTitle='Quantity', yTitle='Unit Price')

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [26]:
# Exercise 4: one histogram per country of the total quantity on each invoice.
lista = ['EIRE', 'Germany', 'France', 'Netherlands']
for e in lista:
    d_set = data[data.Country == e]
    # An invoice can span several rows (one per product line), so add the rows
    # up per InvoiceNo first; plotting d_set.Quantity directly would show the
    # distribution of quantity per row instead of per invoice.
    d_set.groupby('InvoiceNo')['Quantity'].sum().iplot(kind='hist', title=e)

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [53]:
product_list = [
    'JUMBO BAG RED RETROSPOT',
    'CREAM HANGING HEART T-LIGHT HOLDER',
    'REGENCY CAKESTAND 3 TIER',
]
country_list = ['EIRE', 'Germany', 'France', 'Netherlands']

# Keep only the rows whose country and product are both in the lists above.
in_countries = data.Country.isin(country_list)
in_products = data.Description.isin(product_list)
new_data = data.loc[in_countries & in_products]
new_data.head()

Unnamed: 0,InvoiceNo,InvoiceDate,StockCode,Description,Quantity,UnitPrice,Revenue,CustomerID,Country,Year,Month,Day
179,539320,2010-12-16 19:16:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,24,2.95,70.8,14911,EIRE,2010,12,16
198,539722,2010-12-21 13:45:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,24,2.95,70.8,14911,EIRE,2010,12,21
304,541570,2011-01-19 12:34:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,256,2.55,652.8,14646,Netherlands,2011,1,19
322,541979,2011-01-24 14:54:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.95,17.7,14911,EIRE,2011,1,24
367,542777,2011-02-01 08:31:00,85123A,CREAM HANGING HEART T-LIGHT HOLDER,6,2.95,17.7,14911,EIRE,2011,2,1


In [56]:
# Revenue totals laid out as one row per country and one column per product.
df_pivot = new_data.pivot_table(
    index='Country',
    columns='Description',
    values='Revenue',
    aggfunc='sum',
)
df_pivot = df_pivot.reset_index()
display(df_pivot)

Description,Country,CREAM HANGING HEART T-LIGHT HOLDER,JUMBO BAG RED RETROSPOT,REGENCY CAKESTAND 3 TIER
0,EIRE,2740.8,278.72,7388.55
1,France,131.75,903.37,2816.85
2,Germany,35.4,1072.76,9061.95
3,Netherlands,1167.0,3468.0,3166.35


In [57]:
# Bar chart of the pivot: countries on the x-axis, product columns as the series.
df_pivot.iplot(
    kind='bar',
    x='Country',
    title='Revenues',
    xTitle='Countries',
    yTitle='Revenue',
)

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [58]:
# Split InvoiceDate into calendar parts; the DatetimeIndex is built once and reused.
invoice_dates = pd.DatetimeIndex(data['InvoiceDate'])
data['Year'] = invoice_dates.year
data['Month'] = invoice_dates.month
data['Day'] = invoice_dates.day

# UK-only rows, used by the exercises below.
uk = data.loc[data['Country'] == 'United Kingdom']

In [80]:
@interact(Selection=['Year', 'Month', 'Day'])
def linechart(Selection):
    """Plot total UK quantity sold, grouped by the chosen date part.

    Parameters
    ----------
    Selection : str
        Column of ``uk`` to group by: 'Year', 'Month' or 'Day'. The value
        comes from the drop-down that ``interact`` builds from the options
        list in the decorator.
    """
    # NOTE(review): the exercise text asks for separate Year and Month filters;
    # this keeps the existing single drop-down interface.

    # aggfunc='sum' gives the quantity sold. pivot_table's default aggregation
    # is the mean, which would plot the average quantity per row instead.
    uk_pivot = uk.pivot_table(values='Quantity', index=Selection,
                              aggfunc='sum').reset_index()

    # Axis labels and title name what is actually plotted: Quantity against
    # the selected date part.
    uk_pivot.iplot(kind='line', x=Selection, xTitle=Selection,
                   yTitle='Quantity', title='Quantity by ' + Selection.title())
    
    




interactive(children=(Dropdown(description='Selection', options=('Year', 'Month', 'Day'), value='Year'), Outpu…

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [87]:
# Per-product aggregation rules: distinct invoices and customers, total
# quantity and revenue, average unit price.
agg_func = dict(
    InvoiceNo='nunique',
    Quantity='sum',
    UnitPrice='mean',
    Revenue='sum',
    CustomerID='nunique',
)

by_description = uk.groupby('Description')
products = by_description.agg(agg_func).reset_index()

In [86]:
# Invoices (x) vs. customers (y), categorised by product description.
products.iplot(
    x='InvoiceNo',
    y='CustomerID',
    categories='Description',
    xTitle='InvoiceNo',
    yTitle='Customers',
)

## 8. Create an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show the products that contain the text entered in their description.