# Interactive Visualization Lab

Complete the following set of exercises to solidify your knowledge of interactive visualization using Plotly, Cufflinks, and IPyWidgets.

In [None]:
import pandas as pd
import chart_studio.plotly as py
import cufflinks as cf
from ipywidgets import interact

# Enable cufflinks' offline mode before any .iplot() call below.
cf.go_offline()
# NOTE: chart_studio.plotly is imported instead of plotly.plotly because the
# import message suggested that the module had moved into the chart_studio package.

Please download the Online_Retail dataset from [here](https://drive.google.com/file/d/1jD7eQYnfcvbm1ksDbD12U22JtbKItU7E/view?usp=sharing) and place it in the data folder.<br>
Load the data:

In [None]:
# Read the Online Retail workbook from the sibling data folder, then preview
# the first rows.
data = pd.read_excel(io='../data/Online_Retail.xlsx')
data.head(n=5)

## 1. Create an interactive bar chart showing total quantity and revenue by country (excluding United Kingdom) for the month of April 2011.

In [None]:
# Explore the data: list each column's dtype before building the filters below.
data.dtypes

In [None]:
# Total quantity and revenue per country (United Kingdom excluded) for April 2011.
# The upper bound is exclusive on 1 May: a bare '2011-04-30' is compared as
# midnight of that day, which would drop every invoice issued during 30 April.
april_non_uk = data[
    (data['Country'] != 'United Kingdom')
    & (data['InvoiceDate'] >= '2011-04-01')
    & (data['InvoiceDate'] < '2011-05-01')
]

# One row per country, with both measures summed.
april_totals = april_non_uk.groupby('Country', as_index=False).agg(
    {'Quantity': 'sum', 'Revenue': 'sum'}
)

april_totals.iplot(
    kind='bar',
    x='Country',
    xTitle='Country',
    yTitle='Revenue and Quantity',
    title='April 2011 - Total quantity and revenue by country - exc. UK',
)

## 2. Create an interactive line chart showing quantity and revenue sold to France between January 1st and May 31st 2011.

In [None]:
# Invoices shipped to France between 1 January and 31 May 2011 (both inclusive).
is_france = data['Country'] == 'France'
in_window = (
    (data['InvoiceDate'] >= '2011-01-01 00:00:00')
    & (data['InvoiceDate'] <= '2011-05-31 23:59:59')
)
to_france = data[is_france & in_window]

# Sum quantity and revenue per invoice timestamp and draw them as lines.
france_totals = to_france[['InvoiceDate', 'Quantity', 'Revenue']].pivot_table(
    index='InvoiceDate',
    aggfunc='sum',
)
france_totals.iplot(
    kind='line',
    title='Total Quantity and Revenue sold to France between January 1st - May 31st 2011',
)

## 3. Create an interactive scatter plot showing the relationship between average quantity (x-axis) and average unit price (y-axis) for the product PARTY BUNTING with the plot points color-coded by country (categories).

In [None]:
# Mean quantity and mean unit price of PARTY BUNTING, one row per country.
bunting_rows = data[data['Description'] == 'PARTY BUNTING']
party_bunting = (
    bunting_rows[['Country', 'Quantity', 'UnitPrice']]
    .groupby('Country')
    .mean()
    .reset_index()
)

# Scatter of the two means, with points grouped (coloured) by country.
party_bunting.iplot(
    kind='scatter',
    x='Quantity',
    y='UnitPrice',
    categories='Country',
    xTitle='Mean Quantity',
    yTitle='Mean Unit Price',
    title='Party Bunting product - quantity vs avg unit price',
)

## 4. Create a set of interactive histograms showing the distributions of quantity per invoice for the following countries: EIRE, Germany, France, and Netherlands.

In [None]:
# Quantity per invoice, one column per country (EIRE, Germany, France, Netherlands).
# The name is bound to the pivoted table and the plot is drawn in a separate
# statement, so the variable holds the data rather than whatever `.iplot()` returns.
europe_histograms = (
    data[data['Country'].isin(['EIRE', 'Germany', 'France', 'Netherlands'])]
    [['Country', 'InvoiceNo', 'Quantity']]
    .pivot_table(index='InvoiceNo', columns='Country', values='Quantity', aggfunc='sum')
)

# One histogram subplot per country column.
europe_histograms.iplot(kind='hist', subplots=True)

## 5. Create an interactive side-by-side bar chart showing the revenue by country listed below (bars) for each of the products listed below.

In [None]:
# Products compared in the chart.
product_list = [
    'JUMBO BAG RED RETROSPOT',
    'CREAM HANGING HEART T-LIGHT HOLDER',
    'REGENCY CAKESTAND 3 TIER',
]

# Countries to include in the chart.
country_list = [
    'EIRE',
    'Germany',
    'France',
    'Netherlands',
]

In [None]:
# Rows for the selected products sold to the selected countries.
in_scope = data['Country'].isin(country_list) & data['Description'].isin(product_list)
bycountry = data[in_scope][['Country', 'Revenue', 'Description']]

# Revenue summed per country (rows) and product (columns).
# values='Revenue' is passed explicitly so the column labels are the plain
# product names; without it pandas returns two-level (value, product) labels.
revenue_by_country = bycountry.pivot_table(
    index='Country',
    columns='Description',
    values='Revenue',
    aggfunc='sum',
)
revenue_by_country.iplot(kind='bar', title='Revenue per Country per Products')

## 6. Create an interactive line chart showing quantity sold by day for the United Kingdom. Add drop-down boxes for Year and Month that allow you to filter the date range that appears in the chart.

In [None]:
# Calendar parts of the invoice date, used as filter keys for the drop-downs.
invoice_dates = pd.DatetimeIndex(data['InvoiceDate'])  # parsed once, reused below
data['Year'] = invoice_dates.year
data['Month'] = invoice_dates.month
data['Day'] = invoice_dates.day
uk = data[data['Country'] == 'United Kingdom']


# Passing lists to `interact` renders them as drop-down boxes; the values are
# converted to plain ints so the widget options are ordinary Python numbers.
@interact(
    Year=[int(year) for year in sorted(uk['Year'].dropna().unique())],
    Month=[int(month) for month in sorted(uk['Month'].dropna().unique())],
)
def uk_quantity_by_day(Year, Month):
    """Plot the quantity sold per day in the United Kingdom.

    Args:
        Year: Calendar year chosen in the drop-down.
        Month: Calendar month (1-12) chosen in the drop-down.
    """
    selected = uk[(uk['Year'] == Year) & (uk['Month'] == Month)]
    period = '{}-{:02d}'.format(Year, Month)
    if selected.empty:
        # A year/month pair may have no rows; report it instead of plotting
        # an empty frame.
        print('No United Kingdom invoices for {}.'.format(period))
        return
    daily = selected.pivot_table(index='Day', values='Quantity', aggfunc='sum')
    daily.iplot(
        kind='line',
        xTitle='Day of month',
        yTitle='Quantity',
        title='United Kingdom - quantity sold by day ({})'.format(period),
    )

# Bonus challenges

## 7. Create an interactive scatter plot that plots number of invoices (x-axis) vs. number of customers (y-axis) and the plot points represent individual products. Add two sliders that control the x and y axis ranges.

In [None]:
# Per-product aggregation: distinct invoices and customers, total quantity
# and revenue, and mean unit price.
agg_func = dict(
    InvoiceNo='nunique',
    Quantity='sum',
    UnitPrice='mean',
    Revenue='sum',
    CustomerID='nunique',
)

# One row per product description, computed over the United Kingdom subset.
products = uk.groupby(by='Description').aggregate(agg_func)

## 8. Create an interactive bar chart that shows revenue by product description. Add a text field widget that filters the results to show only the products that contain the entered text in their description.