In [6]:
# For the second part, we will look at the whole picture of the funnel conversion 
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.dates as mdates
import seaborn as sns
from matplotlib import rcParams
# Have matplotlib lay out figure contents automatically.
rcParams['figure.autolayout'] = True

# Keep DataFrame previews compact: at most 10 columns, 350 characters wide.
pd.options.display.max_columns = 10
pd.options.display.width = 350

# Load the cleaned funnel dataset and preview its first 10 rows.
data = pd.read_csv('Funnel_Analysis_Data/processed/funnel_cleaned.csv')
data.head(10)

Unnamed: 0.1,Unnamed: 0,user_id,date,device,sex,page_home,page_search,page_payment,page_confirmation
0,0,450007,2015-02-28,Desktop,Female,1,0,0,0
1,1,756838,2015-01-13,Desktop,Male,1,0,0,0
2,2,568983,2015-04-09,Desktop,Male,1,1,0,0
3,3,190794,2015-02-18,Desktop,Female,1,1,0,0
4,4,537909,2015-01-15,Desktop,Male,1,0,0,0
5,5,993454,2015-03-03,Desktop,Male,1,0,0,0
6,6,377150,2015-04-15,Desktop,Female,1,1,0,0
7,7,137258,2015-01-27,Mobile,Male,1,0,0,0
8,8,608249,2015-04-12,Desktop,Female,1,0,0,0
9,9,615615,2015-02-24,Mobile,Female,1,1,0,0


In [7]:
# Overall conversion rate by sex: mean of page_confirmation plus the group size.
# The aggregations are passed as a list rather than a set: set iteration order for
# strings is not stable between interpreter runs, so the column order of the result
# could change from one kernel session to the next. The list pins it to mean, count.
print(data.groupby('sex')['page_confirmation'].agg(['mean', 'count']))

            mean  count
sex                    
Female  0.005347  45075
Male    0.004655  45325


In [11]:
from scipy import stats
# Statistical test of conversion rate vs. sex: two-sample t-test without assuming
# equal variances (equal_var=False), comparing Female rows against all other rows.
test = stats.ttest_ind(
    data.loc[data['sex'] == 'Female', 'page_confirmation'],
    data.loc[data['sex'] != 'Female', 'page_confirmation'],
    equal_var=False,
)

# t statistic of the test
print(test.statistic)


1.473291657657286


In [12]:
# Interaction of device and sex: conversion rate (mean of page_confirmation) and
# group size for every device/sex combination.
# The aggregations are passed as a list rather than a set: set iteration order for
# strings is not stable between interpreter runs, so the column order of the result
# could change from one kernel session to the next. The list pins it to mean, count.
print(data.groupby(['device', 'sex'])['page_confirmation'].agg(['mean', 'count']))

                    mean  count
device  sex                    
Desktop Female  0.002467  29997
        Male    0.002516  30203
Mobile  Female  0.011076  15078
        Male    0.008927  15122


In [8]:
# Desktop has far more users than mobile (roughly twice as many), but a much lower conversion rate. Having fewer mobile visitors than desktop visitors is pretty worrisome.
# Pretty much all healthy tech companies should have more mobile users than desktop users, so growing mobile should be a top priority for the company as a whole.


# There are a couple of ways to explain the lower conversion rate on desktop:
# Product: desktop has a worse product, so the product team should look into the differences between the two platforms to see whether the UX/UI can be improved on desktop.

# Marketing: the two platforms are attracting different kinds of users, so device just acts as a proxy for the user mix. For instance, mobile may not have become popular yet and so has mostly power users, who naturally convert at a much higher rate. Alternatively, desktop may be spending a lot on ads, and these ads are attracting lower-intent users.
# If we had more data about the users, we could find out whether the user distribution is the same across devices (in which case it is most likely a product problem) or not (in which case it is a marketing problem). The marketing explanation has the advantage of also explaining the strangely low absolute count of mobile users.

# All key metrics for both devices have actually gone down a lot in the last few months. However, all of the drops appear to happen on specific days and on one specific page.
# This kind of behavior is often the sign of a bug (more likely) or of a bad product change (which at the end of the day is basically a bug too, just a product bug instead of an engineering bug). The usual analysis steps for finding out why a metric suddenly dropped should be carried out here.


# It is hard to say without more information about the site, but the funnel numbers across the board don't look particularly good. For instance,
# even before the bug, at most 20% of users go from the search page to the payment page, even though these are clearly users with some sort of intent. It could be interesting to look into the characteristics of the search queries to see whether people are constantly looking for something they cannot find; essentially, trying to understand where supply falls short of user demand.