### Heroes Of Pymoli Data Analysis
* Of the 1163 active players, the vast majority are male (84%). There also exists, a smaller, but notable proportion of female players (14%).

* Our peak age demographic falls between 20-24 (44.8%) with secondary groups falling between 15-19 (18.60%) and 25-29 (13.4%).  
-----

In [None]:
# Dependencies and Setup
import pandas as pd
import numpy as np

# File to Load (Remember to Change These)
file_to_load = "Resources/purchase_data.csv"

# Read Purchasing File and store into Pandas data frame
purchase_data = pd.read_csv(file_to_load)
purchase_data.head()


## Total Players

In [None]:
# Count total number of players

purchase_data["SN"].nunique()

TotalPlayers = purchase_data["SN"].nunique()

# Create data frame for total number of players

TotalPlayers_df = pd.DataFrame({"Total Players": [TotalPlayers]})
TotalPlayers_df

## Purchasing Analysis (Total)

In [None]:
# Calculate number of unique items

UniqueItems = purchase_data["Item ID"].unique()
CountOfUniqueItems = pd.DataFrame(UniqueItems).count()
CountOfUniqueItems

# Calculate the average price

AveragePrice = purchase_data["Price"].mean()
AveragePrice

# Calculate the number of number of purchases

NumberOfPurchases = purchase_data["Purchase ID"].value_counts()
SumNumberOfPurchases = NumberOfPurchases.sum()
SumNumberOfPurchases

# Calculate the total revenue

TotalRevenue = purchase_data["Price"].sum()
TotalRevenue

# Create data frame

purchase_analysis = {'Number of Unique Items': CountOfUniqueItems,
                  'Average Price': AveragePrice,
                  'Number of Purchases': SumNumberOfPurchases,
                  'Total Revenue': TotalRevenue}

purchase_analysis_df = pd.DataFrame(purchase_analysis)
purchase_analysis_df


## Gender Demographics

In [None]:
player_demo = purchase_data.loc[:, ["Gender", "SN", "Age"]]
player_demo = player_demo.drop_duplicates()

In [None]:
# Count total number of players


TotalPlayers = player_demo["Gender"].count()
TotalPlayers


In [None]:
# Count  number of male players

MalePlayers = (player_demo["Gender"] == "Male").sum()
MalePlayers


In [None]:
# Count number of female players

FemalePlayers = (player_demo["Gender"] == "Female").sum()
FemalePlayers

In [None]:
# Count number of other players

OtherPlayers = (player_demo["Gender"] == "Other / Non-Disclosed").sum()
OtherPlayers

In [None]:
# Calculate percentage of male players

MalePlayersPercent = round((MalePlayers)/(TotalPlayers)*100)
MalePlayersPercent

In [None]:
# Calculate percentage of female players

FemalePlayersPercent = round((FemalePlayers)/(TotalPlayers)*100)
FemalePlayersPercent

In [None]:
# Calculate percentage of other players

OtherPlayersPercent = round((OtherPlayers)/(TotalPlayers)*100)
OtherPlayersPercent

In [None]:
# Create data frame for gender demographics

gender_demographics = pd.DataFrame({"Gender":["Male", "Female","Other / Non-Disclosed"], "Total Count":[MalePlayers, FemalePlayers, OtherPlayers], "Percentage of Players": [MalePlayersPercent, FemalePlayersPercent, OtherPlayersPercent]})

gender_demographics = gender_demographics.set_index("Gender")
gender_demographics

## Purchasing Analysis (Gender)

In [174]:
# Calculate purchase count

Purchasinggb = purchase_data.groupby(["Gender"])
PurchaseCount = Purchasinggb.count()["Price"]
AveragePurchasePrice = Purchasinggb.mean()["Price"]
TotalPurchaseValue = Purchasinggb.sum()["Price"]
AverageTotalPurchase = TotalPurchaseValue/gender_demographics["Total Count"]

SummaryTable = pd.DataFrame({"Purchase Count": PurchaseCount,
                            "Average Purchase Price": AveragePurchasePrice,
                            "Total Purchase Value": TotalPurchaseValue,
                            "Average Total Purchase per Person": AverageTotalPurchase})

SummaryTable = SummaryTable[["Purchase Count", "Average Purchase Price", "Total Purchase Value", "Average Total Purchase per Person"]]

SummaryTable = SummaryTable.round(2)
SummaryTable

Unnamed: 0_level_0,Purchase Count,Average Purchase Price,Total Purchase Value,Average Total Purchase per Person
Gender,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
Female,113,3.2,361.94,4.47
Male,652,3.02,1967.64,4.07
Other / Non-Disclosed,15,3.35,50.19,4.56


## Age Demographics

In [205]:
# Establish bins for ages

nodupdf = purchase_data.loc[:, ["SN", "Age"]].drop_duplicates()


bins = [0, 9.9, 14.9, 19.9, 24.9, 29.9, 34.9, 39.9, 990]
GroupNames = ['<10', '10-14','15-19','20-24', '25-29','30-34','35-39','40+']



nodupdf["Age Ranges"] = pd.cut(nodupdf ["Age"], bins, labels = GroupNames)
AgeDemographicsTotals = nodupdf ["Age Ranges"].value_counts()
AgeDemographicsPercents = (AgeDemographicsTotals / TotalPlayers * 100).round(2)

# Create data frame 

AgeDemographics = pd.DataFrame({"Age Group Total": AgeDemographicsTotals, "Percentage of Total": AgeDemographicsPercents, })
AgeDemographics.sort_index()

Unnamed: 0,Age Group Total,Percentage of Total
<10,17,2.95
10-14,22,3.82
15-19,107,18.58
20-24,258,44.79
25-29,77,13.37
30-34,52,9.03
35-39,31,5.38
40+,12,2.08


## Purchasing Analysis (Age)

In [219]:
# Bin the purchase_data data frame by age
purchase_data["Ranges"] = pd.cut(purchase_data["Age"], bins, labels = GroupNames)
purchase_data

AgePurchaseData = purchase_data.groupby(['Ranges'])

# Calculate purchase count, avgerage purchase price, avgerage purchase total per person 
PurchaseCount = AgePurchaseData['Purchase ID'].count()
PurchaseCount

AveragePurchasePrice = AgePurchaseData['Price'].mean()
AveragePurchasePrice

TotalPurchase = AgePurchaseData['Price'].sum()
TotalPurchase


AverageTotalPurchase = round(TotalPurchase/AgeDemographics["Age Group Total"],2)
AverageTotalPurchase
 
# Create a summary data frame

SummaryTable = pd.DataFrame({"Purchase Count": PurchaseCount,
                            "Average Purchase Price": AveragePurchasePrice,
                            "Total Purchase Value": TotalPurchase,
                            "Average Total Purchase per Person": AverageTotalPurchase})

SummaryTable = SummaryTable.round(2)
SummaryTable


Unnamed: 0,Purchase Count,Average Purchase Price,Total Purchase Value,Average Total Purchase per Person
<10,23,3.35,77.13,4.54
10-14,28,2.96,82.78,3.76
15-19,136,3.04,412.89,3.86
20-24,365,3.05,1114.06,4.32
25-29,101,2.9,293.0,3.81
30-34,73,2.93,214.0,4.12
35-39,41,3.6,147.67,4.76
40+,13,2.94,38.24,3.19


## Top Spenders

In [216]:
GroupedBySNCountMean =  purchase_data.groupby('SN').agg({'Price': ['count']})
GroupedBySNCountMean.columns = ['Total Count']
GroupedBySNCountMean.sort_values('Total Count', ascending=False).head()

GroupedBySNCountMean2 = purchase_data.groupby('SN').agg({'Price': ['count', 'mean', 'sum']})
GroupedBySNCountMean2.columns = GroupedBySNCountMean2.columns.droplevel(0)
GroupedBySNFinal = GroupedBySNCountMean2.sort_values(['count','mean'], ascending=False).head()
GroupedBySNFinal

Unnamed: 0_level_0,count,mean,sum
SN,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
Lisosia93,5,3.792,18.96
Idastidru52,4,3.8625,15.45
Iral74,4,3.405,13.62
Chamjask73,3,4.61,13.83
Iskadarya95,3,4.366667,13.1


## Most Popular Items

In [236]:
MostPopularItemsdf = purchase_data.loc[:,['Item ID','Item Name','Price']]
MostPopulardfGrp = MostPopularItemsdf.groupby(['Item ID','Item Name'])

purchase_count = MostPopulardfGrp["Item ID"].count()
ItemPrice = MostPopulardfGrp["Price"].mean()
TotalPurchaseValue = MostPopulardfGrp["Price"].sum()
MostPopularItems = pd.DataFrame({"Purchase Count":purchase_count,"Item Price":ItemPrice,"Total Purchase Value": TotalPurchaseValue})
MostPopularItems = MostPopularItems.sort_values("Purchase Count",ascending = False)

MostPopularItems.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,Purchase Count,Item Price,Total Purchase Value
Item ID,Item Name,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
92,Final Critic,13,4.614615,59.99
178,"Oathbreaker, Last Hope of the Breaking Storm",12,4.23,50.76
145,Fiery Glass Crusader,9,4.58,41.22
132,Persuasion,9,3.221111,28.99
108,"Extraction, Quickblade Of Trembling Hands",9,3.53,31.77


## Most Profitable Items

In [243]:
MostProfitableItems = MostPopularItems.sort_values("Total Purchase Value",ascending = False)

MostProfitableItems["Item Price"] = MostProfitableItems["Item Price"].map("${:.2f}".format)
MostProfitableItems["Total Purchase Value"]= MostProfitableItems["Total Purchase Value"].map("${:.2f}".format)
MostProfitableItems.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,Purchase Count,Item Price,Total Purchase Value
Item ID,Item Name,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
92,Final Critic,13,$4.61,$59.99
178,"Oathbreaker, Last Hope of the Breaking Storm",12,$4.23,$50.76
82,Nirvana,9,$4.90,$44.10
145,Fiery Glass Crusader,9,$4.58,$41.22
103,Singed Scalpel,8,$4.35,$34.80
