# Exploratory Data Analysis

## Initial Setup and Data Load

In [1]:
# ---------------- Basic Data Science Libraries ---------------- #
import numpy as np # Linear algebra
import pandas as pd # Data processing

# ---------------- System Libraries ---------------- #
import os # Miscellaneous operating system interfaces
import gc # Garbage collector interface
from subprocess import check_output # Runs an external command and returns its captured output as bytes

# ---------------- Plotting Libraries ---------------- #
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline

# ---------------- Showing every column when a frame is displayed ---------------- #
# None lifts pandas' cap on how many columns are rendered.
pd.options.display.max_columns = None

# ---------------- Printing files in my clean data folder ---------------- #
# Listed with os.listdir instead of shelling out to `ls`, so the cell does not
# need an external `ls` binary. Dotfiles are skipped and the names are sorted
# so the listing matches what a plain `ls` would show.
print('\n'.join(sorted(
    name for name in os.listdir('../Data/Clean') if not name.startswith('.')
)))

ability_ids.csv
ability_upgrades.csv
chat.csv
eng_chat.csv
hero_ids.csv
item_ids.csv
matches.csv
mmr.csv
objectives.csv
patch_dates.csv
player_time.csv
players.csv
positions.csv
prev_outcomes.csv
purchase_log.csv
regions.csv
teamfights.csv
teamfights_players.csv
test_outcomes.csv
test_players.csv
trueskill.csv



In [3]:
# Read the cleaned players table; the first CSV column is used as the index
file_path = '../Data/Clean/players.csv'
players = pd.read_csv(file_path, index_col=0)

# Report the size of what was loaded (rows, then columns), with thousands separators
print(
    f'{file_path}:',
    '{:,} observations, {:,} features'.format(*players.shape),
)

../Data/Clean/players.csv: 425,862 observations, 79 features


In [4]:
# Looking at the info and head of the data
# DataFrame.info() prints its report itself and returns None, so it is called
# bare; wrapping it in display() only adds a stray "None" to the cell output.
players.info()
display(players.head())

<class 'pandas.core.frame.DataFrame'>
Index: 425862 entries, 0 to 499999
Data columns (total 79 columns):
 #   Column                             Non-Null Count   Dtype  
---  ------                             --------------   -----  
 0   match_id                           425862 non-null  int64  
 1   match_outcome                      425862 non-null  int64  
 2   account                            303894 non-null  object 
 3   account_id                         425862 non-null  int64  
 4   hero_id                            425862 non-null  int64  
 5   player_slot                        425862 non-null  int64  
 6   match_slot_id                      425862 non-null  object 
 7   gold                               425862 non-null  int64  
 8   gold_spent                         425862 non-null  int64  
 9   gold_per_min                       425862 non-null  int64  
 10  xp_per_min                         425862 non-null  int64  
 11  kills                              425862 no

None

Unnamed: 0,match_id,match_outcome,account,account_id,hero_id,player_slot,match_slot_id,gold,gold_spent,gold_per_min,xp_per_min,kills,deaths,assists,denies,last_hits,stuns,hero_damage,hero_healing,tower_damage,item_0,item_1,item_2,item_3,item_4,item_5,level,leaver_status,xp_hero,xp_creep,xp_roshan,xp_other,gold_other,gold_death,gold_buyback,gold_abandon,gold_sell,gold_destroying_structure,gold_killing_heros,gold_killing_creeps,gold_killing_roshan,gold_killing_couriers,unit_order_none,unit_order_move_to_position,unit_order_move_to_target,unit_order_attack_move,unit_order_attack_target,unit_order_cast_position,unit_order_cast_target,unit_order_cast_target_tree,unit_order_cast_no_target,unit_order_cast_toggle,unit_order_hold_position,unit_order_train_ability,unit_order_drop_item,unit_order_give_item,unit_order_pickup_item,unit_order_pickup_rune,unit_order_purchase_item,unit_order_sell_item,unit_order_disassemble_item,unit_order_move_item,unit_order_cast_toggle_auto,unit_order_stop,unit_order_taunt,unit_order_buyback,unit_order_glyph,unit_order_eject_item_from_stash,unit_order_cast_rune,unit_order_ping_ability,unit_order_move_to_direction,unit_order_patrol,unit_order_vector_target_position,unit_order_radar,unit_order_set_item_combine_lock,unit_order_continue,messages_sent,time_played,cluster
0,0,1,Double T,0,86,0,0_0,3261,10960,347,362,9,3,18,1,30,76.7356,8690,218,143,180,37,73,56,108,0,16,0,8840,5440,0,83,50,-957,0,0,212,3120,5145,1087,400,0,0,4070,1,25,416,51,144,3,71,0,188,16,0,0,0,2,35,2,0,11,0,0,0,0,0,0,0,6,0,0,0,0,0,0,4,2375,155
1,0,1,Monkey,1,51,1,0_1,2954,17760,494,659,13,3,18,9,109,87.4164,23747,0,423,46,63,119,102,24,108,22,0,14331,8440,2683,671,395,-1137,0,0,1650,3299,6676,4317,937,0,0,5894,214,165,1031,98,39,4,439,0,346,22,0,0,12,52,30,4,0,21,0,0,0,0,0,0,0,14,0,0,0,0,0,0,16,2375,155
2,0,1,Trash!!!,0,83,2,0_2,110,12195,350,385,0,4,15,1,58,0.0,4217,1595,399,48,60,59,108,65,0,17,0,6692,8112,0,453,259,-1436,-1015,0,0,3142,2418,3697,400,0,0,7053,3,132,645,36,160,20,373,0,643,17,5,0,7,8,28,0,1,18,0,0,0,1,0,0,0,17,0,0,0,0,0,0,2,2375,155
3,0,1,,2,11,3,0_3,1179,22505,599,605,8,4,19,6,271,0.0,14832,2714,6055,63,147,154,164,79,160,21,0,8583,14230,894,293,100,-2156,0,0,938,4714,4104,10432,400,0,0,4712,133,163,690,9,15,7,406,0,150,21,0,0,1,9,45,7,0,14,0,0,0,0,1,0,0,13,0,0,0,0,0,0,0,2375,155
4,0,1,Kira,3,67,4,0_4,3307,23825,613,762,20,3,17,13,245,0.0,33740,243,1833,114,92,147,0,137,63,24,0,15814,14325,0,62,0,-1437,-1056,0,4194,3217,7467,9220,400,0,0,3853,7,7,1173,31,84,8,198,0,111,23,1,0,0,2,44,6,0,13,0,0,0,1,3,0,0,23,0,0,0,0,0,0,1,2375,155


In [9]:
# Rows whose account name is the literal string '0'
# NOTE(review): presumably a check for placeholder names - confirm intent
players.loc[players['account'].eq('0')]

Unnamed: 0,match_id,match_outcome,account,account_id,hero_id,player_slot,match_slot_id,gold,gold_spent,gold_per_min,xp_per_min,kills,deaths,assists,denies,last_hits,stuns,hero_damage,hero_healing,tower_damage,item_0,item_1,item_2,item_3,item_4,item_5,level,leaver_status,xp_hero,xp_creep,xp_roshan,xp_other,gold_other,gold_death,gold_buyback,gold_abandon,gold_sell,gold_destroying_structure,gold_killing_heros,gold_killing_creeps,gold_killing_roshan,gold_killing_couriers,unit_order_none,unit_order_move_to_position,unit_order_move_to_target,unit_order_attack_move,unit_order_attack_target,unit_order_cast_position,unit_order_cast_target,unit_order_cast_target_tree,unit_order_cast_no_target,unit_order_cast_toggle,unit_order_hold_position,unit_order_train_ability,unit_order_drop_item,unit_order_give_item,unit_order_pickup_item,unit_order_pickup_rune,unit_order_purchase_item,unit_order_sell_item,unit_order_disassemble_item,unit_order_move_item,unit_order_cast_toggle_auto,unit_order_stop,unit_order_taunt,unit_order_buyback,unit_order_glyph,unit_order_eject_item_from_stash,unit_order_cast_rune,unit_order_ping_ability,unit_order_move_to_direction,unit_order_patrol,unit_order_vector_target_position,unit_order_radar,unit_order_set_item_combine_lock,unit_order_continue,messages_sent,time_played,cluster
83679,8367,0,0,38677,73,132,8367_132,224,9985,331,244,0,3,2,1,81,6.73174,1850,385,293,178,79,0,152,63,43,11,0,548,6601,0,25,1234,-777,0,1278,625,400,254,3227,0,0,0,2944,64,39,379,50,7,4,46,0,217,11,0,0,0,1,35,3,0,5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,1762,171
101652,10165,1,0,45571,102,2,10165_2,4574,9540,418,416,7,6,13,3,40,0.0,5849,4831,1220,231,36,81,46,0,0,16,0,9042,5093,447,82,0,-1404,0,0,100,4197,5246,1553,200,0,0,5612,2,1,1237,10,106,6,21,0,394,15,0,0,2,29,37,2,0,3,0,0,0,0,0,0,0,2,0,0,0,0,0,0,1,2111,153
129805,12980,0,0,56186,106,128,12980_128,251,19295,484,666,7,7,11,10,260,0.0,13957,0,187,145,0,41,141,141,48,24,0,16297,15303,0,374,289,-3413,-1565,0,100,702,7849,9384,200,0,0,8815,302,25,758,307,2,5,310,0,41,24,1,0,10,11,22,1,0,4,0,0,0,1,1,0,0,3,0,0,0,0,0,0,5,2878,133
151164,15116,0,0,62963,69,4,15116_4,1900,10725,382,326,4,6,2,2,68,11.0862,6933,0,0,1,65,108,181,214,46,14,0,2549,8102,0,665,2468,-1404,0,0,133,940,2073,4302,0,0,0,4697,79,0,336,32,65,3,36,0,0,14,0,0,3,6,22,3,0,8,0,0,0,0,0,0,0,2,0,0,0,0,0,0,1,2079,111
229600,22960,1,0,0,70,0,22960_0,2040,13465,637,544,19,2,13,8,75,9.13218,21705,612,2214,50,1,208,181,81,182,15,0,5346,5372,1789,383,231,-238,0,0,0,3120,5662,3291,405,0,0,3191,132,81,639,16,1,5,335,0,0,15,0,0,3,10,21,0,0,10,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1419,204
285650,28565,1,0,32993,46,0,28565_0,5341,13835,757,739,10,2,2,14,185,0.0,13874,0,3973,63,41,147,55,212,168,18,0,4600,11856,1789,617,301,-838,0,0,50,4646,3488,7959,392,0,0,2843,72,33,904,29,1,3,261,0,257,17,2,2,5,12,23,2,0,8,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1531,112
322627,32262,0,0,0,105,130,32262_130,2642,7475,280,328,3,12,13,1,98,2.50854,11353,0,114,29,1,41,0,23,21,17,0,7271,8041,0,105,62,-3378,-1016,0,400,680,3979,3736,0,0,0,5190,96,30,179,195,11,4,90,0,0,16,1,0,0,3,26,1,0,6,0,0,0,1,2,0,0,0,0,0,0,0,0,0,3,2813,204
438286,43828,0,0,10210,28,129,43828_129,237,11325,295,403,5,12,12,11,149,70.6617,7871,0,6,8,116,1,36,63,0,21,0,8834,13631,447,761,484,-5718,-336,0,400,680,4067,6041,200,0,0,4939,138,1,1208,66,38,4,270,0,228,21,0,0,2,51,28,2,0,10,0,0,0,1,1,0,0,7,0,0,0,0,0,0,1,3516,151


## Statistical Analysis