# Introduction and Setup

This notebook explores the player hand stats data.

The data is loaded from the database and then explored to understand the data types, missing values, and distributions of the data.

The data is then cleaned and prepared for further analysis.

First we have to load environment variables with dotenv.

In [1]:
from dotenv import load_dotenv
load_dotenv()

True

Then we can import necessary libraries and modules, and set some pandas options.

In [2]:
import pandas as pd
import numpy as np
from src.data.loader import DataLoader
pd.set_option('display.max_columns', None)


# Data Loading

## Downloading the dataset using the DataLoader class

In [3]:
data_loader = DataLoader()
data = data_loader.load_player_hand_stats()

['hero_combo_hand_is_suited', 'hero_combo_hand_is_offsuit', 'hero_combo_hand_is_paired', 'hero_combo_hand_is_connector', 'hero_combo_hand_is_one_gapper', 'hero_combo_hand_is_two_gapper', 'hero_combo_hand_is_broadway', 'hero_combo_hand_is_face', 'hero_combo_hand_is_suited_connector', 'hero_combo_first_card_is_broadway', 'hero_combo_first_card_is_face', 'hero_combo_second_card_is_broadway', 'hero_combo_second_card_is_face', 'flop_is_rainbow', 'flop_has_flush_draw', 'flop_is_monotone', 'flop_is_triplet', 'flop_is_paired', 'flop_is_sequential', 'flop_has_straights', 'flop_has_straight_draw', 'flop_has_gutshot', 'flop_first_card_is_broadway', 'flop_first_card_is_face', 'flop_second_card_is_broadway', 'flop_second_card_is_face', 'flop_third_card_is_broadway', 'flop_third_card_is_face', 'turn_card_is_broadway', 'turn_card_is_face', 'river_card_is_broadway', 'river_card_is_face']
['flag_went_to_showdown', 'flag_is_hero', 'flag_won_hand', 'player_combo_hand_is_suited', 'player_combo_hand_is_off

## Preliminary observations

In [4]:
data.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 2216200 entries, 0 to 2216199
Columns: 397 entries, id to river_total_bet_amount_bb
dtypes: Int16(1), Int8(17), bool(148), category(77), datetime64[ns, UTC](1), float16(152), int64(1)
memory usage: 1.2 GB


In [5]:
data.head()

Unnamed: 0,id,hand_date,max_players,cnt_players,button_seat,tournament_id,ref_tournament_buy_in_total,ref_tournament_speed,ref_tournament_type,total_players_range,level_value,level_sb,level_bb,level_ante,hero_combo,hero_combo_hand,hero_combo_hand_is_suited,hero_combo_hand_is_offsuit,hero_combo_hand_is_paired,hero_combo_hand_is_connector,hero_combo_hand_is_one_gapper,hero_combo_hand_is_two_gapper,hero_combo_hand_is_broadway,hero_combo_hand_is_face,hero_combo_hand_is_suited_connector,hero_combo_hand_rank_difference,hero_combo_hand_first_rank,hero_combo_hand_second_rank,hero_combo_hand_shape,hero_combo_first_card,hero_combo_first_card_is_broadway,hero_combo_first_card_is_face,hero_combo_first_card_rank,hero_combo_first_card_suit,hero_combo_second_card,hero_combo_second_card_is_broadway,hero_combo_second_card_is_face,hero_combo_second_card_rank,hero_combo_second_card_suit,flop,flop_is_rainbow,flop_has_flush_draw,flop_is_monotone,flop_is_triplet,flop_is_paired,flop_is_sequential,flop_has_straights,flop_has_straight_draw,flop_has_gutshot,flop_min_distance,flop_max_distance,flop_first_card,flop_first_card_is_broadway,flop_first_card_is_face,flop_first_card_rank,flop_first_card_suit,flop_second_card,flop_second_card_is_broadway,flop_second_card_is_face,flop_second_card_rank,flop_second_card_suit,flop_third_card,flop_third_card_is_broadway,flop_third_card_is_face,flop_third_card_rank,flop_third_card_suit,turn_card,turn_card_is_broadway,turn_card_is_face,turn_card_rank,turn_card_suit,river_card,river_card_is_broadway,river_card_is_face,river_card_rank,river_card_suit,flag_went_to_showdown,flag_is_hero,flag_won_hand,starting_stack,bounty,amount_won,chips_difference,amount_expected_won,total_bet_amount,seat,player_combo,player_combo_hand,player_combo_hand_is_suited,player_combo_hand_is_offsuit,player_combo_hand_is_paired,player_combo_hand_is_connector,player_combo_hand_is_one_gapper,player_combo_hand_is_two_gapper,player_combo_hand_is_broadway,player_combo_hand_is_face,player_combo_hand_is_suited_connector,player_combo_hand_rank_difference,player_combo_hand_first_rank,player_combo_hand_second_rank,player_combo_hand_shape,player_combo_first_card,player_combo_first_card_is_broadway,player_combo_first_card_is_face,player_combo_first_card_rank,player_combo_first_card_suit,player_combo_second_card,player_combo_second_card_is_broadway,player_combo_second_card_is_face,player_combo_second_card_rank,player_combo_second_card_suit,player_position_name,player_position_is_early,player_position_is_middle,player_position_is_late,player_position_is_blind,fold_street,all_in_street,face_covering_bet_street,face_all_in_street,facing_covering_bet_move,facing_all_in_move,preflop_flag_vpip,preflop_flag_open_opportunity,preflop_flag_open,preflop_flag_first_raise,preflop_flag_fold,preflop_flag_limp,preflop_flag_cold_called,preflop_flag_raise,preflop_flag_raise_opportunity,preflop_flag_face_raise,preflop_flag_3bet_opportunity,preflop_flag_3bet,preflop_flag_face_3bet,preflop_flag_4bet_opportunity,preflop_flag_4bet,preflop_flag_face_4bet,preflop_flag_squeeze_opportunity,preflop_flag_squeeze,preflop_flag_face_squeeze,preflop_flag_steal_opportunity,preflop_flag_steal_attempt,preflop_flag_face_steal_attempt,preflop_flag_fold_to_steal_attempt,preflop_flag_blind_defense_opportunity,preflop_flag_blind_defense,preflop_flag_open_shove,preflop_flag_voluntary_all_in,preflop_count_player_raises,preflop_count_player_calls,preflop_count_faced_limps,preflop_amount_effective_stack,preflop_amount_to_call_facing_1bet,preflop_amount_to_call_facing_2bet,preflop_amount_to_call_facing_3bet,preflop_amount_to_call_facing_4bet,preflop_amount_first_raise_made,preflop_amount_second_raise_made,preflop_ratio_to_call_facing_1bet,preflop_ratio_to_call_facing_2bet,preflop_ratio_to_call_facing_3bet,preflop_ratio_to_call_facing_4bet,preflop_ratio_first_raise_made,preflop_ratio_second_raise_made,preflop_total_bet_amount,preflop_move_facing_2bet,preflop_move_facing_3bet,preflop_move_facing_4bet,preflop_move_facing_squeeze,preflop_move_facing_steal_attempt,preflop_actions_sequence,flop_flag_saw,flop_flag_first_to_talk,flop_flag_has_position,flop_flag_bet,flop_flag_open_opportunity,flop_flag_open,flop_flag_cbet_opportunity,flop_flag_cbet,flop_flag_face_cbet,flop_flag_donk_bet_opportunity,flop_flag_donk_bet,flop_flag_face_donk_bet,flop_flag_first_raise,flop_flag_fold,flop_flag_check,flop_flag_check_raise,flop_flag_face_raise,flop_flag_3bet_opportunity,flop_flag_3bet,flop_flag_face_3bet,flop_flag_4bet_opportunity,flop_flag_4bet,flop_flag_face_4bet,flop_count_player_raises,flop_count_player_calls,flop_amount_effective_stack,flop_amount_to_call_facing_1bet,flop_amount_to_call_facing_2bet,flop_amount_to_call_facing_3bet,flop_amount_to_call_facing_4bet,flop_amount_bet_made,flop_amount_first_raise_made,flop_amount_second_raise_made,flop_ratio_to_call_facing_1bet,flop_ratio_to_call_facing_2bet,flop_ratio_to_call_facing_3bet,flop_ratio_to_call_facing_4bet,flop_ratio_bet_made,flop_ratio_first_raise_made,flop_ratio_second_raise_made,flop_total_bet_amount,flop_move_facing_1bet,flop_move_facing_2bet,flop_move_facing_3bet,flop_move_facing_4bet,flop_move_facing_cbet,flop_move_facing_donk_bet,flop_actions_sequence,turn_flag_saw,turn_flag_first_to_talk,turn_flag_has_position,turn_flag_bet,turn_flag_open_opportunity,turn_flag_open,turn_flag_cbet_opportunity,turn_flag_cbet,turn_flag_face_cbet,turn_flag_donk_bet_opportunity,turn_flag_donk_bet,turn_flag_face_donk_bet,turn_flag_first_raise,turn_flag_fold,turn_flag_check,turn_flag_check_raise,turn_flag_face_raise,turn_flag_3bet_opportunity,turn_flag_3bet,turn_flag_face_3bet,turn_flag_4bet_opportunity,turn_flag_4bet,turn_flag_face_4bet,turn_count_player_raises,turn_count_player_calls,turn_amount_effective_stack,turn_amount_to_call_facing_1bet,turn_amount_to_call_facing_2bet,turn_amount_to_call_facing_3bet,turn_amount_to_call_facing_4bet,turn_amount_bet_made,turn_amount_first_raise_made,turn_amount_second_raise_made,turn_ratio_to_call_facing_1bet,turn_ratio_to_call_facing_2bet,turn_ratio_to_call_facing_3bet,turn_ratio_to_call_facing_4bet,turn_ratio_bet_made,turn_ratio_first_raise_made,turn_ratio_second_raise_made,turn_total_bet_amount,turn_move_facing_1bet,turn_move_facing_2bet,turn_move_facing_3bet,turn_move_facing_4bet,turn_move_facing_cbet,turn_move_facing_donk_bet,turn_actions_sequence,river_flag_saw,river_flag_first_to_talk,river_flag_has_position,river_flag_bet,river_flag_open_opportunity,river_flag_open,river_flag_cbet_opportunity,river_flag_cbet,river_flag_face_cbet,river_flag_donk_bet_opportunity,river_flag_donk_bet,river_flag_face_donk_bet,river_flag_first_raise,river_flag_fold,river_flag_check,river_flag_check_raise,river_flag_face_raise,river_flag_3bet_opportunity,river_flag_3bet,river_flag_face_3bet,river_flag_4bet_opportunity,river_flag_4bet,river_flag_face_4bet,river_count_player_raises,river_count_player_calls,river_amount_effective_stack,river_amount_to_call_facing_1bet,river_amount_to_call_facing_2bet,river_amount_to_call_facing_3bet,river_amount_to_call_facing_4bet,river_amount_bet_made,river_amount_first_raise_made,river_amount_second_raise_made,river_ratio_to_call_facing_1bet,river_ratio_to_call_facing_2bet,river_ratio_to_call_facing_3bet,river_ratio_to_call_facing_4bet,river_ratio_bet_made,river_ratio_first_raise_made,river_ratio_second_raise_made,river_total_bet_amount,river_move_facing_1bet,river_move_facing_2bet,river_move_facing_3bet,river_move_facing_4bet,river_move_facing_cbet,river_move_facing_donk_bet,river_actions_sequence,player_name,player_went_to_showdown_ratio,player_won_hand_ratio,player_confidence_ratio,player_vpip,player_pfr,player_preflop_open_ratio,player_pfr/vpip,player_preflop_3bet_ratio,player_preflop_4bet_ratio,player_attempt_to_steal_ratio,player_fold_to_steal_ratio,player_blind_defense_ratio,player_limp_ratio,player_preflop_all_in_ratio,player_open_shove_ratio,player_preflop_squeeze_ratio,player_went_to_flop_ratio,player_flop_first_to_talk_ratio,player_flop_has_position_ratio,player_flop_open_ratio,player_flop_cbet_ratio,player_flop_donk_bet_ratio,player_flop_3bet_ratio,player_flop_4bet_ratio,player_went_to_turn_ratio,player_turn_first_to_talk_ratio,player_turn_has_position_ratio,player_turn_open_ratio,player_turn_cbet_ratio,player_turn_donk_bet_ratio,player_turn_3bet_ratio,player_turn_4bet_ratio,player_went_to_river_ratio,player_river_first_to_talk_ratio,player_river_has_position_ratio,player_river_open_ratio,player_river_cbet_ratio,player_river_donk_bet_ratio,player_river_3bet_ratio,player_river_4bet_ratio,starting_stack_bb,amount_won_bb,chips_difference_bb,amount_expected_won_bb,total_bet_amount_bb,preflop_amount_effective_stack_bb,preflop_amount_to_call_facing_1bet_bb,preflop_amount_to_call_facing_2bet_bb,preflop_amount_to_call_facing_3bet_bb,preflop_amount_to_call_facing_4bet_bb,preflop_amount_first_raise_made_bb,preflop_amount_second_raise_made_bb,preflop_total_bet_amount_bb,flop_amount_effective_stack_bb,flop_amount_to_call_facing_1bet_bb,flop_amount_to_call_facing_2bet_bb,flop_amount_to_call_facing_3bet_bb,flop_amount_to_call_facing_4bet_bb,flop_amount_bet_made_bb,flop_amount_first_raise_made_bb,flop_amount_second_raise_made_bb,flop_total_bet_amount_bb,turn_amount_effective_stack_bb,turn_amount_to_call_facing_1bet_bb,turn_amount_to_call_facing_2bet_bb,turn_amount_to_call_facing_3bet_bb,turn_amount_to_call_facing_4bet_bb,turn_amount_bet_made_bb,turn_amount_first_raise_made_bb,turn_amount_second_raise_made_bb,turn_total_bet_amount_bb,river_amount_effective_stack_bb,river_amount_to_call_facing_1bet_bb,river_amount_to_call_facing_2bet_bb,river_amount_to_call_facing_3bet_bb,river_amount_to_call_facing_4bet_bb,river_amount_bet_made_bb,river_amount_first_raise_made_bb,river_amount_second_raise_made_bb,river_total_bet_amount_bb
0,68015,2018-06-05 13:16:58+00:00,6,6,6,236599248,5.0,REGULAR,KO,1001 - 2000,10,500.0,1000.0,120.0,JdTs,JTo,False,True,False,True,False,False,True,False,False,1,J,T,OFFSUIT,Jd,True,True,J,d,Ts,True,False,T,s,Tc8d3c,False,True,False,False,False,False,False,True,True,2,7,Tc,True,False,T,c,8d,False,False,8,d,3c,False,False,3,c,,False,False,,,,False,False,,,False,True,True,20512.0,0.0,7440.0,2600.0,0.0,4720.0,5,JdTs,JTo,False,True,False,True,False,False,True,False,False,1.0,J,T,OFFSUIT,Jd,True,True,J,d,Ts,True,False,T,s,CO,False,False,True,False,,,,,,,True,True,True,False,False,True,False,False,True,False,False,False,False,False,False,False,False,False,False,True,False,False,False,False,False,False,False,0,1,0,19392.0,1000.0,0.0,0.0,0.0,0.0,0.0,0.310547,0.0,0.0,0.0,0.0,0.0,1000.0,,,,,,C,True,False,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,15672.0,0.0,0.0,0.0,0.0,3720.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,3720.0,,,,,,,B,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,manggy94,0.112427,0.181274,0.998535,0.299316,0.222412,0.525879,0.674316,0.050262,0.014526,0.394287,0.654297,0.30127,0.048065,0.093567,0.053772,0.042847,0.200439,0.458008,0.505371,0.393066,0.645996,0.111511,0.028107,0.047821,0.117615,0.460938,0.61377,0.387451,0.577637,0.094604,0.032654,0.038452,0.073853,0.482178,0.752441,0.407471,0.538086,0.207275,0.010017,0.0,20.515625,7.441406,2.599609,0.0,4.71875,19.390625,1.0,0.0,0.0,0.0,0.0,0.0,1.0,15.671875,0.0,0.0,0.0,0.0,3.720703,0.0,0.0,3.720703,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,68016,2018-06-05 13:16:58+00:00,6,6,6,236599248,5.0,REGULAR,KO,1001 - 2000,10,500.0,1000.0,120.0,JdTs,JTo,False,True,False,True,False,False,True,False,False,1,J,T,OFFSUIT,Jd,True,True,J,d,Ts,True,False,T,s,Tc8d3c,False,True,False,False,False,False,False,True,True,2,7,Tc,True,False,T,c,8d,False,False,8,d,3c,False,False,3,c,,False,False,,,,False,False,,,False,False,False,50272.0,0.0,0.0,-120.0,0.0,0.0,6,,,False,False,False,False,False,False,False,False,False,,,,,,False,False,,,,False,False,,,BTN,False,False,True,False,PF,,,,,,False,False,False,False,True,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0,50144.0,1000.0,0.0,0.0,0.0,0.0,0.0,0.310547,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,F,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,omar melade,0.142822,0.19043,0.781738,0.333252,0.095215,0.63623,0.285645,0.0,0.0,0.5,1.0,0.199951,0.272705,0.047607,0.0,0.0,0.333252,0.285645,0.571289,0.399902,0.5,0.0,0.0,0.0,0.238037,0.199951,0.799805,0.0,0.0,0.0,0.0,0.0,0.142822,0.333252,0.666504,0.333252,1.0,0.0,0.0,0.0,50.28125,0.0,-0.119995,0.0,0.0,50.15625,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,68013,2018-06-05 13:16:58+00:00,6,6,6,236599248,5.0,REGULAR,KO,1001 - 2000,10,500.0,1000.0,120.0,JdTs,JTo,False,True,False,True,False,False,True,False,False,1,J,T,OFFSUIT,Jd,True,True,J,d,Ts,True,False,T,s,Tc8d3c,False,True,False,False,False,False,False,True,True,2,7,Tc,True,False,T,c,8d,False,False,8,d,3c,False,False,3,c,,False,False,,,,False,False,,,False,False,False,inf,0.0,0.0,-120.0,0.0,0.0,3,,,False,False,False,False,False,False,False,False,False,,,,,,False,False,,,,False,False,,,UTG,True,False,False,False,PF,,,,,,False,True,False,False,True,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0,inf,1000.0,0.0,0.0,0.0,0.0,0.0,0.450439,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,F,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,P.Echtebust,0.045441,0.136353,0.786621,0.136353,0.047607,0.5,0.333252,0.0,0.0,0.0,0.75,0.199951,0.0,0.0,0.0,0.0,0.136353,0.333252,0.666504,0.5,1.0,0.0,0.0,0.0,0.090881,0.5,0.5,0.0,0.0,0.0,0.0,0.0,0.090881,0.5,0.5,1.0,0.0,0.0,0.0,0.0,inf,0.0,-0.119995,0.0,0.0,inf,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,68012,2018-06-05 13:16:58+00:00,6,6,6,236599248,5.0,REGULAR,KO,1001 - 2000,10,500.0,1000.0,120.0,JdTs,JTo,False,True,False,True,False,False,True,False,False,1,J,T,OFFSUIT,Jd,True,True,J,d,Ts,True,False,T,s,Tc8d3c,False,True,False,False,False,False,False,True,True,2,7,Tc,True,False,T,c,8d,False,False,8,d,3c,False,False,3,c,,False,False,,,,False,False,,,False,False,False,inf,0.0,0.0,-1120.0,0.0,0.0,2,,,False,False,False,False,False,False,False,False,False,,,,,,False,False,,,,False,False,,,BB,False,False,False,True,F,,,,,,False,False,False,False,False,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0,19392.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,X,True,True,False,False,True,False,False,False,True,False,False,False,False,True,True,False,False,False,False,False,False,False,False,0,0,19392.0,3720.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,F,,,,F,,XF,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,touchdown,0.142822,0.285645,0.781738,0.380859,0.285645,0.799805,0.75,0.0,0.0,0.399902,0.5,0.399902,0.0,0.0,0.0,0.0,0.238037,0.600098,0.199951,0.399902,1.0,0.0,0.0,0.0,0.142822,0.666504,0.333252,0.333252,0.5,0.0,0.0,0.0,0.142822,0.666504,0.333252,0.333252,1.0,0.0,0.0,0.0,inf,0.0,-1.120117,0.0,0.0,19.390625,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.390625,3.720703,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,68014,2018-06-05 13:16:58+00:00,6,6,6,236599248,5.0,REGULAR,KO,1001 - 2000,10,500.0,1000.0,120.0,JdTs,JTo,False,True,False,True,False,False,True,False,False,1,J,T,OFFSUIT,Jd,True,True,J,d,Ts,True,False,T,s,Tc8d3c,False,True,False,False,False,False,False,True,True,2,7,Tc,True,False,T,c,8d,False,False,8,d,3c,False,False,3,c,,False,False,,,,False,False,,,False,False,False,42304.0,0.0,0.0,-120.0,0.0,0.0,4,,,False,False,False,False,False,False,False,False,False,,,,,,False,False,,,,False,False,,,HJ,False,True,False,False,PF,,,,,,False,True,False,False,True,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0,42176.0,1000.0,0.0,0.0,0.0,0.0,0.0,0.450439,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,F,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,vikrammm,0.095215,0.142822,0.781738,0.19043,0.199951,0.375,1.0,0.0,0.0,0.5,1.0,0.0,0.0,0.0,0.0,0.0,0.19043,0.75,0.25,0.5,0.5,0.0,0.0,0.0,0.142822,0.666504,0.666504,0.666504,1.0,0.0,0.0,0.0,0.095215,0.5,1.0,0.0,0.0,0.0,0.0,0.0,42.3125,0.0,-0.119995,0.0,0.0,42.1875,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [6]:
data.player_combo_hand_is_suited.value_counts()

False    2062068
True      154132
Name: player_combo_hand_is_suited, dtype: int64

In [7]:
data.dtypes.value_counts()

float16                152
bool                   148
Int8                    17
category                13
category                13
category                 9
category                 5
category                 5
category                 3
category                 2
category                 2
category                 2
category                 2
category                 2
category                 2
category                 2
category                 1
category                 1
category                 1
category                 1
category                 1
int64                    1
category                 1
category                 1
category                 1
category                 1
category                 1
datetime64[ns, UTC]      1
Int16                    1
category                 1
category                 1
category                 1
category                 1
category                 1
dtype: int64

In [8]:
print(f"This dataset has {data.shape[0]} rows and {data.shape[1]} columns.\n"
      f"It gathers information about the player's hand stats.\n"
      f"It has both numerical and categorical data types.\n"
      f"It also has a datetime column that enables time series analysis.")


This dataset has 2216200 rows and 397 columns.
It gathers information about the player's hand stats.
It has both numerical and categorical data types.
It also has a datetime column that enables time series analysis.


## Observation of subgroups by data type (categorical, numerical)

In [10]:
numerical_data = data.select_dtypes(include=[np.number])
numerical_data.describe()

