# SETUP

In [1]:
import pandas as pd
import os
# Make the parent folder the working directory before the project imports
# below run; the relative "Data/raw_data/..." paths used when saving also
# resolve against it.
# NOTE(review): the path is relative, so re-running this cell without a
# kernel restart moves up one more directory each time.
os.chdir('../')

# NOTE(review): wildcard import — it is not visible here which names this
# brings into the notebook namespace; consider importing them explicitly.
from Utils.constants import *
import Utils.scraping_file as scraping_file
import Utils.utils_file as utils_file

# Raise pandas' display limits (rows, columns, line width) so wide/long
# frames are shown without truncation in cell outputs.
pd.options.display.max_rows = 500
pd.options.display.max_columns = 500
pd.options.display.width = 1000
# Turn off the chained-assignment check for this session.
pd.set_option('mode.chained_assignment', None)

# SCRAPING

### Initialize Class

In [2]:
# Single switch forwarded to both helper objects as their scraping-cache flag.
cache = True

# Utils is created first, then Scraping (same order as before); model caching
# stays disabled for Utils.
Utils = utils_file.Utils_Class(cache_scraping=cache, cache_model=False)
Scraping = scraping_file.Scraping_Class(cache=cache)

# With caching enabled, bind the tables held by Utils to notebook-level names
# so later cells can use them without rebuilding.
if cache:
    match_list, match_list_fill = Utils.match_list, Utils.match_list_fill
    player_data_table, team_data_table = Utils.player_data_table, Utils.team_data_table

### Update

In [3]:
# Number of entries in the notebook-level match table (bound from
# Utils.match_list when cache is enabled), shown before running the update.
len(match_list)

29860

In [4]:
# Run the scraper's update step. The return value is not captured, so the
# notebook-level tables (match_list, player_data_table, ...) are not rebound
# by this cell.
# NOTE(review): the saved output of this cell ends in KeyboardInterrupt, so
# the last recorded run did not complete — re-run before trusting the data.
Scraping.update()

Updating semester 1 of year 2023



player_data_table updated!

team_data_table updated!



KeyboardInterrupt: 

In [None]:
# Number of entries in the scraper's own match list after update(); compare
# with the len(match_list) value displayed before the update.
len(Scraping.match_list)

29860

### Player

In [3]:
# Build the player table and hand it straight to the player transformation
# step; only the transformed result is kept under `player_data_table`.
player_data_table = Scraping.transforming_player(
    Scraping.make_player_data_table()
)

### Matches

In [None]:
match_list = Scraping.make_matches_table()
team_data_table = Scraping.transforming_team(team_data_table)

### Teams

In [3]:
team_data_table = Scraping.make_team_data_table()
match_list = Scraping.transforming_match(match_list)

# FEATURE ENGINEERING

### Season data swap

In [3]:
# Pass the match table through Scraping.season_data_swap and rebind the
# result to the same name.
# NOTE(review): because the input name is overwritten, re-running this cell
# feeds already-swapped data back in — confirm the step is safe to repeat.
match_list = Scraping.season_data_swap(match_list)

### Fill null values

In [None]:
# Produce the filled variant of the match table via
# Scraping.fill_nan_values_player and keep it under its own name; the name
# `match_list` is not rebound here, and both are saved separately below.
# (presumably fills missing player values — verify in scraping_file)
match_list_fill = Scraping.fill_nan_values_player(match_list)

# SAVE FILES

In [6]:
# Write each table to its pickle file under Data/raw_data/ (paths are
# relative to the current working directory).
pd.to_pickle(player_data_table, "Data/raw_data/player_data_table.pkl")
pd.to_pickle(team_data_table, "Data/raw_data/team_data_table.pkl")

# Both the plain and the NaN-filled match tables are stored.
pd.to_pickle(match_list, "Data/raw_data/match_list.pkl")
pd.to_pickle(match_list_fill, "Data/raw_data/match_list_fill.pkl")

# Notes

In [181]:
# Summary statistics (count, mean, std, min, quartiles, max) for the numeric
# columns of the player table.
player_data_table.describe()

Unnamed: 0,Games,Win_rate,KDA,Avg_kills,Avg_deaths,Avg_assists,CSM,GPM,KP%,DMG%,DPM,VSPM,Avg_WPM,Avg_WCPM,Avg_VWPM,GD@15,CSD@15,XPD@15,FB_%,FB_Victim,Penta_Kills,Solo_Kills,Semester,Year
count,13123.0,13123.0,13108.0,13123.0,13123.0,13123.0,13123.0,13123.0,13123.0,13121.0,13123.0,12425.0,12812.0,12812.0,12812.0,13123.0,13123.0,13123.0,12490.0,12490.0,13123.0,13123.0,13123.0,13123.0
mean,22.125657,44.127799,3.27233,2.559918,2.888478,5.889263,6.22235,348.635449,64.000587,19.724198,381.805989,1.420299,0.615101,0.270174,0.245624,-79.775356,-1.18418,-49.290101,23.246773,10.249752,0.035967,3.675913,0.449288,2020.918007
std,13.838768,21.213997,1.584695,1.353688,0.914306,2.05796,2.846278,68.293654,9.306458,7.458566,155.568079,0.599563,0.418568,0.106207,0.129656,416.07575,8.561031,314.729115,15.003662,10.410995,0.20714,5.03138,0.497441,1.283588
min,1.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,2.7,0.0,0.22,0.0,0.0,0.0,-4452.0,-148.0,-3840.0,0.0,0.0,0.0,0.0,0.0,2019.0
25%,14.0,31.3,2.3,1.5,2.3,4.5,4.9,308.0,59.0,13.5,249.0,1.0,0.37,0.18,0.15,-260.0,-5.0,-199.0,13.8,3.6,0.0,0.0,0.0,2020.0
50%,20.0,46.7,3.1,2.6,2.8,5.6,7.4,363.0,65.3,21.6,401.0,1.2,0.44,0.26,0.21,-27.0,0.0,-10.0,22.2,8.7,0.0,2.0,0.0,2021.0
75%,30.0,58.8,4.0,3.5,3.4,7.0,8.4,400.0,70.0,25.8,502.0,1.63,0.6,0.34,0.33,142.0,3.0,126.0,31.8,14.3,0.0,5.0,1.0,2022.0
max,85.0,100.0,31.8,15.0,10.0,20.0,10.8,590.0,100.0,42.8,1372.0,4.29,2.64,0.95,1.2,2685.0,72.0,2692.0,100.0,100.0,4.0,56.0,1.0,2023.0


In [182]:
# Summary statistics (count, mean, std, min, quartiles, max) for the numeric
# columns of the team table.
team_data_table.describe()

Unnamed: 0,Games,K:D,GPM,GDM,Kills / game,Deaths / game,Towers killed,Towers lost,FB%,FT%,DRAPG,DRA%,HERPG,HER%,DRA@15,TD@15,GD@15,PPG,NASHPG,NASH%,CSM,DPM
count,2203.0,2203.0,2203.0,2203.0,2203.0,2203.0,2203.0,2203.0,2168.0,2157.0,2203.0,2203.0,2108.0,2106.0,2108.0,2108.0,2148.0,813.0,2203.0,2203.0,2203.0,2203.0
mean,26.459374,0.986668,1761.545166,-31.586473,13.205402,14.040899,5.70345,6.287653,49.116882,47.661799,2.208983,48.301952,0.860769,48.465195,0.871746,-0.075237,-209.574488,4.384563,0.648407,46.929006,31.502951,1951.907853
std,13.044344,0.311002,86.995162,159.753159,2.665958,2.922707,1.505508,1.455439,12.598821,15.985495,0.490554,10.841339,0.313345,13.952926,0.24017,0.5057,1271.392815,1.054903,0.223736,16.294452,1.387918,235.839342
min,2.0,0.08,1354.0,-842.0,1.5,4.3,0.0,1.5,2.2,2.2,0.0,0.0,0.0,0.0,0.0,-4.5,-11005.0,1.3,0.0,0.0,21.1,1023.0
25%,18.0,0.78,1706.0,-127.0,11.5,12.1,4.8,5.3,41.7,37.1,1.94,41.9,0.6375,39.5,0.71,-0.3,-886.25,3.68,0.5,36.6,30.7,1793.0
50%,23.0,0.96,1767.0,-18.0,13.3,13.7,5.9,6.2,50.0,48.0,2.26,48.9,0.9,50.0,0.88,0.0,-79.0,4.4,0.67,48.2,31.6,1938.0
75%,34.0,1.165,1820.0,77.0,15.0,15.7,6.8,7.3,57.1,58.6,2.53,55.4,1.09,57.3,1.03,0.2,565.25,5.0,0.8,58.3,32.4,2102.5
max,85.0,3.21,2099.0,452.0,23.4,28.7,9.8,11.0,100.0,100.0,4.33,94.4,2.0,100.0,2.0,1.8,4081.0,10.5,1.5,100.0,41.1,3089.0
