In [1]:
import logging
import sys

from kloppy import datasets, transform, to_pandas
from kloppy.utils import performance_logging


def main():
    """Load StatsBomb events with kloppy, transform them, and convert to pandas.

    Steps, in order:
      1. Configure logging so INFO-level records are written to stdout.
      2. Load the "statsbomb" dataset restricted to pass, take-on, carry and
         shot events.
      3. Transform the dataset to the FIXED_HOME_AWAY orientation and to pitch
         dimensions x in [-5500, 5500], y in [-3300, 3300]; the step is wrapped
         in ``performance_logging`` so its duration is logged.
      4. Convert the transformed dataset with ``to_pandas``, also wrapped in
         ``performance_logging``.

    Returns:
        The object produced by ``to_pandas`` for the transformed dataset.
    """
    log_format = "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
    logging.basicConfig(stream=sys.stdout, level=logging.INFO, format=log_format)
    log = logging.getLogger(__name__)

    # Only these event types are requested from the loader.
    wanted_event_types = ["pass", "take_on", "carry", "shot"]
    events = datasets.load("statsbomb", {"event_types": wanted_event_types})

    # Target coordinate ranges handed to the transform: (min, max) per axis.
    x_range, y_range = (-5500, 5500), (-3300, 3300)
    with performance_logging("transform", logger=log):
        events = transform(
            events,
            to_orientation="FIXED_HOME_AWAY",
            to_pitch_dimensions=[x_range, y_range],
        )

    with performance_logging("to pandas", logger=log):
        frame = to_pandas(events)

    return frame

In [2]:
# Run the load -> transform -> to_pandas pipeline once and keep the result
# under `df_sb` so the following cells can inspect it.
df_sb = main()

2020-11-10 17:03:11,462 - kloppy.infra.datasets.core.loading - INFO - Using local cached file C:\Users\ajenk/kloppy_datasets/statsbomb/event_data=15946.json
2020-11-10 17:03:11,463 - kloppy.infra.datasets.core.loading - INFO - Using local cached file C:\Users\ajenk/kloppy_datasets/statsbomb/lineup_data=15946.json
2020-11-10 17:03:11,571 - kloppy.infra.serializers.event.statsbomb.serializer - INFO - Determined Fidelity versions: shot v2 / XY v1
2020-11-10 17:03:11,572 - kloppy.infra.serializers.event.statsbomb.serializer - INFO - load data took: 92.03ms 



You are about to use StatsBomb public data.
By using this data, you are agreeing to the user agreement. 
The user agreement can be found here: https://github.com/statsbomb/open-data/blob/master/LICENSE.pdf

  "\n\nYou are about to use StatsBomb public data."


2020-11-10 17:03:11,650 - kloppy.infra.serializers.event.statsbomb.serializer - INFO - parse data took: 76.84ms 
2020-11-10 17:03:11,717 - __main__ - INFO - transform took: 62.40ms 
2020-11-10 17:03:12,445 - __main__ - INFO - to pandas took: 728.27ms 


In [3]:
# Preview the first rows of the converted events to check the columns.
df_sb.head()

Unnamed: 0,event_id,event_type,result,success,period_id,timestamp,end_timestamp,ball_state,ball_owning_team,team_id,player_id,coordinates_x,coordinates_y,end_coordinates_x,end_coordinates_y,receiver_player_id,set_piece_type
0,34208ade-2af4-45c3-970e-655937cad938,PASS,COMPLETE,True,1,0.098,2.007,alive,206,206,6581,60.5,40.5,35.5,25.5,6855.0,KICK_OFF
1,8e3dacc2-7a39-4301-9053-e78cfec1aa95,CARRY,COMPLETE,True,1,2.007,3.497,alive,206,206,6855,35.5,25.5,35.5,28.5,,
2,d1cccb73-c7ef-4b02-8267-ebd7f149904b,PASS,INCOMPLETE,False,1,3.497,,alive,206,206,6855,35.5,28.5,,,,
3,f1cc47d6-4b19-45a6-beb9-33d67fc83f4b,PASS,COMPLETE,True,1,6.785,8.431,alive,217,217,5203,34.5,7.5,34.5,20.5,5470.0,
4,f774571f-4b65-43a0-9bfc-6384948d1b82,PASS,COMPLETE,True,1,8.431,9.576,alive,217,217,5470,35.5,20.5,35.5,1.5,5477.0,


In [4]:
# (rows, columns) of the converted events frame.
df_sb.shape

(2167, 17)