In [1]:
import requests, json
from pprint import pprint

In [2]:
# base url for all FPL API endpoints
base_url = 'https://fantasy.premierleague.com/api/'

# get data from bootstrap-static endpoint
r = requests.get(base_url+'bootstrap-static/').json()

# show the top level fields
pprint(r, indent=2, depth=1, compact=True)

{ 'element_stats': [...],
  'element_types': [...],
  'elements': [...],
  'events': [...],
  'game_settings': {...},
  'phases': [...],
  'teams': [...],
  'total_players': 10618510}


In [3]:
# get player data from 'elements' field
players = r['elements']

# show data for first player
pprint(players[0])

{'assists': 0,
 'bonus': 0,
 'bps': 0,
 'chance_of_playing_next_round': 0,
 'chance_of_playing_this_round': 0,
 'clean_sheets': 0,
 'clean_sheets_per_90': 0,
 'code': 232223,
 'corners_and_indirect_freekicks_order': None,
 'corners_and_indirect_freekicks_text': '',
 'cost_change_event': 0,
 'cost_change_event_fall': 0,
 'cost_change_start': -1,
 'cost_change_start_fall': 1,
 'creativity': '0.0',
 'creativity_rank': 638,
 'creativity_rank_type': 65,
 'direct_freekicks_order': None,
 'direct_freekicks_text': '',
 'dreamteam_count': 0,
 'element_type': 4,
 'ep_next': '0.0',
 'ep_this': '0.0',
 'event_points': 0,
 'expected_assists': '0.00',
 'expected_assists_per_90': 0,
 'expected_goal_involvements': '0.00',
 'expected_goal_involvements_per_90': 0,
 'expected_goals': '0.00',
 'expected_goals_conceded': '0.00',
 'expected_goals_conceded_per_90': 0,
 'expected_goals_per_90': 0,
 'first_name': 'Folarin',
 'form': '0.0',
 'form_rank': 533,
 'form_rank_type': 45,
 'goals_conceded': 0,
 'goals

In [4]:
import pandas as pd

# display all columns of a DataFrame when it is printed
pd.set_option('display.max_columns', None) 

In [5]:
# create players dataframe
players = pd.json_normalize(r['elements'])

# show some information about first five players
players[['id', 'web_name', 'team', 'element_type']].head()

Unnamed: 0,id,web_name,team,element_type
0,1,Balogun,1,4
1,2,Cédric,1,2
2,3,M.Elneny,1,3
3,4,Fábio Vieira,1,3
4,5,Gabriel,1,2


In [6]:
# create teams dataframe
teams = pd.json_normalize(r['teams'])

teams

Unnamed: 0,code,draw,form,id,loss,name,played,points,position,short_name,strength,team_division,unavailable,win,strength_overall_home,strength_overall_away,strength_attack_home,strength_attack_away,strength_defence_home,strength_defence_away,pulse_id
0,3,0,,1,0,Arsenal,0,0,0,ARS,4,,False,0,1220,1260,1270,1280,1170,1240,1
1,7,0,,2,0,Aston Villa,0,0,0,AVL,3,,False,0,1130,1235,1120,1220,1130,1250,2
2,91,0,,3,0,Bournemouth,0,0,0,BOU,3,,False,0,1095,1100,1070,1120,1130,1110,127
3,94,0,,4,0,Brentford,0,0,0,BRE,3,,False,0,1120,1155,1120,1130,1120,1180,130
4,36,0,,5,0,Brighton,0,0,0,BHA,3,,False,0,1130,1185,1100,1120,1160,1250,131
5,90,0,,6,0,Burnley,0,0,0,BUR,3,,False,0,1070,1080,1080,1060,1060,1060,43
6,8,0,,7,0,Chelsea,0,0,0,CHE,3,,False,0,1125,1170,1100,1180,1160,1180,4
7,31,0,,8,0,Crystal Palace,0,0,0,CRY,3,,False,0,1095,1100,1110,1150,1090,1085,6
8,11,0,,9,0,Everton,0,0,0,EVE,3,,False,0,1095,1100,1110,1140,1080,1110,7
9,54,0,,10,0,Fulham,0,0,0,FUL,3,,False,0,1095,1100,1050,1110,1060,1140,34


In [7]:
# get position information from 'element_types' field
positions = pd.json_normalize(r['element_types'])

positions.head()

Unnamed: 0,id,plural_name,plural_name_short,singular_name,singular_name_short,squad_select,squad_min_play,squad_max_play,ui_shirt_specific,sub_positions_locked,element_count
0,1,Goalkeepers,GKP,Goalkeeper,GKP,2,1,1,True,[12],91
1,2,Defenders,DEF,Defender,DEF,5,3,5,False,[],258
2,3,Midfielders,MID,Midfielder,MID,5,2,5,False,[],349
3,4,Forwards,FWD,Forward,FWD,3,1,3,False,[],102


In [18]:
# join players to teams
df = pd.merge(
    left=players,
    right=teams,
    left_on='team',
    right_on='id'
)

# show joined result
df[['first_name', 'second_name', 'name']].head()

Unnamed: 0,first_name,second_name,name
0,Folarin,Balogun,Arsenal
1,Cédric,Alves Soares,Arsenal
2,Mohamed,Elneny,Arsenal
3,Fábio,Ferreira Vieira,Arsenal
4,Gabriel,dos Santos Magalhães,Arsenal


In [20]:
# join player positions
df = df.merge(
    positions,
    left_on='element_type',
    right_on='id'
)

# rename columns
df = df.rename(
    columns={'name':'team_name', 'singular_name':'position_name'}
)

# show result
df[
    ['first_name', 'second_name', 'team_name', 'position_name']
].head()

Unnamed: 0,first_name,second_name,team_name,position_name
0,Folarin,Balogun,Arsenal,Forward
1,Gabriel,Fernando de Jesus,Arsenal,Forward
2,Eddie,Nketiah,Arsenal,Forward
3,Keinan,Davis,Aston Villa,Forward
4,Jhon,Durán,Aston Villa,Forward


In [22]:
squads_2324 = df[['first_name', 'second_name', 'team_name', 'position_name']]
squads_2324

Unnamed: 0,first_name,second_name,team_name,position_name
0,Folarin,Balogun,Arsenal,Forward
1,Gabriel,Fernando de Jesus,Arsenal,Forward
2,Eddie,Nketiah,Arsenal,Forward
3,Keinan,Davis,Aston Villa,Forward
4,Jhon,Durán,Aston Villa,Forward
...,...,...,...,...
795,Joseph,Anang,West Ham,Goalkeeper
796,Daniel,Bentley,Wolves,Goalkeeper
797,Tom,King,Wolves,Goalkeeper
798,José,Malheiro de Sá,Wolves,Goalkeeper


In [41]:
squads_2324[squads_2324['team_name'] == 'Spurs']

Unnamed: 0,first_name,second_name,team_name,position_name
88,Harry,Kane,Spurs,Forward
89,Dane,Scarlett,Spurs,Forward
90,Alejo,Véliz,Spurs,Forward
91,Jamie,Donley,Spurs,Forward
92,Timo,Werner,Spurs,Forward
320,Ben,Davies,Spurs,Defender
321,Eric,Dier,Spurs,Defender
322,Emerson,Leite de Souza Junior,Spurs,Defender
323,Pedro,Porro,Spurs,Defender
324,Ivan,Perišić,Spurs,Defender


In [42]:
# get data from 'element-summary/{PID}/' endpoint for PID=516 (Son)
r = requests.get(base_url + 'element-summary/516/').json()

# show top-level fields for player summary
pprint(r, depth=1)

{'fixtures': [...], 'history': [...], 'history_past': [...]}


In [43]:
# show data for first gameweek
pprint(r['history'][0])

{'assists': 0,
 'bonus': 0,
 'bps': 5,
 'clean_sheets': 0,
 'creativity': '6.8',
 'element': 516,
 'expected_assists': '0.05',
 'expected_goal_involvements': '0.13',
 'expected_goals': '0.08',
 'expected_goals_conceded': '1.72',
 'fixture': 8,
 'goals_conceded': 2,
 'goals_scored': 0,
 'ict_index': '3.7',
 'influence': '0.0',
 'kickoff_time': '2023-08-13T13:00:00Z',
 'minutes': 74,
 'opponent_team': 4,
 'own_goals': 0,
 'penalties_missed': 0,
 'penalties_saved': 0,
 'red_cards': 0,
 'round': 1,
 'saves': 0,
 'selected': 428040,
 'starts': 1,
 'team_a_score': 2,
 'team_h_score': 2,
 'threat': '31.0',
 'total_points': 2,
 'transfers_balance': 0,
 'transfers_in': 0,
 'transfers_out': 0,
 'value': 90,
 'was_home': False,
 'yellow_cards': 0}


In [44]:
def get_gameweek_history(player_id):
    '''get all gameweek info for a given player_id'''
    
    # send GET request to
    # https://fantasy.premierleague.com/api/element-summary/{PID}/
    r = requests.get(
            base_url + 'element-summary/' + str(player_id) + '/'
    ).json()
    
    # extract 'history' data from response into dataframe
    df = pd.json_normalize(r['history'])
    
    return df

In [46]:
# show player #516's gameweek history
get_gameweek_history(516)[
    [
        'round',
        'total_points',
        'minutes',
        'goals_scored',
        'assists'
    ]
]

Unnamed: 0,round,total_points,minutes,goals_scored,assists
0,1,2,74,0,0
1,2,3,90,0,0
2,3,3,90,0,0
3,4,20,71,3,0
4,5,2,79,0,0
5,6,14,78,2,0
6,7,7,68,1,0
7,8,3,75,0,0
8,9,14,81,1,1
9,10,10,90,1,0


In [47]:
def get_season_history(player_id):
    '''get all past season info for a given player_id'''
    
    # send GET request to
    # https://fantasy.premierleague.com/api/element-summary/{PID}/
    r = requests.get(
            base_url + 'element-summary/' + str(player_id) + '/'
    ).json()
    
    # extract 'history_past' data from response into dataframe
    df = pd.json_normalize(r['history_past'])
    
    return df

In [49]:
# show player #516's gameweek history
get_season_history(516)[
    [
        'season_name',
        'total_points',
        'minutes',
        'goals_scored',
        'assists'
    ]
]

Unnamed: 0,season_name,total_points,minutes,goals_scored,assists
0,2015/16,70,1107,4,1
1,2016/17,174,2063,14,9
2,2017/18,178,2292,12,8
3,2018/19,159,2033,12,8
4,2019/20,169,2478,11,13
5,2020/21,228,3119,17,11
6,2021/22,258,3009,23,10
7,2022/23,152,2886,10,6


In [50]:
# select columns of interest from players df
players = players[
    ['id', 'first_name', 'second_name', 'web_name', 'team',
     'element_type']
]

# join team name
players = players.merge(
    teams[['id', 'name']],
    left_on='team',
    right_on='id',
    suffixes=['_player', None]
).drop(['team', 'id'], axis=1)

# join player positions
players = players.merge(
    positions[['id', 'singular_name_short']],
    left_on='element_type',
    right_on='id'
).drop(['element_type', 'id'], axis=1)

players.head()

Unnamed: 0,id_player,first_name,second_name,web_name,name,singular_name_short
0,1,Folarin,Balogun,Balogun,Arsenal,FWD
1,8,Gabriel,Fernando de Jesus,G.Jesus,Arsenal,FWD
2,13,Eddie,Nketiah,Nketiah,Arsenal,FWD
3,39,Keinan,Davis,Davis,Aston Villa,FWD
4,44,Jhon,Durán,Duran,Aston Villa,FWD


In [52]:
from tqdm.auto import tqdm
tqdm.pandas()

In [53]:
# get gameweek histories for each player
points = players['id_player'].progress_apply(get_gameweek_history)

# combine results into single dataframe
points = pd.concat(df for df in points)

# join web_name
points = players[['id_player', 'web_name']].merge(
    points,
    left_on='id_player',
    right_on='element'
)

100%|█████████████████████████████████████████████████████████| 800/800 [01:34<00:00,  8.50it/s]


In [59]:
# get top scoring players
points.groupby(
    ['web_name']
).agg(
    {'total_points':'sum', 'goals_scored':'sum', 'assists':'sum'}
).reset_index(
).sort_values(
    'goals_scored', ascending=False
).head(10)

Unnamed: 0,web_name,total_points,goals_scored,assists
619,Salah,156,14,8
303,Haaland,113,14,5
656,Solanke,106,13,1
658,Son,136,12,5
106,Bowen,114,11,2
345,Isak,79,10,0
732,Watkins,128,10,11
316,Hee Chan,100,10,3
747,Wilson,108,9,5
553,Palmer,104,9,5
