# Bayesian Bivariate Model

In [1]:
import sys

# Append the directory two levels up to the module search path.
# NOTE(review): presumably this makes the in-repo penaltyblog checkout
# importable when running the notebook from its own folder -- confirm.
sys.path.append("../../")

import penaltyblog as pb

## Get data from football-data.co.uk

In [2]:
# Build a football-data.co.uk scraper for the 2019-2020 English Premier League
# season and fetch its fixtures.
fb = pb.scrapers.FootballData("ENG Premier League", "2019-2020")
df = fb.get_fixtures()

# Preview the first rows. The frame includes team_home/team_away and
# goals_home/goals_away, which the modelling cells read.
df.head()

Unnamed: 0_level_0,date,datetime,season,competition,div,time,team_home,team_away,fthg,ftag,...,b365_cahh,b365_caha,pcahh,pcaha,max_cahh,max_caha,avg_cahh,avg_caha,goals_home,goals_away
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
1565308800---liverpool---norwich,2019-08-09,2019-08-09 20:00:00,2019-2020,ENG Premier League,E0,20:00,Liverpool,Norwich,4,1,...,1.91,1.99,1.94,1.98,1.99,2.07,1.9,1.99,4,1
1565395200---bournemouth---sheffield_united,2019-08-10,2019-08-10 15:00:00,2019-2020,ENG Premier League,E0,15:00,Bournemouth,Sheffield United,1,1,...,1.95,1.95,1.98,1.95,2.0,1.96,1.96,1.92,1,1
1565395200---burnley---southampton,2019-08-10,2019-08-10 15:00:00,2019-2020,ENG Premier League,E0,15:00,Burnley,Southampton,3,0,...,1.87,2.03,1.89,2.03,1.9,2.07,1.86,2.02,3,0
1565395200---crystal_palace---everton,2019-08-10,2019-08-10 15:00:00,2019-2020,ENG Premier League,E0,15:00,Crystal Palace,Everton,0,0,...,1.82,2.08,1.97,1.96,2.03,2.08,1.96,1.93,0,0
1565395200---tottenham---aston_villa,2019-08-10,2019-08-10 17:30:00,2019-2020,ENG Premier League,E0,17:30,Tottenham,Aston Villa,3,1,...,2.1,1.7,2.18,1.77,2.21,1.87,2.08,1.8,3,1


## Train the Model

In [3]:
# Construct the model from per-match home goals, away goals, home team and
# away team, passed positionally in that order.
clf = pb.models.BayesianBivariateGoalModel(
    df["goals_home"], df["goals_away"], df["team_home"], df["team_away"]
)
# Fitting compiles and runs a Stan program through cmdstanpy (four chains appear
# in the log output), so this cell takes several seconds.
# NOTE(review): no random seed is set, so estimates may differ slightly between
# runs -- confirm whether fit() accepts a seed.
clf.fit()

20:18:39 - cmdstanpy - INFO - compiling stan file /private/var/folders/qg/1pn4sbxj7h91pv3skp6h118c0000gn/T/tmp8oe1yhvh.stan to exe file /private/var/folders/qg/1pn4sbxj7h91pv3skp6h118c0000gn/T/tmp8oe1yhvh
20:18:45 - cmdstanpy - INFO - compiled model executable: /private/var/folders/qg/1pn4sbxj7h91pv3skp6h118c0000gn/T/tmp8oe1yhvh
20:18:45 - cmdstanpy - INFO - CmdStan start processing


chain 1 |          | 00:00 Status

chain 2 |          | 00:00 Status

chain 3 |          | 00:00 Status

chain 4 |          | 00:00 Status

                                                                                                                                                                                                                                                                                                                                

20:18:51 - cmdstanpy - INFO - CmdStan done processing.





Module: Penaltyblog

Model: Bayesian Bivariate (Stan)

Number of parameters: 42
Team                 Attack               Defence             
------------------------------------------------------------
Arsenal              0.182                0.009               
Aston Villa          -0.108               -0.307              
Bournemouth          -0.133               -0.276              
Brighton             -0.168               -0.091              
Burnley              -0.077               -0.017              
Chelsea              0.397                -0.121              
Crystal Palace       -0.398               -0.006              
Everton              -0.048               -0.132              
Leicester            0.355                0.155               
Liverpool            0.585                0.351               
Man City             0.771                0.276               
Man United           0.335                0.282               
Newcastle            -0.193             

## The model's parameters

In [5]:
# Retrieve the fitted model's parameters.
clf.get_params()

Module: Penaltyblog

Model: Bayesian Bivariate (Stan)

Number of parameters: 42
Team                 Attack               Defence             
------------------------------------------------------------
Arsenal              0.182                0.009               
Aston Villa          -0.108               -0.307              
Bournemouth          -0.133               -0.276              
Brighton             -0.168               -0.091              
Burnley              -0.077               -0.017              
Chelsea              0.397                -0.121              
Crystal Palace       -0.398               -0.006              
Everton              -0.048               -0.132              
Leicester            0.355                0.155               
Liverpool            0.585                0.351               
Man City             0.771                0.276               
Man United           0.335                0.282               
Newcastle            -0.193             

## Predict Match Outcomes

In [6]:
# Predict a single fixture. NOTE(review): arguments are presumably
# (home team, away team), matching the constructor's home-then-away order
# -- confirm against the penaltyblog docs.
probs = clf.predict("Liverpool", "Wolves")
# Display the summary: goal expectations plus home win / draw / away win.
probs

Module: Penaltyblog

Class: FootballProbabilityGrid

Home Goal Expectation: 2.322132526685624
Away Goal Expectation: 0.9398271579967213

Home Win: 0.6763034208189161
Draw: 0.18094599408745884
Away Win: 0.1427505494019847

### 1x2 Probabilities

In [7]:
# Home win, draw and away win probabilities as a three-element list, in that order.
probs.home_draw_away

[np.float64(0.6763034208189161),
 np.float64(0.18094599408745884),
 np.float64(0.1427505494019847)]

In [8]:
# Probability of a home win (same value as the first entry of home_draw_away).
probs.home_win

np.float64(0.6763034208189161)

In [9]:
# Probability of a draw (same value as the second entry of home_draw_away).
probs.draw

np.float64(0.18094599408745884)

In [10]:
# Probability of an away win (same value as the third entry of home_draw_away).
probs.away_win

np.float64(0.1427505494019847)

### Probability of Total Goals >1.5

In [11]:
# Probability that the combined goals in the match are over the 1.5 line,
# i.e. two or more goals in total.
probs.total_goals("over", 1.5)

np.float64(0.8286012179144905)

### Probability of Asian Handicap 1.5

In [12]:
# Asian handicap probability for the home side on a 1.5 line.
# NOTE(review): the sign convention (home giving vs. receiving 1.5 goals) is
# not visible in this notebook -- confirm against the penaltyblog docs.
probs.asian_handicap("home", 1.5)

np.float64(0.4519055310691253)

### Probability of both teams scoring

In [13]:
# Probability that both sides score at least one goal.
probs.both_teams_to_score

np.float64(0.5379812980315706)

## Train the model with more recent matches weighted more heavily

In [14]:
# Derive per-match weights from the match dates.
# NOTE(review): 0.001 is presumably the decay rate controlling how quickly
# older matches are down-weighted -- confirm against the penaltyblog docs.
weights = pb.models.dixon_coles_weights(df["date"], 0.001)

# Same inputs as the unweighted model, with the weights passed as a fifth
# positional argument. This rebinds `clf`, so the unweighted model fitted
# earlier in the notebook is no longer reachable after this cell runs.
clf = pb.models.BayesianBivariateGoalModel(
    df["goals_home"], df["goals_away"], df["team_home"], df["team_away"], weights
)
# Recompiles and reruns the Stan program (see the log output).
clf.fit()

20:19:42 - cmdstanpy - INFO - compiling stan file /private/var/folders/qg/1pn4sbxj7h91pv3skp6h118c0000gn/T/tmpx5be9930.stan to exe file /private/var/folders/qg/1pn4sbxj7h91pv3skp6h118c0000gn/T/tmpx5be9930
20:19:47 - cmdstanpy - INFO - compiled model executable: /private/var/folders/qg/1pn4sbxj7h91pv3skp6h118c0000gn/T/tmpx5be9930
20:19:48 - cmdstanpy - INFO - CmdStan start processing


chain 1 |          | 00:00 Status

chain 2 |          | 00:00 Status

chain 3 |          | 00:00 Status

chain 4 |          | 00:00 Status

                                                                                                                                                                                                                                                                                                                                

20:19:53 - cmdstanpy - INFO - CmdStan done processing.





Module: Penaltyblog

Model: Bayesian Bivariate (Stan)

Number of parameters: 42
Team                 Attack               Defence             
------------------------------------------------------------
Arsenal              0.175                0.016               
Aston Villa          -0.148               -0.299              
Bournemouth          -0.14                -0.294              
Brighton             -0.197               -0.101              
Burnley              -0.099               -0.01               
Chelsea              0.385                -0.132              
Crystal Palace       -0.423               -0.038              
Everton              -0.074               -0.13               
Leicester            0.313                0.117               
Liverpool            0.564                0.31                
Man City             0.76                 0.299               
Man United           0.343                0.294               
Newcastle            -0.186             

In [15]:
# Display the weighted model's summary (per-team attack and defence estimates).
clf

Module: Penaltyblog

Model: Bayesian Bivariate (Stan)

Number of parameters: 42
Team                 Attack               Defence             
------------------------------------------------------------
Arsenal              0.175                0.016               
Aston Villa          -0.148               -0.299              
Bournemouth          -0.14                -0.294              
Brighton             -0.197               -0.101              
Burnley              -0.099               -0.01               
Chelsea              0.385                -0.132              
Crystal Palace       -0.423               -0.038              
Everton              -0.074               -0.13               
Leicester            0.313                0.117               
Liverpool            0.564                0.31                
Man City             0.76                 0.299               
Man United           0.343                0.294               
Newcastle            -0.186             