## Baseball Prediction: 3a - Getting Odds Data

This notebook merges odds data with our game data from the previous notebooks. I recieved the odds data from Scottfree Analytics. This data will be hidden from the repo to protect the rights of the paid-for data.

In [2]:
import numpy as np
import pandas as pd
pd.set_option('display.max_columns',1000)
pd.set_option('display.max_rows',1000)

In [6]:
# Load in odds data
odds_df = pd.read_csv('./hidden_data/mlb_betting_odds.csv')
odds_df.head()

Unnamed: 0,season,date,away_team,away_score,away_point_spread,away_point_spread_line,away_money_line,home_team,home_score,home_point_spread,home_point_spread_line,home_money_line,over_under,over_line,under_line
0,2014,3/22/2014,los_angeles_dodgers,3,-1.5,-103,-170,arizona_diamondbacks,1,1.5,-115,150,6.5,-110,-110
1,2014,3/22/2014,los_angeles_dodgers,7,-1.5,132,-119,arizona_diamondbacks,5,1.5,-152,109,7.5,-110,-110
2,2014,3/30/2014,los_angeles_dodgers,1,-1.5,141,-115,san_diego_padres,3,1.5,-162,105,6.5,-110,-110
3,2014,3/31/2014,chicago_cubs,0,1.5,-128,170,pittsburgh_pirates,1,-1.5,100,-190,6.5,-110,-110
4,2014,3/31/2014,washington_nationals,9,-1.5,-118,-179,new_york_mets,7,1.5,-100,159,6.5,-110,-110


In [7]:
odds_df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 22920 entries, 0 to 22919
Data columns (total 15 columns):
 #   Column                  Non-Null Count  Dtype  
---  ------                  --------------  -----  
 0   season                  22920 non-null  int64  
 1   date                    22920 non-null  object 
 2   away_team               22920 non-null  object 
 3   away_score              22920 non-null  int64  
 4   away_point_spread       22920 non-null  float64
 5   away_point_spread_line  22920 non-null  int64  
 6   away_money_line         22920 non-null  int64  
 7   home_team               22920 non-null  object 
 8   home_score              22920 non-null  int64  
 9   home_point_spread       22920 non-null  float64
 10  home_point_spread_line  22920 non-null  int64  
 11  home_money_line         22920 non-null  int64  
 12  over_under              22920 non-null  float64
 13  over_line               22920 non-null  int64  
 14  under_line              22920 non-null

In [9]:
# Change datetime format
odds_df['date_numeric'] = pd.to_datetime(odds_df.date).astype(str).str.replace('-','')
odds_df.head()

Unnamed: 0,season,date,away_team,away_score,away_point_spread,away_point_spread_line,away_money_line,home_team,home_score,home_point_spread,home_point_spread_line,home_money_line,over_under,over_line,under_line,date_numeric
0,2014,3/22/2014,los_angeles_dodgers,3,-1.5,-103,-170,arizona_diamondbacks,1,1.5,-115,150,6.5,-110,-110,20140322
1,2014,3/22/2014,los_angeles_dodgers,7,-1.5,132,-119,arizona_diamondbacks,5,1.5,-152,109,7.5,-110,-110,20140322
2,2014,3/30/2014,los_angeles_dodgers,1,-1.5,141,-115,san_diego_padres,3,1.5,-162,105,6.5,-110,-110,20140330
3,2014,3/31/2014,chicago_cubs,0,1.5,-128,170,pittsburgh_pirates,1,-1.5,100,-190,6.5,-110,-110,20140331
4,2014,3/31/2014,washington_nationals,9,-1.5,-118,-179,new_york_mets,7,1.5,-100,159,6.5,-110,-110,20140331


In [11]:
odds_df.away_team.unique()

array(['los_angeles_dodgers', 'chicago_cubs', 'washington_nationals',
       'atlanta_braves', 'st._louis_cardinals', 'colorado_rockies',
       'san_francisco_giants', 'kansas_city_royals', 'boston_red_sox',
       'toronto_blue_jays', 'minnesota_twins', 'cleveland_indians',
       'seattle_mariners', 'philadelphia_phillies', 'new_york_yankees',
       'arizona_diamondbacks', 'cincinnati_reds', 'san_diego_padres',
       'baltimore_orioles', 'chicago_white_sox', 'texas_rangers',
       'los_angeles_angels', 'milwaukee_brewers', 'oakland_athletics',
       'tampa_bay_rays', 'miami_marlins', 'new_york_mets',
       'pittsburgh_pirates', 'houston_astros', 'detroit_tigers',
       'cleveland_guardians', 'american_league', 'national_league'],
      dtype=object)

In [12]:
# manually remap team names with abbreviations for future joining
team_name_dict = {}
team_name_dict["philadelphia_phillies"]='PHI'
team_name_dict["san_diego_padres"]='SDN'
team_name_dict["san_francisco_giants"]='SFN'
team_name_dict["los_angeles_angels"]='ANA'
team_name_dict["detroit_tigers"]='DET'
team_name_dict["cincinnati_reds"]='CIN'
team_name_dict["new_york_yankees"]='NYA'
team_name_dict["texas_rangers"]='TEX'
team_name_dict["tampa_bay_rays"]='TBA'
team_name_dict["colorado_rockies"]='COL'
team_name_dict["minnesota_twins"]='MIN'
team_name_dict["kansas_city_royals"]='KCA'
team_name_dict["arizona_diamondbacks"]='ARI'
team_name_dict["baltimore_orioles"]='BAL'
team_name_dict["atlanta_braves"]='ATL'
team_name_dict["toronto_blue_jays"]='TOR'
team_name_dict["seattle_mariners"]='SEA'
team_name_dict["milwaukee_brewers"]='MIL'
team_name_dict["pittsburgh_pirates"]='PIT'
team_name_dict["new_york_mets"]='NYN'
team_name_dict["los_angeles_dodgers"]='LAN'
team_name_dict["oakland_athletics"]='OAK'
team_name_dict["washington_nationals"]='WAS'
team_name_dict["chicago_white_sox"]='CHA'
team_name_dict["st._louis_cardinals"]='SLN' 
team_name_dict["chicago_cubs"]='CHN'
team_name_dict["boston_red_sox"]='BOS'
team_name_dict["miami_marlins"]='MIA'
team_name_dict["houston_astros"]='HOU'
team_name_dict["cleveland_indians"]='CLE'
team_name_dict["cleveland_guardians"]='CLE'

In [17]:
# Create new columns mapping names with shorthand name
away_team_short = []
home_team_short = []

i = 0
for home_long, away_long in zip(odds_df['home_team'], odds_df['away_team']):
    if i%1000==0:
        print(i)
    try:
        home_short = team_name_dict[home_long]
        home_team_short.append(home_short)
    except KeyError:
        home_team_short.append(None)
    try:
        away_short = team_name_dict[away_long]
        away_team_short.append(away_short)
    except KeyError:
        away_team_short.append(None)
    i+=1 
    # break

odds_df['home_team_short'] = home_team_short
odds_df['away_team_short'] = away_team_short
odds_df.head()

0
1000
2000
3000
4000
5000
6000
7000
8000
9000
10000
11000
12000
13000
14000
15000
16000
17000
18000
19000
20000
21000
22000


Unnamed: 0,season,date,away_team,away_score,away_point_spread,away_point_spread_line,away_money_line,home_team,home_score,home_point_spread,home_point_spread_line,home_money_line,over_under,over_line,under_line,date_numeric,home_team_short,away_team_short
0,2014,3/22/2014,los_angeles_dodgers,3,-1.5,-103,-170,arizona_diamondbacks,1,1.5,-115,150,6.5,-110,-110,20140322,ARI,LAN
1,2014,3/22/2014,los_angeles_dodgers,7,-1.5,132,-119,arizona_diamondbacks,5,1.5,-152,109,7.5,-110,-110,20140322,ARI,LAN
2,2014,3/30/2014,los_angeles_dodgers,1,-1.5,141,-115,san_diego_padres,3,1.5,-162,105,6.5,-110,-110,20140330,SDN,LAN
3,2014,3/31/2014,chicago_cubs,0,1.5,-128,170,pittsburgh_pirates,1,-1.5,100,-190,6.5,-110,-110,20140331,PIT,CHN
4,2014,3/31/2014,washington_nationals,9,-1.5,-118,-179,new_york_mets,7,1.5,-100,159,6.5,-110,-110,20140331,NYN,WAS


In [25]:
# Load in game level data
game_df = pd.read_csv('output_data/input_model_data_01.csv')
game_df['date'] = game_df['date'].astype(str)
game_df.head(-5)

  exec(code_obj, self.user_global_ns, self.user_ns)


Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OPS_162_h,OPS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SO_perc_162_h,SO_perc_162_v,BB_perc_162_h,BB_perc_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OPS_30_h,OPS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SO_perc_30_h,SO_perc_30_v,BB_perc_30_h,BB_perc_30_v
0,20000329,0,Wed,CHN,NL,1,NYN,NL,1,5,3,54,N,,,,TOK01,55000.0,206,100010210,001000020,33,12,1,0,2,5,1,0,1,10,0,5,1,0,4,0,13,3,3,3,0,0,27,10,2,0,1,0,33,7,1,0,1,3,1,1,0,3,0,4,0,0,1,0,8,5,5,5,1,0,27,12,0,0,4,0,marsr901,Randy Marsh,herna901,Angel Hernandez,fostm901,Marty Foster,kulpr901,Ron Kulpa,,(none),,(none),bayld001,Don Baylor,valeb102,Bobby Valentine,liebj001,Jon Lieber,hampm001,Mike Hampton,aguir001,Rick Aguilera,andrs001,Shane Andrews,liebj001,Jon Lieber,hampm001,Mike Hampton,youne001,Eric Young,4,bufod001,Damon Buford,8,gracm001,Mark Grace,3,sosas001,Sammy Sosa,9,rodrh001,Henry Rodriguez,7,andrs001,Shane Andrews,5,nievj002,Jose Nieves,6,giraj001,Joe Girardi,2,liebj001,Jon Lieber,1,hendr001,Rickey Henderson,7,hamid001,Darryl Hamilton,8,alfoe001,Edgardo Alfonzo,4,piazm001,Mike Piazza,2,ventr001,Robin Ventura,5,belld001,Derek Bell,9,zeilt001,Todd Zeile,3,ordor001,Rey Ordonez,6,hampm001,Mike Hampton,1,,Y,2000,-2,0,8,200003290,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,20000330,0,Thu,NYN,NL,2,CHN,NL,2,5,1,66,N,,,,TOK01,55000.0,235,00001000004,00001000000,37,6,2,0,1,5,1,1,1,8,0,5,1,0,0,0,10,5,0,0,0,0,33,14,2,0,2,0,36,5,0,0,0,0,2,0,0,6,1,9,0,0,2,0,10,7,5,5,0,0,33,14,0,0,0,0,herna901,Angel Hernandez,fostm901,Marty Foster,kulpr901,Ron Kulpa,marsr901,Randy Marsh,,(none),,(none),valeb102,Bobby Valentine,bayld001,Don Baylor,cookd001,Dennis Cook,yound002,Danny Young,,(none),agbab001,Benny Agbayani,reedr002,Rick Reed,farnk001,Kyle Farnsworth,hendr001,Rickey Henderson,7,hamid001,Darryl Hamilton,8,alfoe001,Edgardo Alfonzo,4,piazm001,Mike Piazza,2,ventr001,Robin Ventura,5,belld001,Derek Bell,9,zeilt001,Todd Zeile,3,ordor001,Rey Ordonez,6,reedr002,Rick Reed,1,youne001,Eric Young,4,bufod001,Damon Buford,8,sosas001,Sammy Sosa,9,gracm001,Mark Grace,3,rodrh001,Henry Rodriguez,7,andrs001,Shane Andrews,5,husoj001,Jeff Huson,6,giraj001,Joe Girardi,2,farnk001,Kyle Farnsworth,1,,Y,2000,-4,0,6,200003300,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,20000403,0,Mon,COL,NL,1,ATL,NL,1,0,2,51,D,,,,ATL02,42255.0,134,000000000,00000020x,31,6,2,0,0,0,1,0,0,2,2,7,0,0,1,0,7,3,2,2,1,0,24,10,0,0,1,0,30,7,0,0,2,2,0,0,1,1,0,6,1,0,1,0,6,2,0,0,0,0,27,12,0,0,1,0,hirsj901,John Hirschbeck,willc901,Charlie Williams,wegnm901,Mark Wegner,reynj901,Jim Reynolds,,(none),,(none),bellb001,Buddy Bell,cox-b103,Bobby Cox,maddg002,Greg Maddux,astap001,Pedro Astacio,remlm001,Mike Remlinger,galaa001,Andres Galarraga,astap001,Pedro Astacio,maddg002,Greg Maddux,goodt001,Tom Goodwin,8,lansm001,Mike Lansing,4,walkl001,Larry Walker,9,cirij001,Jeff Cirillo,5,heltt001,Todd Helton,3,hammj001,Jeffrey Hammonds,7,peren001,Neifi Perez,6,maynb001,Brent Mayne,2,astap001,Pedro Astacio,1,veraq001,Quilvio Veras,4,sandr002,Reggie Sanders,7,jonec004,Chipper Jones,5,jordb001,Brian Jordan,9,galaa001,Andres Galarraga,3,jonea002,Andruw Jones,8,peree002,Eddie Perez,2,weisw001,Walt Weiss,6,maddg002,Greg Maddux,1,,Y,2000,2,1,2,200004030,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,20000403,0,Mon,MIL,NL,1,CIN,NL,1,3,3,31,D,,,,CIN08,55596.0,111,002100,21000x,22,7,1,0,0,2,0,0,0,5,0,1,1,0,0,0,8,1,3,3,0,0,15,5,0,0,0,0,19,5,1,0,1,3,0,0,0,1,0,4,0,0,0,0,2,2,2,2,0,0,16,8,2,0,0,0,marsr901,Randy Marsh,herna901,Angel Hernandez,fostm901,Marty Foster,kulpr901,Ron Kulpa,,(none),,(none),loped001,Davey Lopes,mckej801,Jack McKeon,,,,,,(none),,(none),woods001,Steve Woodard,harnp001,Pete Harnisch,grism001,Marquis Grissom,8,lorem001,Mark Loretta,6,burnj001,Jeromy Burnitz,9,jenkg001,Geoff Jenkins,7,hernj001,Jose Hernandez,5,barkk001,Kevin Barker,3,bellr002,Ronnie Belliard,4,blanh001,Henry Blanco,2,woods001,Steve Woodard,1,reesp001,Pokey Reese,4,larkb001,Barry Larkin,6,grifk002,Ken Griffey,8,bichd001,Dante Bichette,9,yound001,Dmitri Young,3,taube001,Ed Taubensee,2,boona001,Aaron Boone,5,tuckm001,Michael Tucker,7,harnp001,Pete Harnisch,1,,Y,2000,0,0,6,200004030,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,20000403,0,Mon,SFN,NL,1,FLO,NL,1,4,6,51,N,,,,MIA01,35101.0,166,002100001,20002101x,35,10,2,2,1,4,0,0,0,1,0,8,0,0,2,0,5,2,4,4,0,0,24,7,2,0,1,0,36,12,3,0,0,5,0,0,1,1,0,7,1,0,1,0,8,3,4,4,0,0,27,15,0,0,2,0,demud901,Dana DeMuth,relic901,Charlie Reliford,eddid901,Doug Eddings,carlm901,Mark Carlson,,(none),,(none),baked002,Dusty Baker,bolej801,John Boles,ferna001,Alex Fernandez,hernl003,Livan Hernandez,alfoa001,Antonio Alfonseca,,(none),hernl003,Livan Hernandez,ferna001,Alex Fernandez,benam001,Marvin Benard,8,muelb001,Bill Mueller,5,bondb001,Barry Bonds,7,kentj001,Jeff Kent,4,snowj001,J.T. Snow,3,burke001,Ellis Burks,9,aurir001,Rich Aurilia,6,estab001,Bobby Estalella,2,hernl003,Livan Hernandez,1,castl001,Luis Castillo,4,gonza002,Alex Gonzalez,6,floyc001,Cliff Floyd,7,wilsp002,Preston Wilson,8,lowem001,Mike Lowell,5,millk005,Kevin Millar,3,browb003,Brant Brown,9,redmm001,Mike Redmond,2,ferna001,Alex Fernandez,1,,Y,2000,2,1,10,200004030,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
56765,20231001,0,Sun,MIA,NL,162,PIT,NL,162,0,3,51,D,,,,PIT08,22954.0,137,000000000,00000003x,29,3,0,0,0,0,0,0,0,1,0,11,0,1,1,0,3,3,3,3,0,0,24,9,1,0,0,0,29,6,4,1,0,3,0,0,0,5,0,9,0,2,0,0,7,5,0,0,1,0,27,9,1,0,1,0,lentn901,Nic Lentz,rehaj901,Jeremie Rehak,ramoc901,Charlie Ramos,fairc901,Chad Fairchild,,(none),,(none),mattd001,Don Mattingly,sheld801,Derek Shelton,mored002,Dauri Moreta,hoeib001,Bryan Hoeing,bednd001,David Bednar,andum001,Miguel Andujar,weatr001,Ryan Weathers,jacka003,Andre Jackson,edwax001,Xavier Edwards,4,delab001,Bryan De La Cruz,7,sancj003,Jesus Sanchez,9,gurry001,Yulieski Gurriel,3,hampg001,Garrett Hampson,8,wendj002,Joey Wendle,6,stalj001,Jacob Stallings,10,fortn001,Nick Fortes,2,bertj001,Jon Berti,5,joe-c001,Connor Joe,3,trioj001,Jared Triolo,5,andum001,Miguel Andujar,9,suwij001,Jack Suwinski,7,davih001,Henry Davis,10,pegul001,Liover Peguero,6,gonzn001,Nick Gonzales,4,bae-j001,Ji Hwan Bae,8,delaj004,Jason Delay,2,,Y,2023,3,1,3,202310010,0.239734,0.260403,0.310518,0.314584,0.392157,0.407959,0.702675,0.722543,117.0,87.0,39.0,20.0,92.0,97.0,0.270070,0.232782,0.102664,0.079048,0.259615,0.265885,0.317981,0.325853,0.419231,0.434995,0.737211,0.760848,21.0,20.0,5.0,1.0,14.0,21.0,0.275962,0.232649,0.085577,0.088954
56766,20231001,0,Sun,LAN,NL,162,SFN,NL,162,5,2,54,D,,,,SFO03,38359.0,164,000005000,000001010,34,7,0,0,1,5,0,0,3,3,0,8,1,0,0,0,8,4,2,2,1,0,27,10,1,0,0,0,31,3,0,0,2,2,0,0,1,2,0,9,0,0,0,0,5,4,5,5,1,0,27,3,0,0,0,0,barrl901,Lance Barrett,arrid901,David Arrieta,segac901,Chris Segal,cejan901,Nestor Ceja,,(none),,(none),robed001,Dave Roberts,kaplg001,Gabe Kapler,gonzv001,Victor Gonzalez,brebj001,John Brebbia,phile001,Evan Phillips,rosaa003,Amed Rosario,millb005,Bobby Miller,harrk001,Kyle Harrison,bettm001,Mookie Betts,9,freef001,Freddie Freeman,3,smitw003,Will Smith,2,martj006,J.D. Martinez,10,muncm001,Max Muncy,5,taylc001,Chris Taylor,7,rosaa003,Amed Rosario,4,outmj002,James Outman,8,herne001,Enrique Hernandez,6,crawb001,Brandon Crawford,6,wadel001,LaMonte Wade,3,estrt001,Thairo Estrada,4,confm001,Michael Conforto,7,pedej001,Joc Pederson,10,yastm001,Mike Yastrzemski,9,fitzt001,Tyler Fitzgerald,8,sabob001,Blake Sabol,2,schmc003,Casey Schmitt,5,,Y,2023,-3,0,7,202310010,0.236250,0.257696,0.306170,0.335333,0.385382,0.456356,0.691552,0.791690,59.0,104.0,16.0,25.0,117.0,75.0,0.275194,0.246288,0.100775,0.116806,0.220061,0.263969,0.297696,0.332168,0.367451,0.438343,0.665147,0.770511,10.0,22.0,3.0,6.0,31.0,16.0,0.251791,0.241811,0.110542,0.102119
56767,20231001,0,Sun,CIN,NL,162,SLN,NL,162,3,4,51,D,,,,STL10,44614.0,136,101000100,01300000x,35,9,4,0,1,3,0,0,0,0,0,14,1,1,0,0,5,3,4,4,0,0,24,6,0,0,0,0,30,9,3,0,0,4,1,1,2,1,0,9,1,1,0,0,7,3,3,3,0,0,27,3,0,0,1,0,lives901,Shane Livensparger,rippm901,Mark Ripperger,cuzzp901,Phil Cuzzi,belld901,Dan Bellino,,(none),,(none),belld002,David Bell,marmo801,Oliver Marmol,mikom001,Miles Mikolas,greeh001,Hunter Greene,helsr001,Ryan Helsley,bakel001,Luken Baker,greeh001,Hunter Greene,mikom001,Miles Mikolas,martn003,Nick Martini,7,delae003,Elly De La Cruz,6,vottj001,Joey Votto,3,encac001,Christian Encarnacion-Strand,10,martn004,Noelvi Marte,5,bensw001,Will Benson,9,senzn001,Nick Senzel,4,fairs001,Stuart Fairchild,8,maill001,Luke Maile,2,edmat001,Tommy Edman,8,nootl001,Lars Nootbaar,10,walkj003,Jordan Walker,9,bakel001,Luken Baker,3,palar002,Richie Palacios,7,kniza001,Andrew Knizner,2,fermj001,Jose Fermin,5,lopei001,Irving Lopez,4,winnm001,Masyn Winn,6,,Y,2023,1,1,7,202310010,0.249365,0.248954,0.319803,0.318369,0.415125,0.418440,0.734928,0.736809,101.0,189.0,28.0,47.0,68.0,91.0,0.239753,0.272049,0.103555,0.101837,0.227408,0.251969,0.310284,0.322638,0.368421,0.439961,0.678705,0.762599,26.0,36.0,4.0,10.0,13.0,21.0,0.230387,0.261811,0.120159,0.104331
56768,20231001,0,Sun,OAK,AL,162,ANA,AL,162,3,7,51,D,,,,ANA01,26539.0,152,000000111,10113100x,34,10,2,0,1,3,0,0,0,4,0,6,1,0,2,0,8,4,7,7,1,1,24,6,1,0,1,0,33,10,2,0,3,5,0,0,2,6,1,10,1,0,1,0,10,3,3,3,1,1,27,14,1,0,2,0,walsb901,Brian Walsh,may-b901,Ben May,nelsj901,Jeff Nelson,navaj901,Jose Navas,,(none),,(none),kotsm001,Mark Kotsay,nevip001,Phil Nevin,fulmc001,Carson Fulmer,searj001,JP Sears,,(none),drurb001,Brandon Drury,searj001,JP Sears,fulmc001,Carson Fulmer,ruize001,Esteury Ruiz,9,geloz001,Zack Gelof,4,nodar001,Ryan Noda,3,rookb001,Brent Rooker,10,bledj001,JJ Bleday,7,butll001,Lawrence Butler,8,diazj008,Jordan Diaz,5,sodet001,Tyler Soderstrom,2,allen002,Nick Allen,6,gricr001,Randal Grichuk,7,netoz001,Zach Neto,6,drurb001,Brandon Drury,3,ohopl001,Logan O'Hoppe,2,adelj001,Jo Adell,9,escoe001,Eduardo Escobar,10,stefm001,Michael Stefanic,5,fletd002,David Fletcher,4,philb002,Brett Phillips,8,,Y,2023,4,1,10,202310010,0.244578,0.222662,0.309167,0.289138,0.424640,0.369532,0.733807,0.658670,71.0,149.0,31.0,31.0,94.0,101.0,0.276654,0.282428,0.093494,0.093514,0.229557,0.224049,0.283226,0.279580,0.389163,0.388489,0.672389,0.668069,8.0,28.0,8.0,7.0,14.0,20.0,0.287685,0.294964,0.074877,0.077081


In [31]:
# Join odds and game data by date and teams 
merged_df = game_df.merge(odds_df, how = 'left', left_on = ['date', 'team_h', 'team_v'], right_on = ['date_numeric', 'home_team_short', 'away_team_short'])
merged_df.drop(['home_team_short', 'away_team_short', 'date_numeric', 'home_score', 'away_score', 'home_team', 'away_team', 'season_y', 'date_y'], axis = 1, inplace=True)
merged_df.head(-5)


Unnamed: 0,date_x,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season_x,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OPS_162_h,OPS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SO_perc_162_h,SO_perc_162_v,BB_perc_162_h,BB_perc_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OPS_30_h,OPS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SO_perc_30_h,SO_perc_30_v,BB_perc_30_h,BB_perc_30_v,away_point_spread,away_point_spread_line,away_money_line,home_point_spread,home_point_spread_line,home_money_line,over_under,over_line,under_line
0,20000329,0,Wed,CHN,NL,1,NYN,NL,1,5,3,54,N,,,,TOK01,55000.0,206,100010210,001000020,33,12,1,0,2,5,1,0,1,10,0,5,1,0,4,0,13,3,3,3,0,0,27,10,2,0,1,0,33,7,1,0,1,3,1,1,0,3,0,4,0,0,1,0,8,5,5,5,1,0,27,12,0,0,4,0,marsr901,Randy Marsh,herna901,Angel Hernandez,fostm901,Marty Foster,kulpr901,Ron Kulpa,,(none),,(none),bayld001,Don Baylor,valeb102,Bobby Valentine,liebj001,Jon Lieber,hampm001,Mike Hampton,aguir001,Rick Aguilera,andrs001,Shane Andrews,liebj001,Jon Lieber,hampm001,Mike Hampton,youne001,Eric Young,4,bufod001,Damon Buford,8,gracm001,Mark Grace,3,sosas001,Sammy Sosa,9,rodrh001,Henry Rodriguez,7,andrs001,Shane Andrews,5,nievj002,Jose Nieves,6,giraj001,Joe Girardi,2,liebj001,Jon Lieber,1,hendr001,Rickey Henderson,7,hamid001,Darryl Hamilton,8,alfoe001,Edgardo Alfonzo,4,piazm001,Mike Piazza,2,ventr001,Robin Ventura,5,belld001,Derek Bell,9,zeilt001,Todd Zeile,3,ordor001,Rey Ordonez,6,hampm001,Mike Hampton,1,,Y,2000,-2,0,8,200003290,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,20000330,0,Thu,NYN,NL,2,CHN,NL,2,5,1,66,N,,,,TOK01,55000.0,235,00001000004,00001000000,37,6,2,0,1,5,1,1,1,8,0,5,1,0,0,0,10,5,0,0,0,0,33,14,2,0,2,0,36,5,0,0,0,0,2,0,0,6,1,9,0,0,2,0,10,7,5,5,0,0,33,14,0,0,0,0,herna901,Angel Hernandez,fostm901,Marty Foster,kulpr901,Ron Kulpa,marsr901,Randy Marsh,,(none),,(none),valeb102,Bobby Valentine,bayld001,Don Baylor,cookd001,Dennis Cook,yound002,Danny Young,,(none),agbab001,Benny Agbayani,reedr002,Rick Reed,farnk001,Kyle Farnsworth,hendr001,Rickey Henderson,7,hamid001,Darryl Hamilton,8,alfoe001,Edgardo Alfonzo,4,piazm001,Mike Piazza,2,ventr001,Robin Ventura,5,belld001,Derek Bell,9,zeilt001,Todd Zeile,3,ordor001,Rey Ordonez,6,reedr002,Rick Reed,1,youne001,Eric Young,4,bufod001,Damon Buford,8,sosas001,Sammy Sosa,9,gracm001,Mark Grace,3,rodrh001,Henry Rodriguez,7,andrs001,Shane Andrews,5,husoj001,Jeff Huson,6,giraj001,Joe Girardi,2,farnk001,Kyle Farnsworth,1,,Y,2000,-4,0,6,200003300,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,20000403,0,Mon,COL,NL,1,ATL,NL,1,0,2,51,D,,,,ATL02,42255.0,134,000000000,00000020x,31,6,2,0,0,0,1,0,0,2,2,7,0,0,1,0,7,3,2,2,1,0,24,10,0,0,1,0,30,7,0,0,2,2,0,0,1,1,0,6,1,0,1,0,6,2,0,0,0,0,27,12,0,0,1,0,hirsj901,John Hirschbeck,willc901,Charlie Williams,wegnm901,Mark Wegner,reynj901,Jim Reynolds,,(none),,(none),bellb001,Buddy Bell,cox-b103,Bobby Cox,maddg002,Greg Maddux,astap001,Pedro Astacio,remlm001,Mike Remlinger,galaa001,Andres Galarraga,astap001,Pedro Astacio,maddg002,Greg Maddux,goodt001,Tom Goodwin,8,lansm001,Mike Lansing,4,walkl001,Larry Walker,9,cirij001,Jeff Cirillo,5,heltt001,Todd Helton,3,hammj001,Jeffrey Hammonds,7,peren001,Neifi Perez,6,maynb001,Brent Mayne,2,astap001,Pedro Astacio,1,veraq001,Quilvio Veras,4,sandr002,Reggie Sanders,7,jonec004,Chipper Jones,5,jordb001,Brian Jordan,9,galaa001,Andres Galarraga,3,jonea002,Andruw Jones,8,peree002,Eddie Perez,2,weisw001,Walt Weiss,6,maddg002,Greg Maddux,1,,Y,2000,2,1,2,200004030,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,20000403,0,Mon,MIL,NL,1,CIN,NL,1,3,3,31,D,,,,CIN08,55596.0,111,002100,21000x,22,7,1,0,0,2,0,0,0,5,0,1,1,0,0,0,8,1,3,3,0,0,15,5,0,0,0,0,19,5,1,0,1,3,0,0,0,1,0,4,0,0,0,0,2,2,2,2,0,0,16,8,2,0,0,0,marsr901,Randy Marsh,herna901,Angel Hernandez,fostm901,Marty Foster,kulpr901,Ron Kulpa,,(none),,(none),loped001,Davey Lopes,mckej801,Jack McKeon,,,,,,(none),,(none),woods001,Steve Woodard,harnp001,Pete Harnisch,grism001,Marquis Grissom,8,lorem001,Mark Loretta,6,burnj001,Jeromy Burnitz,9,jenkg001,Geoff Jenkins,7,hernj001,Jose Hernandez,5,barkk001,Kevin Barker,3,bellr002,Ronnie Belliard,4,blanh001,Henry Blanco,2,woods001,Steve Woodard,1,reesp001,Pokey Reese,4,larkb001,Barry Larkin,6,grifk002,Ken Griffey,8,bichd001,Dante Bichette,9,yound001,Dmitri Young,3,taube001,Ed Taubensee,2,boona001,Aaron Boone,5,tuckm001,Michael Tucker,7,harnp001,Pete Harnisch,1,,Y,2000,0,0,6,200004030,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,20000403,0,Mon,SFN,NL,1,FLO,NL,1,4,6,51,N,,,,MIA01,35101.0,166,002100001,20002101x,35,10,2,2,1,4,0,0,0,1,0,8,0,0,2,0,5,2,4,4,0,0,24,7,2,0,1,0,36,12,3,0,0,5,0,0,1,1,0,7,1,0,1,0,8,3,4,4,0,0,27,15,0,0,2,0,demud901,Dana DeMuth,relic901,Charlie Reliford,eddid901,Doug Eddings,carlm901,Mark Carlson,,(none),,(none),baked002,Dusty Baker,bolej801,John Boles,ferna001,Alex Fernandez,hernl003,Livan Hernandez,alfoa001,Antonio Alfonseca,,(none),hernl003,Livan Hernandez,ferna001,Alex Fernandez,benam001,Marvin Benard,8,muelb001,Bill Mueller,5,bondb001,Barry Bonds,7,kentj001,Jeff Kent,4,snowj001,J.T. Snow,3,burke001,Ellis Burks,9,aurir001,Rich Aurilia,6,estab001,Bobby Estalella,2,hernl003,Livan Hernandez,1,castl001,Luis Castillo,4,gonza002,Alex Gonzalez,6,floyc001,Cliff Floyd,7,wilsp002,Preston Wilson,8,lowem001,Mike Lowell,5,millk005,Kevin Millar,3,browb003,Brant Brown,9,redmm001,Mike Redmond,2,ferna001,Alex Fernandez,1,,Y,2000,2,1,10,200004030,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
57345,20231001,0,Sun,MIA,NL,162,PIT,NL,162,0,3,51,D,,,,PIT08,22954.0,137,000000000,00000003x,29,3,0,0,0,0,0,0,0,1,0,11,0,1,1,0,3,3,3,3,0,0,24,9,1,0,0,0,29,6,4,1,0,3,0,0,0,5,0,9,0,2,0,0,7,5,0,0,1,0,27,9,1,0,1,0,lentn901,Nic Lentz,rehaj901,Jeremie Rehak,ramoc901,Charlie Ramos,fairc901,Chad Fairchild,,(none),,(none),mattd001,Don Mattingly,sheld801,Derek Shelton,mored002,Dauri Moreta,hoeib001,Bryan Hoeing,bednd001,David Bednar,andum001,Miguel Andujar,weatr001,Ryan Weathers,jacka003,Andre Jackson,edwax001,Xavier Edwards,4,delab001,Bryan De La Cruz,7,sancj003,Jesus Sanchez,9,gurry001,Yulieski Gurriel,3,hampg001,Garrett Hampson,8,wendj002,Joey Wendle,6,stalj001,Jacob Stallings,10,fortn001,Nick Fortes,2,bertj001,Jon Berti,5,joe-c001,Connor Joe,3,trioj001,Jared Triolo,5,andum001,Miguel Andujar,9,suwij001,Jack Suwinski,7,davih001,Henry Davis,10,pegul001,Liover Peguero,6,gonzn001,Nick Gonzales,4,bae-j001,Ji Hwan Bae,8,delaj004,Jason Delay,2,,Y,2023,3,1,3,202310010,0.239734,0.260403,0.310518,0.314584,0.392157,0.407959,0.702675,0.722543,117.0,87.0,39.0,20.0,92.0,97.0,0.270070,0.232782,0.102664,0.079048,0.259615,0.265885,0.317981,0.325853,0.419231,0.434995,0.737211,0.760848,21.0,20.0,5.0,1.0,14.0,21.0,0.275962,0.232649,0.085577,0.088954,,,,,,,,,
57346,20231001,0,Sun,LAN,NL,162,SFN,NL,162,5,2,54,D,,,,SFO03,38359.0,164,000005000,000001010,34,7,0,0,1,5,0,0,3,3,0,8,1,0,0,0,8,4,2,2,1,0,27,10,1,0,0,0,31,3,0,0,2,2,0,0,1,2,0,9,0,0,0,0,5,4,5,5,1,0,27,3,0,0,0,0,barrl901,Lance Barrett,arrid901,David Arrieta,segac901,Chris Segal,cejan901,Nestor Ceja,,(none),,(none),robed001,Dave Roberts,kaplg001,Gabe Kapler,gonzv001,Victor Gonzalez,brebj001,John Brebbia,phile001,Evan Phillips,rosaa003,Amed Rosario,millb005,Bobby Miller,harrk001,Kyle Harrison,bettm001,Mookie Betts,9,freef001,Freddie Freeman,3,smitw003,Will Smith,2,martj006,J.D. Martinez,10,muncm001,Max Muncy,5,taylc001,Chris Taylor,7,rosaa003,Amed Rosario,4,outmj002,James Outman,8,herne001,Enrique Hernandez,6,crawb001,Brandon Crawford,6,wadel001,LaMonte Wade,3,estrt001,Thairo Estrada,4,confm001,Michael Conforto,7,pedej001,Joc Pederson,10,yastm001,Mike Yastrzemski,9,fitzt001,Tyler Fitzgerald,8,sabob001,Blake Sabol,2,schmc003,Casey Schmitt,5,,Y,2023,-3,0,7,202310010,0.236250,0.257696,0.306170,0.335333,0.385382,0.456356,0.691552,0.791690,59.0,104.0,16.0,25.0,117.0,75.0,0.275194,0.246288,0.100775,0.116806,0.220061,0.263969,0.297696,0.332168,0.367451,0.438343,0.665147,0.770511,10.0,22.0,3.0,6.0,31.0,16.0,0.251791,0.241811,0.110542,0.102119,-1.5,105.0,-155.0,1.5,-125.0,142.0,8.0,-113.0,-107.0
57347,20231001,0,Sun,CIN,NL,162,SLN,NL,162,3,4,51,D,,,,STL10,44614.0,136,101000100,01300000x,35,9,4,0,1,3,0,0,0,0,0,14,1,1,0,0,5,3,4,4,0,0,24,6,0,0,0,0,30,9,3,0,0,4,1,1,2,1,0,9,1,1,0,0,7,3,3,3,0,0,27,3,0,0,1,0,lives901,Shane Livensparger,rippm901,Mark Ripperger,cuzzp901,Phil Cuzzi,belld901,Dan Bellino,,(none),,(none),belld002,David Bell,marmo801,Oliver Marmol,mikom001,Miles Mikolas,greeh001,Hunter Greene,helsr001,Ryan Helsley,bakel001,Luken Baker,greeh001,Hunter Greene,mikom001,Miles Mikolas,martn003,Nick Martini,7,delae003,Elly De La Cruz,6,vottj001,Joey Votto,3,encac001,Christian Encarnacion-Strand,10,martn004,Noelvi Marte,5,bensw001,Will Benson,9,senzn001,Nick Senzel,4,fairs001,Stuart Fairchild,8,maill001,Luke Maile,2,edmat001,Tommy Edman,8,nootl001,Lars Nootbaar,10,walkj003,Jordan Walker,9,bakel001,Luken Baker,3,palar002,Richie Palacios,7,kniza001,Andrew Knizner,2,fermj001,Jose Fermin,5,lopei001,Irving Lopez,4,winnm001,Masyn Winn,6,,Y,2023,1,1,7,202310010,0.249365,0.248954,0.319803,0.318369,0.415125,0.418440,0.734928,0.736809,101.0,189.0,28.0,47.0,68.0,91.0,0.239753,0.272049,0.103555,0.101837,0.227408,0.251969,0.310284,0.322638,0.368421,0.439961,0.678705,0.762599,26.0,36.0,4.0,10.0,13.0,21.0,0.230387,0.261811,0.120159,0.104331,-1.5,138.0,-116.0,1.5,-157.0,106.0,8.5,-120.0,-100.0
57348,20231001,0,Sun,OAK,AL,162,ANA,AL,162,3,7,51,D,,,,ANA01,26539.0,152,000000111,10113100x,34,10,2,0,1,3,0,0,0,4,0,6,1,0,2,0,8,4,7,7,1,1,24,6,1,0,1,0,33,10,2,0,3,5,0,0,2,6,1,10,1,0,1,0,10,3,3,3,1,1,27,14,1,0,2,0,walsb901,Brian Walsh,may-b901,Ben May,nelsj901,Jeff Nelson,navaj901,Jose Navas,,(none),,(none),kotsm001,Mark Kotsay,nevip001,Phil Nevin,fulmc001,Carson Fulmer,searj001,JP Sears,,(none),drurb001,Brandon Drury,searj001,JP Sears,fulmc001,Carson Fulmer,ruize001,Esteury Ruiz,9,geloz001,Zack Gelof,4,nodar001,Ryan Noda,3,rookb001,Brent Rooker,10,bledj001,JJ Bleday,7,butll001,Lawrence Butler,8,diazj008,Jordan Diaz,5,sodet001,Tyler Soderstrom,2,allen002,Nick Allen,6,gricr001,Randal Grichuk,7,netoz001,Zach Neto,6,drurb001,Brandon Drury,3,ohopl001,Logan O'Hoppe,2,adelj001,Jo Adell,9,escoe001,Eduardo Escobar,10,stefm001,Michael Stefanic,5,fletd002,David Fletcher,4,philb002,Brett Phillips,8,,Y,2023,4,1,10,202310010,0.244578,0.222662,0.309167,0.289138,0.424640,0.369532,0.733807,0.658670,71.0,149.0,31.0,31.0,94.0,101.0,0.276654,0.282428,0.093494,0.093514,0.229557,0.224049,0.283226,0.279580,0.389163,0.388489,0.672389,0.668069,8.0,28.0,8.0,7.0,14.0,20.0,0.287685,0.294964,0.074877,0.077081,,,,,,,,,


In [35]:
# Remove games with no odds
no_nans = merged_df[~merged_df['home_point_spread'].isna()]
no_nans.rename(columns={'date_x':'date'}, inplace= True)

no_nans.head()

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  return super().rename(


Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season_x,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OPS_162_h,OPS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SO_perc_162_h,SO_perc_162_v,BB_perc_162_h,BB_perc_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OPS_30_h,OPS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SO_perc_30_h,SO_perc_30_v,BB_perc_30_h,BB_perc_30_v,away_point_spread,away_point_spread_line,away_money_line,home_point_spread,home_point_spread_line,home_money_line,over_under,over_line,under_line
34011,20140322,0,Sat,LAN,NL,1,ARI,NL,1,3,1,54,N,,,,SYD01,38266.0,169,10200000,000001000,33,5,2,0,1,3,0,0,1,3,0,11,0,0,0,0,7,4,1,1,1,0,27,13,1,0,0,0,33,5,1,0,0,1,0,0,0,2,0,10,0,0,0,0,7,5,3,3,1,0,27,10,1,0,0,0,welkt901,Tim Welke,scotd901,Dale Scott,diazl901,Laz Diaz,carlm901,Mark Carlson,,(none),,(none),mattd001,Don Mattingly,gibsk001,Kirk Gibson,kersc001,Clayton Kershaw,milew001,Wade Miley,jansk001,Kenley Jansen,ethia001,Andre Ethier,kersc001,Clayton Kershaw,milew001,Wade Miley,puigy001,Yasiel Puig,9,turnj001,Justin Turner,4,ramih003,Hanley Ramirez,6,gonza003,Adrian Gonzalez,3,vanss001,Scott Van Slyke,7,uribj002,Juan Uribe,5,ethia001,Andre Ethier,8,ellia001,A.J. Ellis,2,kersc001,Clayton Kershaw,1,polla001,A.J. Pollock,8,hilla001,Aaron Hill,4,goldp001,Paul Goldschmidt,3,pradm001,Martin Prado,5,trumm001,Mark Trumbo,7,montm001,Miguel Montero,2,owinc001,Chris Owings,6,parrg001,Gerardo Parra,9,milew001,Wade Miley,1,,Y,2014,-2,0,4,201403220,0.258633,0.263522,0.320743,0.322272,0.391473,0.396285,0.712215,0.718557,62.0,78.0,41.0,28.0,75.0,109.0,0.201198,0.208705,0.091438,0.086687,0.253644,0.256335,0.313673,0.311372,0.377065,0.41423,0.690738,0.725602,14.0,12.0,6.0,8.0,11.0,16.0,0.190476,0.222222,0.087464,0.079922,-1.5,-103.0,-170.0,1.5,-115.0,150.0,6.5,-110.0,-110.0
34012,20140322,0,Sat,LAN,NL,1,ARI,NL,1,3,1,54,N,,,,SYD01,38266.0,169,10200000,000001000,33,5,2,0,1,3,0,0,1,3,0,11,0,0,0,0,7,4,1,1,1,0,27,13,1,0,0,0,33,5,1,0,0,1,0,0,0,2,0,10,0,0,0,0,7,5,3,3,1,0,27,10,1,0,0,0,welkt901,Tim Welke,scotd901,Dale Scott,diazl901,Laz Diaz,carlm901,Mark Carlson,,(none),,(none),mattd001,Don Mattingly,gibsk001,Kirk Gibson,kersc001,Clayton Kershaw,milew001,Wade Miley,jansk001,Kenley Jansen,ethia001,Andre Ethier,kersc001,Clayton Kershaw,milew001,Wade Miley,puigy001,Yasiel Puig,9,turnj001,Justin Turner,4,ramih003,Hanley Ramirez,6,gonza003,Adrian Gonzalez,3,vanss001,Scott Van Slyke,7,uribj002,Juan Uribe,5,ethia001,Andre Ethier,8,ellia001,A.J. Ellis,2,kersc001,Clayton Kershaw,1,polla001,A.J. Pollock,8,hilla001,Aaron Hill,4,goldp001,Paul Goldschmidt,3,pradm001,Martin Prado,5,trumm001,Mark Trumbo,7,montm001,Miguel Montero,2,owinc001,Chris Owings,6,parrg001,Gerardo Parra,9,milew001,Wade Miley,1,,Y,2014,-2,0,4,201403220,0.258633,0.263522,0.320743,0.322272,0.391473,0.396285,0.712215,0.718557,62.0,78.0,41.0,28.0,75.0,109.0,0.201198,0.208705,0.091438,0.086687,0.253644,0.256335,0.313673,0.311372,0.377065,0.41423,0.690738,0.725602,14.0,12.0,6.0,8.0,11.0,16.0,0.190476,0.222222,0.087464,0.079922,-1.5,132.0,-119.0,1.5,-152.0,109.0,7.5,-110.0,-110.0
34014,20140330,0,Sun,LAN,NL,3,SDN,NL,1,1,3,51,N,,,,SAN02,45567.0,169,10000,00000003x,31,4,0,0,0,1,0,0,0,3,0,9,0,0,0,0,6,4,2,2,0,0,24,12,2,0,2,0,27,5,0,0,1,3,2,0,0,4,0,10,1,0,2,0,6,5,1,1,1,0,27,10,0,0,0,0,culbf901,Fieldin Culbreth,gonzm901,Manny Gonzalez,reynj901,Jim Reynolds,barbs901,Sean Barber,,(none),,(none),mattd001,Don Mattingly,blacb001,Buddy Black,thayd001,Dale Thayer,wilsb001,Brian Wilson,streh001,Huston Street,denoc001,Chris Denorfia,ryu-h001,Hyun-Jin Ryu,casha001,Andrew Cashner,crawc002,Carl Crawford,7,puigy001,Yasiel Puig,9,ramih003,Hanley Ramirez,6,gonza003,Adrian Gonzalez,3,ethia001,Andre Ethier,8,uribj002,Juan Uribe,5,ellia001,A.J. Ellis,2,gordd002,Dee Strange-Gordon,4,ryu-h001,Hyun-Jin Ryu,1,cabre001,Everth Cabrera,6,denoc001,Chris Denorfia,9,headc001,Chase Headley,5,gyorj001,Jedd Gyorko,4,alony001,Yonder Alonso,3,medit001,Tommy Medica,7,venaw001,Will Venable,8,river003,Rene Rivera,2,casha001,Andrew Cashner,1,,Y,2014,2,1,4,201403300,0.244517,0.264775,0.303476,0.324252,0.377923,0.397527,0.681399,0.721779,118.0,79.0,34.0,27.0,82.0,109.0,0.237267,0.208765,0.084647,0.088016,0.233533,0.25561,0.296059,0.315695,0.359281,0.401951,0.65534,0.717646,21.0,10.0,6.0,8.0,13.0,16.0,0.266467,0.229268,0.088822,0.087805,-1.5,141.0,-115.0,1.5,-162.0,105.0,6.5,-110.0,-110.0
34015,20140331,0,Mon,SEA,AL,1,ANA,AL,1,10,3,54,N,,,,ANA01,44152.0,197,10001206,201000000,36,11,4,2,1,10,0,1,0,8,1,11,1,1,0,0,8,5,2,2,2,0,27,5,1,0,0,0,34,6,1,0,1,3,0,0,1,1,0,13,1,0,0,0,6,5,9,9,0,0,27,7,1,0,0,0,westj901,Joe West,fostm901,Marty Foster,drakr901,Rob Drake,porta901,Alan Porter,,(none),,(none),mccll001,Lloyd McClendon,sciom001,Mike Scioscia,hernf002,Felix Hernandez,weavj003,Jered Weaver,,(none),almoa001,Abraham Almonte,hernf002,Felix Hernandez,weavj003,Jered Weaver,almoa001,Abraham Almonte,8,millb002,Brad Miller,6,canor001,Robinson Cano,4,smoaj001,Justin Smoak,3,morrl001,Logan Morrison,10,seagk001,Kyle Seager,5,saunm001,Michael Saunders,9,ackld001,Dustin Ackley,7,zunim001,Mike Zunino,2,calhk001,Kole Calhoun,9,troum001,Mike Trout,8,pujoa001,Albert Pujols,3,hamij003,Josh Hamilton,7,freed001,David Freese,5,ibanr001,Raul Ibanez,10,kendh001,Howie Kendrick,4,iannc001,Chris Iannetta,2,aybae001,Erick Aybar,6,,Y,2014,-7,0,13,201403310,0.264137,0.237136,0.327115,0.303434,0.41446,0.389529,0.741575,0.692962,82.0,49.0,34.0,23.0,112.0,88.0,0.218504,0.243433,0.093593,0.095178,0.269455,0.216749,0.327061,0.29646,0.419261,0.360591,0.746322,0.657051,15.0,11.0,7.0,6.0,21.0,20.0,0.2393,0.252217,0.085603,0.1133,1.5,-199.0,104.0,-1.5,169.0,-114.0,7.0,-110.0,-110.0
34016,20140331,0,Mon,BOS,AL,1,BAL,AL,1,1,2,51,D,,,,BAL12,46685.0,173,100000,01000010x,36,9,2,0,1,1,0,0,1,3,0,6,0,0,0,0,12,2,2,2,0,0,24,11,0,0,2,0,28,6,0,0,1,1,0,0,0,1,0,9,0,0,2,0,3,5,1,1,0,0,27,13,0,0,0,0,demud901,Dana DeMuth,kulpr901,Ron Kulpa,hicke901,Ed Hickox,barrl901,Lance Barrett,,(none),,(none),farrj001,John Farrell,showb801,Buck Showalter,britz001,Zack Britton,lestj001,Jon Lester,huntt002,Tommy Hunter,cruzn002,Nelson Cruz,lestj001,Jon Lester,tillc001,Chris Tillman,navad002,Daniel Nava,9,pedrd001,Dustin Pedroia,4,ortid001,David Ortiz,10,napom001,Mike Napoli,3,carpm001,Mike Carp,7,sizeg001,Grady Sizemore,8,bogax001,Xander Bogaerts,6,piera001,A.J. Pierzynski,2,middw001,Will Middlebrooks,5,markn001,Nick Markakis,9,hardj003,J.J. Hardy,6,jonea003,Adam Jones,8,davic003,Chris Davis,3,cruzn002,Nelson Cruz,7,wietm001,Matt Wieters,2,yound003,Delmon Young,10,flahr001,Ryan Flaherty,5,schoj001,Jonathan Schoop,4,,Y,2014,1,1,3,201403310,0.259786,0.277119,0.310802,0.344512,0.430961,0.446116,0.741763,0.790628,79.0,123.0,29.0,19.0,54.0,80.0,0.200178,0.231463,0.074021,0.102814,0.24283,0.293447,0.296625,0.360275,0.397706,0.488129,0.694331,0.848404,11.0,24.0,5.0,0.0,15.0,8.0,0.208413,0.235518,0.076482,0.104463,-1.5,141.0,-115.0,1.5,-162.0,105.0,9.0,-110.0,-110.0


In [45]:
# Add the implied win probability as columns
def line_to_prob(line):
    prob_underdog = 100/(np.abs(line)+100) # this is the probability for the 
    add_term = ((1-np.sign(line))/2) # 0 if negative, 1 if positive
    mult_factor = np.sign(line) # -1 if negative, 1 if positive
    # if line is positive, team is underdog, give 0 + 1*prob_underdog
    # if line is negative, team is favoritesm give 1 + (-1)*prob_underdog
    imp_prob = add_term + mult_factor * prob_underdog 
    return(imp_prob)

implied_prob_h_ls = []
implied_prob_v_ls = []

for home_ml, away_ml in zip(no_nans['home_money_line'], no_nans['away_money_line']):
    implied_prob_h_ls.append(line_to_prob(home_ml))
    implied_prob_v_ls.append(line_to_prob(away_ml))

no_nans['implied_prob_h'] = implied_prob_h_ls
no_nans['implied_prob_v'] = implied_prob_v_ls

no_nans.head()

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  no_nans['implied_prob_h'] = implied_prob_h_ls
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  no_nans['implied_prob_v'] = implied_prob_v_ls


Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season_x,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OPS_162_h,OPS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SO_perc_162_h,SO_perc_162_v,BB_perc_162_h,BB_perc_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OPS_30_h,OPS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SO_perc_30_h,SO_perc_30_v,BB_perc_30_h,BB_perc_30_v,away_point_spread,away_point_spread_line,away_money_line,home_point_spread,home_point_spread_line,home_money_line,over_under,over_line,under_line,implied_prob_h,implied_prob_v
34011,20140322,0,Sat,LAN,NL,1,ARI,NL,1,3,1,54,N,,,,SYD01,38266.0,169,10200000,000001000,33,5,2,0,1,3,0,0,1,3,0,11,0,0,0,0,7,4,1,1,1,0,27,13,1,0,0,0,33,5,1,0,0,1,0,0,0,2,0,10,0,0,0,0,7,5,3,3,1,0,27,10,1,0,0,0,welkt901,Tim Welke,scotd901,Dale Scott,diazl901,Laz Diaz,carlm901,Mark Carlson,,(none),,(none),mattd001,Don Mattingly,gibsk001,Kirk Gibson,kersc001,Clayton Kershaw,milew001,Wade Miley,jansk001,Kenley Jansen,ethia001,Andre Ethier,kersc001,Clayton Kershaw,milew001,Wade Miley,puigy001,Yasiel Puig,9,turnj001,Justin Turner,4,ramih003,Hanley Ramirez,6,gonza003,Adrian Gonzalez,3,vanss001,Scott Van Slyke,7,uribj002,Juan Uribe,5,ethia001,Andre Ethier,8,ellia001,A.J. Ellis,2,kersc001,Clayton Kershaw,1,polla001,A.J. Pollock,8,hilla001,Aaron Hill,4,goldp001,Paul Goldschmidt,3,pradm001,Martin Prado,5,trumm001,Mark Trumbo,7,montm001,Miguel Montero,2,owinc001,Chris Owings,6,parrg001,Gerardo Parra,9,milew001,Wade Miley,1,,Y,2014,-2,0,4,201403220,0.258633,0.263522,0.320743,0.322272,0.391473,0.396285,0.712215,0.718557,62.0,78.0,41.0,28.0,75.0,109.0,0.201198,0.208705,0.091438,0.086687,0.253644,0.256335,0.313673,0.311372,0.377065,0.41423,0.690738,0.725602,14.0,12.0,6.0,8.0,11.0,16.0,0.190476,0.222222,0.087464,0.079922,-1.5,-103.0,-170.0,1.5,-115.0,150.0,6.5,-110.0,-110.0,0.4,0.62963
34012,20140322,0,Sat,LAN,NL,1,ARI,NL,1,3,1,54,N,,,,SYD01,38266.0,169,10200000,000001000,33,5,2,0,1,3,0,0,1,3,0,11,0,0,0,0,7,4,1,1,1,0,27,13,1,0,0,0,33,5,1,0,0,1,0,0,0,2,0,10,0,0,0,0,7,5,3,3,1,0,27,10,1,0,0,0,welkt901,Tim Welke,scotd901,Dale Scott,diazl901,Laz Diaz,carlm901,Mark Carlson,,(none),,(none),mattd001,Don Mattingly,gibsk001,Kirk Gibson,kersc001,Clayton Kershaw,milew001,Wade Miley,jansk001,Kenley Jansen,ethia001,Andre Ethier,kersc001,Clayton Kershaw,milew001,Wade Miley,puigy001,Yasiel Puig,9,turnj001,Justin Turner,4,ramih003,Hanley Ramirez,6,gonza003,Adrian Gonzalez,3,vanss001,Scott Van Slyke,7,uribj002,Juan Uribe,5,ethia001,Andre Ethier,8,ellia001,A.J. Ellis,2,kersc001,Clayton Kershaw,1,polla001,A.J. Pollock,8,hilla001,Aaron Hill,4,goldp001,Paul Goldschmidt,3,pradm001,Martin Prado,5,trumm001,Mark Trumbo,7,montm001,Miguel Montero,2,owinc001,Chris Owings,6,parrg001,Gerardo Parra,9,milew001,Wade Miley,1,,Y,2014,-2,0,4,201403220,0.258633,0.263522,0.320743,0.322272,0.391473,0.396285,0.712215,0.718557,62.0,78.0,41.0,28.0,75.0,109.0,0.201198,0.208705,0.091438,0.086687,0.253644,0.256335,0.313673,0.311372,0.377065,0.41423,0.690738,0.725602,14.0,12.0,6.0,8.0,11.0,16.0,0.190476,0.222222,0.087464,0.079922,-1.5,132.0,-119.0,1.5,-152.0,109.0,7.5,-110.0,-110.0,0.478469,0.543379
34014,20140330,0,Sun,LAN,NL,3,SDN,NL,1,1,3,51,N,,,,SAN02,45567.0,169,10000,00000003x,31,4,0,0,0,1,0,0,0,3,0,9,0,0,0,0,6,4,2,2,0,0,24,12,2,0,2,0,27,5,0,0,1,3,2,0,0,4,0,10,1,0,2,0,6,5,1,1,1,0,27,10,0,0,0,0,culbf901,Fieldin Culbreth,gonzm901,Manny Gonzalez,reynj901,Jim Reynolds,barbs901,Sean Barber,,(none),,(none),mattd001,Don Mattingly,blacb001,Buddy Black,thayd001,Dale Thayer,wilsb001,Brian Wilson,streh001,Huston Street,denoc001,Chris Denorfia,ryu-h001,Hyun-Jin Ryu,casha001,Andrew Cashner,crawc002,Carl Crawford,7,puigy001,Yasiel Puig,9,ramih003,Hanley Ramirez,6,gonza003,Adrian Gonzalez,3,ethia001,Andre Ethier,8,uribj002,Juan Uribe,5,ellia001,A.J. Ellis,2,gordd002,Dee Strange-Gordon,4,ryu-h001,Hyun-Jin Ryu,1,cabre001,Everth Cabrera,6,denoc001,Chris Denorfia,9,headc001,Chase Headley,5,gyorj001,Jedd Gyorko,4,alony001,Yonder Alonso,3,medit001,Tommy Medica,7,venaw001,Will Venable,8,river003,Rene Rivera,2,casha001,Andrew Cashner,1,,Y,2014,2,1,4,201403300,0.244517,0.264775,0.303476,0.324252,0.377923,0.397527,0.681399,0.721779,118.0,79.0,34.0,27.0,82.0,109.0,0.237267,0.208765,0.084647,0.088016,0.233533,0.25561,0.296059,0.315695,0.359281,0.401951,0.65534,0.717646,21.0,10.0,6.0,8.0,13.0,16.0,0.266467,0.229268,0.088822,0.087805,-1.5,141.0,-115.0,1.5,-162.0,105.0,6.5,-110.0,-110.0,0.487805,0.534884
34015,20140331,0,Mon,SEA,AL,1,ANA,AL,1,10,3,54,N,,,,ANA01,44152.0,197,10001206,201000000,36,11,4,2,1,10,0,1,0,8,1,11,1,1,0,0,8,5,2,2,2,0,27,5,1,0,0,0,34,6,1,0,1,3,0,0,1,1,0,13,1,0,0,0,6,5,9,9,0,0,27,7,1,0,0,0,westj901,Joe West,fostm901,Marty Foster,drakr901,Rob Drake,porta901,Alan Porter,,(none),,(none),mccll001,Lloyd McClendon,sciom001,Mike Scioscia,hernf002,Felix Hernandez,weavj003,Jered Weaver,,(none),almoa001,Abraham Almonte,hernf002,Felix Hernandez,weavj003,Jered Weaver,almoa001,Abraham Almonte,8,millb002,Brad Miller,6,canor001,Robinson Cano,4,smoaj001,Justin Smoak,3,morrl001,Logan Morrison,10,seagk001,Kyle Seager,5,saunm001,Michael Saunders,9,ackld001,Dustin Ackley,7,zunim001,Mike Zunino,2,calhk001,Kole Calhoun,9,troum001,Mike Trout,8,pujoa001,Albert Pujols,3,hamij003,Josh Hamilton,7,freed001,David Freese,5,ibanr001,Raul Ibanez,10,kendh001,Howie Kendrick,4,iannc001,Chris Iannetta,2,aybae001,Erick Aybar,6,,Y,2014,-7,0,13,201403310,0.264137,0.237136,0.327115,0.303434,0.41446,0.389529,0.741575,0.692962,82.0,49.0,34.0,23.0,112.0,88.0,0.218504,0.243433,0.093593,0.095178,0.269455,0.216749,0.327061,0.29646,0.419261,0.360591,0.746322,0.657051,15.0,11.0,7.0,6.0,21.0,20.0,0.2393,0.252217,0.085603,0.1133,1.5,-199.0,104.0,-1.5,169.0,-114.0,7.0,-110.0,-110.0,0.53271,0.490196
34016,20140331,0,Mon,BOS,AL,1,BAL,AL,1,1,2,51,D,,,,BAL12,46685.0,173,100000,01000010x,36,9,2,0,1,1,0,0,1,3,0,6,0,0,0,0,12,2,2,2,0,0,24,11,0,0,2,0,28,6,0,0,1,1,0,0,0,1,0,9,0,0,2,0,3,5,1,1,0,0,27,13,0,0,0,0,demud901,Dana DeMuth,kulpr901,Ron Kulpa,hicke901,Ed Hickox,barrl901,Lance Barrett,,(none),,(none),farrj001,John Farrell,showb801,Buck Showalter,britz001,Zack Britton,lestj001,Jon Lester,huntt002,Tommy Hunter,cruzn002,Nelson Cruz,lestj001,Jon Lester,tillc001,Chris Tillman,navad002,Daniel Nava,9,pedrd001,Dustin Pedroia,4,ortid001,David Ortiz,10,napom001,Mike Napoli,3,carpm001,Mike Carp,7,sizeg001,Grady Sizemore,8,bogax001,Xander Bogaerts,6,piera001,A.J. Pierzynski,2,middw001,Will Middlebrooks,5,markn001,Nick Markakis,9,hardj003,J.J. Hardy,6,jonea003,Adam Jones,8,davic003,Chris Davis,3,cruzn002,Nelson Cruz,7,wietm001,Matt Wieters,2,yound003,Delmon Young,10,flahr001,Ryan Flaherty,5,schoj001,Jonathan Schoop,4,,Y,2014,1,1,3,201403310,0.259786,0.277119,0.310802,0.344512,0.430961,0.446116,0.741763,0.790628,79.0,123.0,29.0,19.0,54.0,80.0,0.200178,0.231463,0.074021,0.102814,0.24283,0.293447,0.296625,0.360275,0.397706,0.488129,0.694331,0.848404,11.0,24.0,5.0,0.0,15.0,8.0,0.208413,0.235518,0.076482,0.104463,-1.5,141.0,-115.0,1.5,-162.0,105.0,9.0,-110.0,-110.0,0.487805,0.534884


In [46]:
no_nans.shape

(22801, 213)

In [47]:
no_nans.to_csv('./hidden_data/mlb_game_and_odds.csv', index = False)