Baseball Prediction: 5b - Adding Starting Pitching Features

    - Now that we have raw game-level data for each pitcher, we can derive features based on the starting pitchers to help our prediction model for individual games.


In [78]:

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline

import warnings
warnings.simplefilter(action='ignore', category=pd.errors.PerformanceWarning)

pd.set_option('display.max_columns',1000)
pd.set_option('display.max_rows',1000)

Overall Plan of Attack

    - For each starting pitcher we will load their raw data, create features for each game based on their previous performance, and then save the dataframe in a dictionary structure for easy lookup

    - Then we can iterate through our game-level dataframe, add in the features for each starting pitcher, and use those to improve our model

Once again, we will use C.C. Sabathia as our example candidate

In [79]:
df_cc = pd.read_csv('/Volumes/CharmedXi/beatVegas/SP_2000/pitching_data_sabac001.csv')

In [80]:
df_cc.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 561 entries, 0 to 560
Data columns (total 31 columns):
 #   Column       Non-Null Count  Dtype  
---  ------       --------------  -----  
 0   at_vs        561 non-null    object 
 1   Opponent     561 non-null    object 
 2   League       561 non-null    object 
 3   GS           561 non-null    int64  
 4   CG           561 non-null    int64  
 5   SHO          561 non-null    int64  
 6   GF           561 non-null    int64  
 7   SV           561 non-null    int64  
 8   IP           561 non-null    float64
 9   H            561 non-null    int64  
 10  BFP          561 non-null    int64  
 11  HR           561 non-null    int64  
 12  R            561 non-null    int64  
 13  ER           561 non-null    int64  
 14  BB           561 non-null    int64  
 15  IB           561 non-null    int64  
 16  SO           561 non-null    int64  
 17  SH           561 non-null    int64  
 18  SF           561 non-null    int64  
 19  WP      

In [81]:
df_cc.head(10)

Unnamed: 0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,date,dblhead_num
0,VS,BAL,A,1,0,0,0,0,5.2,3,22,1,3,3,2,0,3,0,0,1,0,0,2,0,0,0,0,0,4.76,4- 8-2001,
1,AT,DET,A,1,0,0,0,0,5.0,5,21,0,4,4,2,0,2,0,0,0,0,0,1,0,1,0,1,0,5.91,4-13-2001,
2,AT,BAL,A,1,0,0,0,0,6.0,6,23,0,2,2,2,0,3,0,0,0,0,1,1,0,0,0,1,0,4.86,4-19-2001,
3,VS,ANA,A,1,0,0,0,0,5.0,5,24,0,3,2,4,0,1,0,0,0,0,0,1,1,0,1,0,1,4.57,4-25-2001,
4,AT,KC,A,1,0,0,0,0,5.0,4,19,1,1,1,1,0,2,0,0,0,0,0,0,0,1,0,1,0,4.05,5- 2-2001,
5,VS,KC,A,1,0,0,0,0,5.2,5,23,0,1,1,1,0,5,0,1,1,1,0,1,0,0,0,1,0,3.62,5- 9-2001,
6,AT,TEX,A,1,0,0,0,0,5.0,6,23,0,3,3,3,0,5,0,0,1,0,0,0,0,1,0,1,0,3.86,5-15-2001,
7,AT,ANA,A,1,0,0,0,0,4.1,9,24,1,6,6,3,0,4,0,0,1,0,0,3,0,0,0,0,0,4.75,5-20-2001,
8,VS,NY,A,1,0,0,0,0,4.2,7,25,2,5,5,4,1,3,0,0,0,0,1,2,0,0,0,0,1,5.24,5-26-2001,
9,AT,NY,A,1,0,0,0,0,4.0,4,20,1,4,3,5,0,2,0,0,0,0,0,0,0,1,0,1,0,5.36,6- 1-2001,


In [82]:
# Baseball statisticans report partial innings pitched as X.1 & X.2 where X is the integer number of innings pitched
# However, for calculation purposes, we need to tell the computer to recognize X.1 & X.2 as X & (one-third) and (two-thirds), respectively
# The following line of code does that for us.

df_cc['IP_real'] = df_cc['IP_real'] = (df_cc.IP - (df_cc.IP % 1)) + (df_cc.IP % 1) * (10/3)

In [83]:
df_cc.columns

Index(['at_vs', 'Opponent', 'League', 'GS', 'CG', 'SHO', 'GF', 'SV', 'IP', 'H',
       'BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP', 'HBP', 'BK',
       '2B', '3B', 'GDP', 'ROE', 'W', 'L', 'ERA', 'date', 'dblhead_num',
       'IP_real'],
      dtype='object')

Generating Features for a Starting Pitcher

    - Want to creature features based on a lookback across games for each pitcher

    - Need to aggregate statistics like innings pitched (IP), runs or earned runs given up, hits and walks given up, strikeouts, and so on

    - We will also need to decide how to handle pitchers early in their career when they have relatively few games on which to base their performance.

In [84]:
def roll_column(df, col, winsize):
    # do the standard Pandas rolling calc
    t_col = df[col].rolling(winsize, closed='left').sum().to_numpy()
    
    # for the early columns, just do a rolling sum from the beginning
    t_col[:winsize] = np.concatenate(([0],df[col].iloc[:(winsize)].cumsum().to_numpy()[:-1]))

    return(t_col)

In [85]:
def load_and_process_pitch_df(p_id, filepath=''):
    fname = filepath+'pitching_data_'+p_id+'.csv'
    pitch_df = pd.read_csv(fname)
    
    # Convert date, fix dblhead_num to be 0,1,2
    pitch_df['date'] = (pd.to_datetime(pitch_df.date).astype(str).str.replace('-','')).astype(int)
    pitch_df.dblhead_num.fillna(0, inplace=True)
    pitch_df['dblhead_num'] = pitch_df['dblhead_num'].astype(int)
    
    # Convert IP to proper mathematical format
    pitch_df['IP_real'] = (pitch_df.IP - (pitch_df.IP % 1)) + (pitch_df.IP % 1) * (10/3)
    
    cols_to_agg = ['IP_real', 'H','BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP', 'HBP', 'BK',
       '2B', '3B']
    winsizes = [6,15,30]
    for winsize in winsizes:
        for raw_col in cols_to_agg:
            new_colname = 'rollsum_'+raw_col+'_'+str(winsize)        
            pitch_df[new_colname] = roll_column(pitch_df, raw_col, winsize)

    
    er_per_ip_def = (5/9)
    h_bb_per_ip_def = 1.5
    h_bb_per_bf_def = .37
    so_per_bf_def = .2
    ip_per_game_def = 3
    bf_per_game_def = 12
    tb_bb_perc_def = .45
    fip_numer_per_ip_def = .124*13 + 1.5*3 - 2*.8
    fip_numer_per_bf_def = .03*13 + .37*3 - 2*.2
    for winsize in winsizes:
        hit_col = 'rollsum_H_'+str(winsize)
        bb_col = 'rollsum_BB_'+str(winsize)
        h_bb_col = 'H_BB_roll_'+str(winsize)
        double_col = 'rollsum_2B_'+str(winsize)
        triple_col = 'rollsum_3B_'+str(winsize)
        hr_col = 'rollsum_HR_'+str(winsize)
        xb_col = 'XB_roll_'+str(winsize)
        tb_col = 'TB_roll_'+str(winsize)
        so_col = 'rollsum_SO_'+str(winsize)
        so_mod_col = 'SO_mod_'+str(winsize)
        ip_col = 'rollsum_IP_real_'+str(winsize)
        ip_mod_col = 'IP_mod_'+str(winsize)
        er_col = 'rollsum_ER_'+str(winsize)
        er_mod_col = 'ER_mod_'+str(winsize)
        bf_col = 'rollsum_BFP_'+str(winsize)
        bf_mod_col = 'BF_mod_'+str(winsize)
        era_col = 'ERA_'+str(winsize)
        fip_col = 'FIP_'+str(winsize)
        fip_perc_col = 'FIP_perc_'+str(winsize)
        fip_numer_col = 'FIP_numer_'+str(winsize)
        fip_numer_mod_col = 'FIP_numer_mod_'+str(winsize)
        fip_numer_mod2_col = 'FIP_numer_mod2_'+str(winsize)
        whip_col = 'WHIP_'+str(winsize)
        so_perc_col = 'SO_perc_'+str(winsize)
        h_bb_perc_col = 'H_BB_perc_'+str(winsize)
        h_bb_mod_col = 'H_BB_mod_'+str(winsize)
        h_bb_mod2_col = 'H_BB_mod2_'+str(winsize)
        tb_bb_mod_col = 'TB_BB_mod_'+str(winsize)
        tb_bb_perc_col = 'TB_BB_perc_'+str(winsize)
        pitch_df[h_bb_col] = pitch_df[hit_col]+pitch_df[bb_col]
        pitch_df[xb_col] = pitch_df[double_col]+2*pitch_df[triple_col]+3*pitch_df[hr_col]
        pitch_df[tb_col] = pitch_df[hit_col]+pitch_df[xb_col]
        pitch_df[ip_mod_col] = np.maximum(pitch_df[ip_col], winsize*ip_per_game_def)
        pitch_df[bf_mod_col] = np.maximum(pitch_df[bf_col], winsize*bf_per_game_def)
        pitch_df[er_mod_col] = pitch_df[er_col] + er_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[fip_numer_col] = 13*pitch_df[hr_col] + 3*pitch_df[h_bb_col] -2*pitch_df[so_col]
        pitch_df[fip_numer_mod_col] = pitch_df[fip_numer_col] + fip_numer_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[fip_numer_mod2_col] = pitch_df[fip_numer_col] + fip_numer_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[h_bb_mod_col] = pitch_df[h_bb_col] + h_bb_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[h_bb_mod2_col] = pitch_df[h_bb_col] + h_bb_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[so_mod_col] = pitch_df[so_col] + so_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[tb_bb_mod_col] = (pitch_df[tb_col] + pitch_df[bb_col])+ tb_bb_perc_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[era_col] = (pitch_df[er_mod_col]/pitch_df[ip_mod_col])*9
        pitch_df[fip_col] = (pitch_df[fip_numer_mod_col]/pitch_df[ip_mod_col])
        pitch_df[fip_perc_col] = (pitch_df[fip_numer_mod_col]/pitch_df[bf_mod_col])
        pitch_df[whip_col] = pitch_df[h_bb_mod_col]/pitch_df[ip_mod_col]
        pitch_df[so_perc_col] = pitch_df[so_mod_col]/pitch_df[bf_mod_col]
        pitch_df[tb_bb_perc_col] = pitch_df[tb_bb_mod_col]/pitch_df[bf_mod_col]
        pitch_df[h_bb_perc_col] = pitch_df[h_bb_mod2_col]/pitch_df[bf_mod_col]
    pitch_df['date_dblhead'] = (pitch_df['date'].astype(str) + pitch_df['dblhead_num'].astype(str)).astype(int)
    pitch_df.set_index('date_dblhead', inplace=True)
    return(pitch_df)

In [86]:
df_cc = load_and_process_pitch_df('sabac001','SP_2000/')

df_cc.head(15)

Unnamed: 0_level_0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,date,dblhead_num,IP_real,rollsum_IP_real_6,rollsum_H_6,rollsum_BFP_6,rollsum_HR_6,rollsum_R_6,rollsum_ER_6,rollsum_BB_6,rollsum_IB_6,rollsum_SO_6,rollsum_SH_6,rollsum_SF_6,rollsum_WP_6,rollsum_HBP_6,rollsum_BK_6,rollsum_2B_6,rollsum_3B_6,rollsum_IP_real_15,rollsum_H_15,rollsum_BFP_15,rollsum_HR_15,rollsum_R_15,rollsum_ER_15,rollsum_BB_15,rollsum_IB_15,rollsum_SO_15,rollsum_SH_15,rollsum_SF_15,rollsum_WP_15,rollsum_HBP_15,rollsum_BK_15,rollsum_2B_15,rollsum_3B_15,rollsum_IP_real_30,rollsum_H_30,rollsum_BFP_30,rollsum_HR_30,rollsum_R_30,rollsum_ER_30,rollsum_BB_30,rollsum_IB_30,rollsum_SO_30,rollsum_SH_30,rollsum_SF_30,rollsum_WP_30,rollsum_HBP_30,rollsum_BK_30,rollsum_2B_30,rollsum_3B_30,H_BB_roll_6,XB_roll_6,TB_roll_6,IP_mod_6,BF_mod_6,ER_mod_6,FIP_numer_6,FIP_numer_mod_6,FIP_numer_mod2_6,H_BB_mod_6,H_BB_mod2_6,SO_mod_6,TB_BB_mod_6,ERA_6,FIP_6,FIP_perc_6,WHIP_6,SO_perc_6,TB_BB_perc_6,H_BB_perc_6,H_BB_roll_15,XB_roll_15,TB_roll_15,IP_mod_15,BF_mod_15,ER_mod_15,FIP_numer_15,FIP_numer_mod_15,FIP_numer_mod2_15,H_BB_mod_15,H_BB_mod2_15,SO_mod_15,TB_BB_mod_15,ERA_15,FIP_15,FIP_perc_15,WHIP_15,SO_perc_15,TB_BB_perc_15,H_BB_perc_15,H_BB_roll_30,XB_roll_30,TB_roll_30,IP_mod_30,BF_mod_30,ER_mod_30,FIP_numer_30,FIP_numer_mod_30,FIP_numer_mod2_30,H_BB_mod_30,H_BB_mod2_30,SO_mod_30,TB_BB_mod_30,ERA_30,FIP_30,FIP_perc_30,WHIP_30,SO_perc_30,TB_BB_perc_30,H_BB_perc_30
date_dblhead,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1
200104080,VS,BAL,A,1,0,0,0,0,5.2,3,22,1,3,3,2,0,3,0,0,1,0,0,2,0,0,0,0,0,4.76,20010408,0,5.666667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18.0,72.0,10.0,0.0,81.216,79.2,27.0,26.64,14.4,32.4,5.0,4.512,1.128,1.5,0.2,0.45,0.37,0.0,0.0,0.0,45.0,180.0,25.0,0.0,203.04,198.0,67.5,66.6,36.0,81.0,5.0,4.512,1.128,1.5,0.2,0.45,0.37,0.0,0.0,0.0,90.0,360.0,50.0,0.0,406.08,396.0,135.0,133.2,72.0,162.0,5.0,4.512,1.128,1.5,0.2,0.45,0.37
200104130,AT,DET,A,1,0,0,0,0,5.0,5,21,0,4,4,2,0,2,0,0,0,0,0,1,0,1,0,1,0,5.91,20010413,0,5.0,5.666667,3.0,22.0,1.0,3.0,3.0,2.0,0.0,3.0,0.0,0.0,1.0,0.0,0.0,2.0,0.0,5.666667,3.0,22.0,1.0,3.0,3.0,2.0,0.0,3.0,0.0,0.0,1.0,0.0,0.0,2.0,0.0,5.666667,3.0,22.0,1.0,3.0,3.0,2.0,0.0,3.0,0.0,0.0,1.0,0.0,0.0,2.0,0.0,5.0,5.0,8.0,18.0,72.0,9.851852,22.0,77.648,77.0,23.5,23.5,13.0,32.5,4.925926,4.313778,1.078444,1.305556,0.180556,0.451389,0.326389,5.0,5.0,8.0,45.0,180.0,24.851852,22.0,199.472,195.8,64.0,63.46,34.6,81.1,4.97037,4.432711,1.108178,1.422222,0.192222,0.450556,0.352556,5.0,5.0,8.0,90.0,360.0,49.851852,22.0,402.512,393.8,131.5,130.06,70.6,162.1,4.985185,4.472356,1.118089,1.461111,0.196111,0.450278,0.361278
200104190,AT,BAL,A,1,0,0,0,0,6.0,6,23,0,2,2,2,0,3,0,0,0,0,1,1,0,0,0,1,0,4.86,20010419,0,6.0,10.666667,8.0,43.0,1.0,7.0,7.0,4.0,0.0,5.0,0.0,0.0,1.0,0.0,0.0,3.0,0.0,10.666667,8.0,43.0,1.0,7.0,7.0,4.0,0.0,5.0,0.0,0.0,1.0,0.0,0.0,3.0,0.0,10.666667,8.0,43.0,1.0,7.0,7.0,4.0,0.0,5.0,0.0,0.0,1.0,0.0,0.0,3.0,0.0,12.0,6.0,14.0,18.0,72.0,11.074074,39.0,72.088,70.9,23.0,22.73,10.8,31.05,5.537037,4.004889,1.001222,1.277778,0.15,0.43125,0.315694,12.0,6.0,14.0,45.0,180.0,26.074074,39.0,193.912,189.7,63.5,62.69,32.4,79.65,5.214815,4.309156,1.077289,1.411111,0.18,0.4425,0.348278,12.0,6.0,14.0,90.0,360.0,51.074074,39.0,396.952,387.7,131.0,129.29,68.4,160.65,5.107407,4.410578,1.102644,1.455556,0.19,0.44625,0.359139
200104250,VS,ANA,A,1,0,0,0,0,5.0,5,24,0,3,2,4,0,1,0,0,0,0,0,1,1,0,1,0,1,4.57,20010425,0,5.0,16.666667,14.0,66.0,1.0,9.0,9.0,6.0,0.0,8.0,0.0,0.0,1.0,0.0,1.0,4.0,0.0,16.666667,14.0,66.0,1.0,9.0,9.0,6.0,0.0,8.0,0.0,0.0,1.0,0.0,1.0,4.0,0.0,16.666667,14.0,66.0,1.0,9.0,9.0,6.0,0.0,8.0,0.0,0.0,1.0,0.0,1.0,4.0,0.0,20.0,7.0,21.0,18.0,72.0,9.740741,57.0,63.016,63.6,22.0,22.22,9.2,29.7,4.87037,3.500889,0.875222,1.222222,0.127778,0.4125,0.308611,20.0,7.0,21.0,45.0,180.0,24.740741,57.0,184.84,182.4,62.5,62.18,30.8,78.3,4.948148,4.107556,1.026889,1.388889,0.171111,0.435,0.345444,20.0,7.0,21.0,90.0,360.0,49.740741,57.0,387.88,380.4,130.0,128.78,66.8,159.3,4.974074,4.309778,1.077444,1.444444,0.185556,0.4425,0.357722
200105020,AT,KC,A,1,0,0,0,0,5.0,4,19,1,1,1,1,0,2,0,0,0,0,0,0,0,1,0,1,0,4.05,20010502,0,5.0,21.666667,19.0,90.0,1.0,12.0,11.0,10.0,0.0,9.0,0.0,0.0,1.0,0.0,1.0,5.0,1.0,21.666667,19.0,90.0,1.0,12.0,11.0,10.0,0.0,9.0,0.0,0.0,1.0,0.0,1.0,5.0,1.0,21.666667,19.0,90.0,1.0,12.0,11.0,10.0,0.0,9.0,0.0,0.0,1.0,0.0,1.0,5.0,1.0,29.0,10.0,29.0,21.666667,90.0,11.0,82.0,82.0,82.0,29.0,29.0,9.0,39.0,4.569231,3.784615,0.911111,1.338462,0.1,0.433333,0.322222,29.0,10.0,29.0,45.0,180.0,23.962963,82.0,187.28,181.0,64.0,62.3,27.0,79.5,4.792593,4.161778,1.040444,1.422222,0.15,0.441667,0.346111,29.0,10.0,29.0,90.0,360.0,48.962963,82.0,390.32,379.0,131.5,128.9,63.0,160.5,4.896296,4.336889,1.084222,1.461111,0.175,0.445833,0.358056
200105090,VS,KC,A,1,0,0,0,0,5.2,5,23,0,1,1,1,0,5,0,1,1,1,0,1,0,0,0,1,0,3.62,20010509,0,5.666667,26.666667,23.0,109.0,2.0,13.0,12.0,11.0,0.0,11.0,0.0,0.0,1.0,0.0,1.0,5.0,1.0,26.666667,23.0,109.0,2.0,13.0,12.0,11.0,0.0,11.0,0.0,0.0,1.0,0.0,1.0,5.0,1.0,26.666667,23.0,109.0,2.0,13.0,12.0,11.0,0.0,11.0,0.0,0.0,1.0,0.0,1.0,5.0,1.0,34.0,13.0,36.0,26.666667,109.0,12.0,106.0,106.0,106.0,34.0,34.0,11.0,47.0,4.05,3.975,0.972477,1.275,0.100917,0.431193,0.311927,34.0,13.0,36.0,45.0,180.0,22.185185,106.0,188.72,184.1,61.5,60.27,25.2,78.95,4.437037,4.193778,1.048444,1.366667,0.14,0.438611,0.334833,34.0,13.0,36.0,90.0,360.0,47.185185,106.0,391.76,382.1,129.0,126.87,61.2,159.95,4.718519,4.352889,1.088222,1.433333,0.17,0.444306,0.352417
200105150,AT,TEX,A,1,0,0,0,0,5.0,6,23,0,3,3,3,0,5,0,0,1,0,0,0,0,1,0,1,0,3.86,20010515,0,5.0,32.333333,28.0,132.0,2.0,14.0,13.0,12.0,0.0,16.0,0.0,1.0,2.0,1.0,1.0,6.0,1.0,32.333333,28.0,132.0,2.0,14.0,13.0,12.0,0.0,16.0,0.0,1.0,2.0,1.0,1.0,6.0,1.0,32.333333,28.0,132.0,2.0,14.0,13.0,12.0,0.0,16.0,0.0,1.0,2.0,1.0,1.0,6.0,1.0,40.0,14.0,42.0,32.333333,132.0,13.0,114.0,114.0,114.0,40.0,40.0,16.0,54.0,3.618557,3.525773,0.863636,1.237113,0.121212,0.409091,0.30303,40.0,14.0,42.0,45.0,180.0,20.037037,114.0,171.152,166.8,59.0,57.76,25.6,75.6,4.007407,3.803378,0.950844,1.311111,0.142222,0.42,0.320889,40.0,14.0,42.0,90.0,360.0,45.037037,114.0,374.192,364.8,126.5,124.36,61.6,156.6,4.503704,4.157689,1.039422,1.405556,0.171111,0.435,0.345444
200105200,AT,ANA,A,1,0,0,0,0,4.1,9,24,1,6,6,3,0,4,0,0,1,0,0,3,0,0,0,0,0,4.75,20010520,0,4.333333,31.666667,31.0,133.0,1.0,14.0,13.0,13.0,0.0,18.0,0.0,1.0,2.0,1.0,1.0,4.0,1.0,37.333333,34.0,155.0,2.0,17.0,16.0,15.0,0.0,21.0,0.0,1.0,3.0,1.0,1.0,6.0,1.0,37.333333,34.0,155.0,2.0,17.0,16.0,15.0,0.0,21.0,0.0,1.0,3.0,1.0,1.0,6.0,1.0,44.0,9.0,40.0,31.666667,133.0,13.0,109.0,109.0,109.0,44.0,44.0,18.0,53.0,3.694737,3.442105,0.819549,1.389474,0.135338,0.398496,0.330827,49.0,14.0,48.0,45.0,180.0,20.259259,131.0,165.592,158.5,60.5,58.25,26.0,74.25,4.051852,3.679822,0.919956,1.344444,0.144444,0.4125,0.323611,49.0,14.0,48.0,90.0,360.0,45.259259,131.0,368.632,356.5,128.0,124.85,62.0,155.25,4.525926,4.095911,1.023978,1.422222,0.172222,0.43125,0.346806
200105260,VS,NY,A,1,0,0,0,0,4.2,7,25,2,5,5,4,1,3,0,0,0,0,1,2,0,0,0,0,1,5.24,20010526,0,4.666667,31.0,35.0,136.0,2.0,16.0,15.0,14.0,0.0,20.0,0.0,1.0,3.0,1.0,1.0,6.0,1.0,41.666667,43.0,179.0,3.0,23.0,22.0,18.0,0.0,25.0,0.0,1.0,4.0,1.0,1.0,9.0,1.0,41.666667,43.0,179.0,3.0,23.0,22.0,18.0,0.0,25.0,0.0,1.0,4.0,1.0,1.0,9.0,1.0,49.0,14.0,49.0,31.0,136.0,15.0,133.0,133.0,133.0,49.0,49.0,20.0,63.0,4.354839,4.290323,0.977941,1.580645,0.147059,0.463235,0.360294,61.0,20.0,63.0,45.0,180.0,23.851852,172.0,187.04,173.1,66.0,61.37,25.2,81.45,4.77037,4.156444,1.039111,1.466667,0.14,0.4525,0.340944,61.0,20.0,63.0,90.0,360.0,48.851852,172.0,390.08,371.1,133.5,127.97,61.2,162.45,4.885185,4.334222,1.083556,1.483333,0.17,0.45125,0.355472
200106010,AT,NY,A,1,0,0,0,0,4.0,4,20,1,4,3,5,0,2,0,0,0,0,0,0,0,1,0,1,0,5.36,20010601,0,4.0,29.666667,36.0,138.0,4.0,19.0,18.0,16.0,1.0,20.0,0.0,1.0,3.0,1.0,1.0,7.0,1.0,46.333333,50.0,204.0,5.0,28.0,27.0,22.0,1.0,28.0,0.0,1.0,4.0,1.0,2.0,11.0,1.0,46.333333,50.0,204.0,5.0,28.0,27.0,22.0,1.0,28.0,0.0,1.0,4.0,1.0,2.0,11.0,1.0,52.0,21.0,57.0,29.666667,138.0,18.0,168.0,168.0,168.0,52.0,52.0,20.0,73.0,5.460674,5.662921,1.217391,1.752809,0.144928,0.528986,0.376812,72.0,28.0,78.0,46.333333,204.0,27.0,225.0,225.0,225.0,72.0,72.0,28.0,100.0,5.244604,4.856115,1.102941,1.553957,0.137255,0.490196,0.352941,72.0,28.0,78.0,90.0,360.0,51.259259,225.0,422.024,396.6,137.5,129.72,59.2,170.2,5.125926,4.689156,1.172289,1.527778,0.164444,0.472778,0.360333


LOAD IN GAME LEVEL DATA

In [87]:
df = pd.read_csv('df_bp3.csv', low_memory=False)

In [88]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 56771 entries, 0 to 56770
Columns: 199 entries, date to over_under_result
dtypes: float64(34), int64(87), object(78)
memory usage: 86.2+ MB


In [89]:
start_pitchers_h = df.pitcher_start_id_h.unique()
start_pitchers_v = df.pitcher_start_id_v.unique()
start_pitchers_all = np.union1d(start_pitchers_h.astype(str), start_pitchers_v.astype(str))

In [90]:
pitcher_data_dict = {}
for i, p_id in enumerate(start_pitchers_all):
    if i % 250 == 0:
        print(i)
    try:  
        pitcher_data_dict[p_id] = load_and_process_pitch_df(p_id,'SP_2000/')
    except:
       pass

0
250
500
750
1000
1250
1500
1750
2000


In [91]:
raw_cols_to_add = ['GS', 'IP',
       'H', 'BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP',
       'HBP', 'BK', '2B', '3B', 'IP_real', 'rollsum_IP_real_6', 'rollsum_H_6',
       'rollsum_BFP_6', 'rollsum_HR_6', 'rollsum_R_6', 'rollsum_ER_6',
       'rollsum_BB_6', 'rollsum_IB_6', 'rollsum_SO_6', 'rollsum_SH_6',
       'rollsum_SF_6', 'rollsum_WP_6', 'rollsum_HBP_6',
       'rollsum_BK_6', 'rollsum_2B_6', 'rollsum_3B_6',
       'rollsum_IP_real_15', 'rollsum_H_15', 'rollsum_BFP_15',
       'rollsum_HR_15', 'rollsum_R_15', 'rollsum_ER_15', 'rollsum_BB_15',
       'rollsum_IB_15', 'rollsum_SO_15', 'rollsum_SH_15', 'rollsum_SF_15',
       'rollsum_WP_15', 'rollsum_HBP_15', 'rollsum_BK_15',
       'rollsum_2B_15', 'rollsum_3B_15', 'rollsum_IP_real_30',
       'rollsum_H_30', 'rollsum_BFP_30', 'rollsum_HR_30', 'rollsum_R_30',
       'rollsum_ER_30', 'rollsum_BB_30', 'rollsum_IB_30', 'rollsum_SO_30',
       'rollsum_SH_30', 'rollsum_SF_30', 'rollsum_WP_30',
       'rollsum_HBP_30', 'rollsum_BK_30', 'rollsum_2B_30',
       'rollsum_3B_30', 'H_BB_roll_6', 'XB_roll_6', 'TB_roll_6',
       'IP_mod_6', 'BF_mod_6', 'ER_mod_6', 'FIP_numer_6',
       'FIP_numer_mod_6', 'FIP_numer_mod2_6', 'H_BB_mod_6',
       'H_BB_mod2_6', 'SO_mod_6', 'TB_BB_mod_6', 'ERA_6', 'FIP_6',
       'FIP_perc_6', 'WHIP_6', 'SO_perc_6', 'TB_BB_perc_6',
       'H_BB_perc_6', 'H_BB_roll_15', 'XB_roll_15', 'TB_roll_15',
       'IP_mod_15', 'BF_mod_15', 'ER_mod_15', 'FIP_numer_15',
       'FIP_numer_mod_15', 'FIP_numer_mod2_15', 'H_BB_mod_15',
       'H_BB_mod2_15', 'SO_mod_15', 'TB_BB_mod_15', 'ERA_15', 'FIP_15',
       'FIP_perc_15', 'WHIP_15', 'SO_perc_15', 'TB_BB_perc_15',
       'H_BB_perc_15', 'H_BB_roll_30', 'XB_roll_30', 'TB_roll_30',
       'IP_mod_30', 'BF_mod_30', 'ER_mod_30', 'FIP_numer_30',
       'FIP_numer_mod_30', 'FIP_numer_mod2_30', 'H_BB_mod_30',
       'H_BB_mod2_30', 'SO_mod_30', 'TB_BB_mod_30', 'ERA_30', 'FIP_30',
       'FIP_perc_30', 'WHIP_30', 'SO_perc_30', 'TB_BB_perc_30',
       'H_BB_perc_30']
cols_to_add = ['Strt_'+col+suff for col in raw_cols_to_add for suff in ['_h','_v']]

col_add_dict = {col:np.zeros(df.shape[0]) for col in cols_to_add}

In [92]:
for i in range(df.shape[0]):
    row = df.iloc[i,:]
    if i % 1000 == 0:
        print(i)
    sp_id_v = row['pitcher_start_id_v']
    sp_id_h = row['pitcher_start_id_h']
    date_dblhead = row['date_dblhead']
    if sp_id_v in pitcher_data_dict.keys():
        curr_df = pitcher_data_dict[sp_id_v]
        if date_dblhead in curr_df.index:
            for col in raw_cols_to_add:
                col_add_dict['Strt_'+col+'_v'][i] = curr_df.loc[date_dblhead,col]
        else:
            print(f'no match for {sp_id_v} date {date_dblhead}')
    if sp_id_h in pitcher_data_dict.keys():
        curr_df = pitcher_data_dict[sp_id_h]
        if date_dblhead in curr_df.index:
            for col in raw_cols_to_add:
                col_add_dict['Strt_'+col+'_h'][i] = curr_df.loc[date_dblhead,col]
        else:
            print(f'no match for {sp_id_h} date {date_dblhead}')

0
1000
2000
3000
4000
5000
6000
7000
8000
9000
10000
11000
12000
13000
14000
15000
16000
17000
18000
19000
20000
21000
22000
23000
24000
25000
26000
27000
28000
29000
30000
31000
32000
33000
34000
35000
36000
37000
38000
39000
40000
41000
42000
43000
44000
45000
46000
47000
48000
49000
50000
51000
52000
53000
54000
55000
56000


In [93]:
for col in cols_to_add:
    df[col] = col_add_dict[col]

In [94]:
df.sample(10)

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,Strt_GS_h,Strt_GS_v,Strt_IP_h,Strt_IP_v,Strt_H_h,Strt_H_v,Strt_BFP_h,Strt_BFP_v,Strt_HR_h,Strt_HR_v,Strt_R_h,Strt_R_v,Strt_ER_h,Strt_ER_v,Strt_BB_h,Strt_BB_v,Strt_IB_h,Strt_IB_v,Strt_SO_h,Strt_SO_v,Strt_SH_h,Strt_SH_v,Strt_SF_h,Strt_SF_v,Strt_WP_h,Strt_WP_v,Strt_HBP_h,Strt_HBP_v,Strt_BK_h,Strt_BK_v,Strt_2B_h,Strt_2B_v,Strt_3B_h,Strt_3B_v,Strt_IP_real_h,Strt_IP_real_v,Strt_rollsum_IP_real_6_h,Strt_rollsum_IP_real_6_v,Strt_rollsum_H_6_h,Strt_rollsum_H_6_v,Strt_rollsum_BFP_6_h,Strt_rollsum_BFP_6_v,Strt_rollsum_HR_6_h,Strt_rollsum_HR_6_v,Strt_rollsum_R_6_h,Strt_rollsum_R_6_v,Strt_rollsum_ER_6_h,Strt_rollsum_ER_6_v,Strt_rollsum_BB_6_h,Strt_rollsum_BB_6_v,Strt_rollsum_IB_6_h,Strt_rollsum_IB_6_v,Strt_rollsum_SO_6_h,Strt_rollsum_SO_6_v,Strt_rollsum_SH_6_h,Strt_rollsum_SH_6_v,Strt_rollsum_SF_6_h,Strt_rollsum_SF_6_v,Strt_rollsum_WP_6_h,Strt_rollsum_WP_6_v,Strt_rollsum_HBP_6_h,Strt_rollsum_HBP_6_v,Strt_rollsum_BK_6_h,Strt_rollsum_BK_6_v,Strt_rollsum_2B_6_h,Strt_rollsum_2B_6_v,Strt_rollsum_3B_6_h,Strt_rollsum_3B_6_v,Strt_rollsum_IP_real_15_h,Strt_rollsum_IP_real_15_v,Strt_rollsum_H_15_h,Strt_rollsum_H_15_v,Strt_rollsum_BFP_15_h,Strt_rollsum_BFP_15_v,Strt_rollsum_HR_15_h,Strt_rollsum_HR_15_v,Strt_rollsum_R_15_h,Strt_rollsum_R_15_v,Strt_rollsum_ER_15_h,Strt_rollsum_ER_15_v,Strt_rollsum_BB_15_h,Strt_rollsum_BB_15_v,Strt_rollsum_IB_15_h,Strt_rollsum_IB_15_v,Strt_rollsum_SO_15_h,Strt_rollsum_SO_15_v,Strt_rollsum_SH_15_h,Strt_rollsum_SH_15_v,Strt_rollsum_SF_15_h,Strt_rollsum_SF_15_v,Strt_rollsum_WP_15_h,Strt_rollsum_WP_15_v,Strt_rollsum_HBP_15_h,Strt_rollsum_HBP_15_v,Strt_rollsum_BK_15_h,Strt_rollsum_BK_15_v,Strt_rollsum_2B_15_h,Strt_rollsum_2B_15_v,Strt_rollsum_3B_15_h,Strt_rollsum_3B_15_v,Strt_rollsum_IP_real_30_h,Strt_rollsum_IP_real_30_v,Strt_rollsum_H_30_h,Strt_rollsum_H_30_v,Strt_rollsum_BFP_30_h,Strt_rollsum_BFP_30_v,Strt_rollsum_HR_30_h,Strt_rollsum_HR_30_v,Strt_rollsum_R_30_h,Strt_rollsum_R_30_v,Strt_rollsum_ER_30_h,Strt_rollsum_ER_30_v,Strt_rollsum_BB_30_h,Strt_rollsum_BB_30_v,Strt_rollsum_IB_30_h,Strt_rollsum_IB_30_v,Strt_rollsum_SO_30_h,Strt_rollsum_SO_30_v,Strt_rollsum_SH_30_h,Strt_rollsum_SH_30_v,Strt_rollsum_SF_30_h,Strt_rollsum_SF_30_v,Strt_rollsum_WP_30_h,Strt_rollsum_WP_30_v,Strt_rollsum_HBP_30_h,Strt_rollsum_HBP_30_v,Strt_rollsum_BK_30_h,Strt_rollsum_BK_30_v,Strt_rollsum_2B_30_h,Strt_rollsum_2B_30_v,Strt_rollsum_3B_30_h,Strt_rollsum_3B_30_v,Strt_H_BB_roll_6_h,Strt_H_BB_roll_6_v,Strt_XB_roll_6_h,Strt_XB_roll_6_v,Strt_TB_roll_6_h,Strt_TB_roll_6_v,Strt_IP_mod_6_h,Strt_IP_mod_6_v,Strt_BF_mod_6_h,Strt_BF_mod_6_v,Strt_ER_mod_6_h,Strt_ER_mod_6_v,Strt_FIP_numer_6_h,Strt_FIP_numer_6_v,Strt_FIP_numer_mod_6_h,Strt_FIP_numer_mod_6_v,Strt_FIP_numer_mod2_6_h,Strt_FIP_numer_mod2_6_v,Strt_H_BB_mod_6_h,Strt_H_BB_mod_6_v,Strt_H_BB_mod2_6_h,Strt_H_BB_mod2_6_v,Strt_SO_mod_6_h,Strt_SO_mod_6_v,Strt_TB_BB_mod_6_h,Strt_TB_BB_mod_6_v,Strt_ERA_6_h,Strt_ERA_6_v,Strt_FIP_6_h,Strt_FIP_6_v,Strt_FIP_perc_6_h,Strt_FIP_perc_6_v,Strt_WHIP_6_h,Strt_WHIP_6_v,Strt_SO_perc_6_h,Strt_SO_perc_6_v,Strt_TB_BB_perc_6_h,Strt_TB_BB_perc_6_v,Strt_H_BB_perc_6_h,Strt_H_BB_perc_6_v,Strt_H_BB_roll_15_h,Strt_H_BB_roll_15_v,Strt_XB_roll_15_h,Strt_XB_roll_15_v,Strt_TB_roll_15_h,Strt_TB_roll_15_v,Strt_IP_mod_15_h,Strt_IP_mod_15_v,Strt_BF_mod_15_h,Strt_BF_mod_15_v,Strt_ER_mod_15_h,Strt_ER_mod_15_v,Strt_FIP_numer_15_h,Strt_FIP_numer_15_v,Strt_FIP_numer_mod_15_h,Strt_FIP_numer_mod_15_v,Strt_FIP_numer_mod2_15_h,Strt_FIP_numer_mod2_15_v,Strt_H_BB_mod_15_h,Strt_H_BB_mod_15_v,Strt_H_BB_mod2_15_h,Strt_H_BB_mod2_15_v,Strt_SO_mod_15_h,Strt_SO_mod_15_v,Strt_TB_BB_mod_15_h,Strt_TB_BB_mod_15_v,Strt_ERA_15_h,Strt_ERA_15_v,Strt_FIP_15_h,Strt_FIP_15_v,Strt_FIP_perc_15_h,Strt_FIP_perc_15_v,Strt_WHIP_15_h,Strt_WHIP_15_v,Strt_SO_perc_15_h,Strt_SO_perc_15_v,Strt_TB_BB_perc_15_h,Strt_TB_BB_perc_15_v,Strt_H_BB_perc_15_h,Strt_H_BB_perc_15_v,Strt_H_BB_roll_30_h,Strt_H_BB_roll_30_v,Strt_XB_roll_30_h,Strt_XB_roll_30_v,Strt_TB_roll_30_h,Strt_TB_roll_30_v,Strt_IP_mod_30_h,Strt_IP_mod_30_v,Strt_BF_mod_30_h,Strt_BF_mod_30_v,Strt_ER_mod_30_h,Strt_ER_mod_30_v,Strt_FIP_numer_30_h,Strt_FIP_numer_30_v,Strt_FIP_numer_mod_30_h,Strt_FIP_numer_mod_30_v,Strt_FIP_numer_mod2_30_h,Strt_FIP_numer_mod2_30_v,Strt_H_BB_mod_30_h,Strt_H_BB_mod_30_v,Strt_H_BB_mod2_30_h,Strt_H_BB_mod2_30_v,Strt_SO_mod_30_h,Strt_SO_mod_30_v,Strt_TB_BB_mod_30_h,Strt_TB_BB_mod_30_v,Strt_ERA_30_h,Strt_ERA_30_v,Strt_FIP_30_h,Strt_FIP_30_v,Strt_FIP_perc_30_h,Strt_FIP_perc_30_v,Strt_WHIP_30_h,Strt_WHIP_30_v,Strt_SO_perc_30_h,Strt_SO_perc_30_v,Strt_TB_BB_perc_30_h,Strt_TB_BB_perc_30_v,Strt_H_BB_perc_30_h,Strt_H_BB_perc_30_v
50546,20210620,0,Sun,NYN,NL,66,WAS,NL,69,2,5,51,D,,,,WAS11,30371.0,169,10000100,10101020x,30,4,0,0,2,2,0,0,0,1,0,11,0,0,1,0,2,3,5,5,1,0,24,13,0,0,2,0,35,13,3,0,3,5,0,0,0,1,0,8,3,0,2,0,7,4,2,2,0,0,27,8,0,0,1,0,fairc901,Chad Fairchild,danlk901,Kerwin Danley,hamaa901,Adam Hamari,buckc901,CB Bucknor,,(none),,(none),rojal801,Luis Rojas,martd002,Dave Martinez,corbp001,Patrick Corbin,walkt004,Taijuan Walker,handb001,Brad Hand,bellj005,Josh Bell,walkt004,Taijuan Walker,corbp001,Patrick Corbin,peraj003,Jose Peraza,5,lindf001,Francisco Lindor,6,mccaj001,James McCann,2,alonp001,Pete Alonso,3,pillk001,Kevin Pillar,9,drurb001,Brandon Drury,7,almoa002,Albert Almora,8,guill001,Luis Guillorme,4,walkt004,Taijuan Walker,1,schwk001,Kyle Schwarber,7,turnt001,Trea Turner,6,sotoj001,Juan Soto,9,bellj005,Josh Bell,3,gomey001,Yan Gomes,2,harrj002,Josh Harrison,4,casts001,Starlin Castro,5,roblv001,Victor Robles,8,corbp001,Patrick Corbin,1,,Y,2021,3,1,7,202106200,0.25753,0.252005,0.323847,0.318838,0.418675,0.425667,0.742522,0.744505,86.0,53.0,30.0,28.0,94.0,79.0,0.238147,0.229958,0.307542,0.29195,0.376078,0.407173,0.683619,0.699123,11.0,12.0,6.0,7.0,15.0,12.0,0.528302,0.49505,0.516626,8.5,U,1.0,1.0,6.0,6.1,4.0,10.0,23.0,27.0,2.0,2.0,2.0,4.0,2.0,4.0,1.0,0.0,0.0,0.0,7.0,5.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,6.0,6.333333,34.333333,34.0,40.0,24.0,149.0,132.0,2.0,2.0,19.0,8.0,19.0,7.0,13.0,9.0,0.0,0.0,26.0,37.0,3.0,0.0,2.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,5.0,3.0,1.0,0.0,83.666667,81.666667,100.0,55.0,371.0,325.0,15.0,3.0,55.0,23.0,54.0,20.0,30.0,26.0,1.0,0.0,65.0,90.0,3.0,2.0,3.0,2.0,0.0,2.0,2.0,3.0,1.0,0.0,18.0,10.0,1.0,0.0,169.666667,148.666667,191.0,119.0,751.0,616.0,28.0,13.0,97.0,58.0,92.0,44.0,64.0,52.0,2.0,0.0,160.0,150.0,6.0,3.0,6.0,4.0,1.0,4.0,2.0,8.0,1.0,0.0,37.0,23.0,3.0,0.0,53.0,33.0,13.0,9.0,53.0,33.0,34.333333,34.0,149.0,132.0,19.0,7.0,133.0,51.0,133.0,51.0,133.0,51.0,53.0,33.0,53.0,33.0,26.0,37.0,66.0,42.0,4.980583,1.852941,3.873786,1.5,0.892617,0.386364,1.543689,0.970588,0.174497,0.280303,0.442953,0.318182,0.355705,0.25,130.0,81.0,65.0,19.0,165.0,74.0,83.666667,81.666667,371.0,325.0,54.0,20.0,455.0,102.0,455.0,102.0,455.0,102.0,130.0,81.0,130.0,81.0,65.0,90.0,195.0,100.0,5.808765,2.204082,5.438247,1.24898,1.226415,0.313846,1.553785,0.991837,0.175202,0.276923,0.525606,0.307692,0.350404,0.249231,255.0,171.0,127.0,62.0,318.0,181.0,169.666667,148.666667,751.0,616.0,92.0,44.0,809.0,382.0,809.0,382.0,809.0,382.0,255.0,171.0,255.0,171.0,160.0,150.0,382.0,233.0,4.880157,2.663677,4.768173,2.569507,1.07723,0.62013,1.502947,1.150224,0.213049,0.243506,0.508655,0.378247,0.339547,0.277597
46990,20190530,0,Thu,MIL,NL,57,PIT,NL,55,11,5,54,N,,,,PIT08,13059.0,219,212000024,010100030,44,18,6,1,4,11,0,0,0,6,3,7,0,0,0,0,12,5,5,5,0,0,27,8,0,0,0,0,37,10,2,0,1,5,0,0,1,2,0,10,0,0,0,0,8,3,11,11,1,0,27,10,0,1,0,0,marqa901,Alfonso Marquez,belld901,Dan Bellino,cuzzp901,Phil Cuzzi,barbs901,Sean Barber,,(none),,(none),counc001,Craig Counsell,hurdc001,Clint Hurdle,andec001,Chase Anderson,musgj001,Joe Musgrove,,(none),mousm001,Mike Moustakas,andec001,Chase Anderson,musgj001,Joe Musgrove,gameb001,Ben Gamel,7,yelic001,Christian Yelich,9,cainl001,Lorenzo Cain,8,mousm001,Mike Moustakas,5,grany001,Yasmani Grandal,2,hiurk001,Keston Hiura,4,thame001,Eric Thames,3,arcio002,Orlando Arcia,6,andec001,Chase Anderson,1,newmk001,Kevin Newman,6,polag001,Gregory Polanco,9,marts002,Starling Marte,8,bellj005,Josh Bell,3,reynb001,Bryan Reynolds,7,morac001,Colin Moran,5,diaze005,Elias Diaz,2,fraza001,Adam Frazier,4,musgj001,Joe Musgrove,1,,Y,2019,-6,0,16,201905300,0.252313,0.25221,0.30746,0.320937,0.400508,0.435324,0.707968,0.756261,69.0,117.0,32.0,33.0,111.0,100.0,0.266481,0.250943,0.311847,0.327688,0.424327,0.419811,0.736174,0.7475,8.0,23.0,2.0,8.0,17.0,20.0,0.47619,0.545455,0.465368,9.0,O,1.0,1.0,6.0,5.0,11.0,6.0,30.0,23.0,3.0,1.0,5.0,2.0,5.0,2.0,2.0,1.0,1.0,0.0,6.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,3.0,1.0,1.0,0.0,6.0,5.0,30.666667,21.666667,33.0,19.0,138.0,92.0,1.0,1.0,28.0,7.0,23.0,6.0,11.0,9.0,0.0,0.0,19.0,21.0,0.0,0.0,2.0,2.0,0.0,0.0,2.0,0.0,0.0,0.0,11.0,7.0,1.0,0.0,83.333333,56.333333,75.0,50.0,346.0,234.0,5.0,9.0,51.0,23.0,44.0,22.0,20.0,20.0,0.0,1.0,72.0,53.0,1.0,0.0,4.0,2.0,2.0,2.0,4.0,1.0,0.0,0.0,24.0,13.0,1.0,0.0,174.333333,134.333333,164.0,116.0,731.0,555.0,14.0,22.0,91.0,60.0,80.0,57.0,40.0,51.0,3.0,1.0,145.0,124.0,3.0,2.0,7.0,3.0,5.0,2.0,11.0,2.0,0.0,0.0,38.0,24.0,4.0,1.0,44.0,28.0,16.0,10.0,49.0,29.0,30.666667,21.666667,138.0,92.0,23.0,6.0,107.0,55.0,107.0,55.0,107.0,55.0,44.0,28.0,44.0,28.0,19.0,21.0,60.0,38.0,6.75,2.492308,3.48913,2.538462,0.775362,0.597826,1.434783,1.292308,0.137681,0.228261,0.434783,0.413043,0.318841,0.304348,95.0,70.0,41.0,40.0,116.0,90.0,83.333333,56.333333,346.0,234.0,44.0,22.0,206.0,221.0,206.0,221.0,206.0,221.0,95.0,70.0,95.0,70.0,72.0,53.0,136.0,110.0,4.752,3.514793,2.472,3.923077,0.595376,0.944444,1.14,1.242604,0.208092,0.226496,0.393064,0.470085,0.274566,0.299145,204.0,167.0,88.0,92.0,252.0,208.0,174.333333,134.333333,731.0,555.0,80.0,57.0,504.0,539.0,504.0,539.0,504.0,539.0,204.0,167.0,204.0,167.0,145.0,124.0,292.0,259.0,4.130019,3.818859,2.891013,4.012407,0.689466,0.971171,1.170172,1.243176,0.198358,0.223423,0.399453,0.466667,0.27907,0.300901
44231,20180506,0,Sun,TOR,AL,35,TBA,AL,32,2,1,54,D,,,,STP01,14032.0,176,10001,000000010,34,7,2,0,0,1,0,0,0,1,0,8,1,0,0,0,6,4,1,1,0,1,27,11,0,0,2,0,31,8,0,0,1,1,0,0,0,5,0,7,1,2,1,0,8,3,2,2,1,0,27,8,0,0,0,0,rehaj901,Jeremie Rehak,onorb901,Brian O'Nora,culbf901,Fieldin Culbreth,buckc901,CB Bucknor,,(none),,(none),gibbj001,John Gibbons,cashk001,Kevin Cash,teper001,Ryan Tepera,coloa001,Alex Colome,osunr001,Roberto Osuna,,(none),estrm001,Marco Estrada,archc001,Chris Archer,hernt002,Teoscar Hernandez,9,donaj001,Josh Donaldson,5,solay001,Yangervis Solarte,4,smoaj001,Justin Smoak,3,pillk001,Kevin Pillar,8,morak001,Kendrys Morales,10,alfoa002,Anthony Alford,7,maill001,Luke Maile,2,diaza003,Aledmys Diaz,6,spand001,Denard Span,7,cronc002,C.J. Cron,10,duffm002,Matt Duffy,5,millb002,Brad Miller,3,ramow001,Wilson Ramos,2,wendj002,Joey Wendle,4,robed004,Daniel Robertson,6,smitm007,Mallex Smith,8,gomec002,Carlos Gomez,9,,Y,2018,-1,0,3,201805060,0.248908,0.240771,0.31353,0.311851,0.423343,0.424441,0.736873,0.736292,94.0,58.0,37.0,22.0,97.0,90.0,0.2657,0.235694,0.328028,0.313589,0.409662,0.436469,0.73769,0.750058,21.0,10.0,8.0,4.0,14.0,16.0,0.0,0.0,0.5,0.0,,1.0,1.0,7.0,6.0,5.0,4.0,26.0,22.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,4.0,0.0,0.0,6.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,7.0,6.0,32.666667,32.0,41.0,37.0,147.0,140.0,5.0,9.0,23.0,22.0,22.0,22.0,11.0,10.0,0.0,0.0,36.0,26.0,0.0,0.0,1.0,2.0,1.0,0.0,1.0,0.0,0.0,0.0,10.0,11.0,0.0,0.0,73.333333,82.666667,87.0,89.0,327.0,358.0,13.0,19.0,52.0,53.0,46.0,52.0,22.0,25.0,0.0,0.0,84.0,62.0,0.0,0.0,2.0,3.0,3.0,0.0,1.0,1.0,0.0,0.0,21.0,22.0,0.0,0.0,167.333333,163.0,180.0,173.0,725.0,718.0,27.0,33.0,98.0,104.0,88.0,103.0,47.0,66.0,0.0,0.0,203.0,144.0,1.0,0.0,3.0,8.0,11.0,0.0,4.0,1.0,0.0,0.0,38.0,44.0,2.0,3.0,52.0,47.0,25.0,38.0,66.0,75.0,32.666667,32.0,147.0,140.0,22.0,22.0,149.0,206.0,149.0,206.0,149.0,206.0,52.0,47.0,52.0,47.0,36.0,26.0,77.0,85.0,6.061224,6.1875,4.561224,6.4375,1.013605,1.471429,1.591837,1.46875,0.244898,0.185714,0.52381,0.607143,0.353741,0.335714,109.0,114.0,60.0,79.0,147.0,168.0,73.333333,82.666667,327.0,358.0,46.0,52.0,328.0,465.0,328.0,465.0,328.0,465.0,109.0,114.0,109.0,114.0,84.0,62.0,169.0,193.0,5.645455,5.66129,4.472727,5.625,1.003058,1.298883,1.486364,1.379032,0.256881,0.173184,0.51682,0.539106,0.333333,0.318436,227.0,239.0,123.0,149.0,303.0,322.0,167.333333,163.0,725.0,718.0,88.0,103.0,626.0,858.0,626.0,858.0,626.0,858.0,227.0,239.0,227.0,239.0,203.0,144.0,350.0,388.0,4.733068,5.687117,3.741036,5.263804,0.863448,1.194986,1.356574,1.466258,0.28,0.200557,0.482759,0.54039,0.313103,0.332869
31315,20120915,0,Sat,ANA,AL,146,KCA,AL,145,2,3,52,N,,,,KAN06,23027.0,143,10010,000000003,33,6,0,0,1,2,0,0,0,1,0,2,1,0,0,0,5,2,3,3,0,0,25,15,0,0,2,0,30,7,0,0,2,3,0,0,0,2,0,3,1,0,2,0,4,2,2,2,0,0,27,18,2,0,0,0,barrt901,Ted Barrett,fagac901,Clint Fagan,mcclt901,Tim McClelland,reybd901,D.J. Reyburn,,(none),,(none),sciom001,Mike Scioscia,yoste001,Ned Yost,herrk001,Kelvin Herrera,friee001,Ernesto Frieri,,(none),peres002,Salvador Perez,greiz001,Zack Greinke,guthj001,Jeremy Guthrie,troum001,Mike Trout,8,huntt001,Torii Hunter,9,pujoa001,Albert Pujols,3,morak001,Kendrys Morales,10,kendh001,Howie Kendrick,4,aybae001,Erick Aybar,6,wellv001,Vernon Wells,7,calla001,Alberto Callaspo,5,iannc001,Chris Iannetta,2,lougd001,David Lough,8,escoa003,Alcides Escobar,6,gorda001,Alex Gordon,7,butlb003,Billy Butler,10,peres002,Salvador Perez,2,mousm001,Mike Moustakas,5,franj004,Jeff Francoeur,9,hosme001,Eric Hosmer,3,giavj001,Johnny Giavotella,4,,Y,2012,1,1,5,201209150,0.273736,0.271452,0.320758,0.325112,0.415008,0.43479,0.735766,0.759903,139.0,139.0,39.0,36.0,102.0,98.0,0.276254,0.287476,0.327177,0.336572,0.396405,0.443074,0.723582,0.779646,34.0,28.0,5.0,6.0,13.0,16.0,0.0,0.0,0.5,0.0,,1.0,1.0,8.0,8.1,5.0,5.0,30.0,30.0,1.0,0.0,2.0,1.0,2.0,1.0,1.0,2.0,0.0,0.0,2.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.0,8.333333,39.666667,41.666667,33.0,34.0,153.0,168.0,3.0,6.0,12.0,16.0,9.0,16.0,7.0,12.0,0.0,0.0,26.0,36.0,2.0,1.0,1.0,1.0,0.0,1.0,0.0,2.0,0.0,0.0,5.0,5.0,0.0,0.0,85.333333,87.666667,87.0,85.0,350.0,369.0,12.0,13.0,43.0,46.0,38.0,45.0,17.0,27.0,0.0,0.0,53.0,74.0,3.0,3.0,3.0,1.0,1.0,4.0,4.0,2.0,0.0,0.0,12.0,15.0,0.0,2.0,160.666667,183.666667,188.0,177.0,703.0,756.0,28.0,16.0,102.0,77.0,91.0,75.0,45.0,48.0,2.0,0.0,91.0,173.0,7.0,6.0,7.0,1.0,2.0,7.0,8.0,2.0,1.0,0.0,45.0,28.0,1.0,4.0,40.0,46.0,14.0,23.0,47.0,57.0,39.666667,41.666667,153.0,168.0,9.0,16.0,107.0,144.0,107.0,144.0,107.0,144.0,40.0,46.0,40.0,46.0,26.0,36.0,54.0,69.0,2.042017,3.456,2.697479,3.456,0.699346,0.857143,1.008403,1.104,0.169935,0.214286,0.352941,0.410714,0.261438,0.27381,104.0,112.0,48.0,58.0,135.0,143.0,85.333333,87.666667,350.0,369.0,38.0,45.0,362.0,357.0,362.0,357.0,362.0,357.0,104.0,112.0,104.0,112.0,53.0,74.0,152.0,170.0,4.007812,4.619772,4.242188,4.072243,1.034286,0.96748,1.21875,1.277567,0.151429,0.200542,0.434286,0.460705,0.297143,0.303523,233.0,225.0,131.0,84.0,319.0,261.0,160.666667,183.666667,703.0,756.0,91.0,75.0,881.0,537.0,881.0,537.0,881.0,537.0,233.0,225.0,233.0,225.0,91.0,173.0,364.0,309.0,5.09751,3.675136,5.483402,2.923775,1.253201,0.710317,1.450207,1.225045,0.129445,0.228836,0.517781,0.40873,0.331437,0.297619
44582,20180602,0,Sat,CIN,NL,59,SDN,NL,60,2,8,51,N,,,,SAN02,31710.0,170,10000001,14000030x,33,8,2,0,2,2,0,0,1,2,0,12,0,0,1,0,7,3,7,7,1,0,24,12,2,0,2,0,33,12,1,0,0,8,0,2,0,2,0,4,2,1,1,0,5,5,2,2,0,0,27,6,0,0,1,0,barkl901,Lance Barksdale,barrs901,Scott Barry,torrc901,Carlos Torres,nauep901,Paul Nauert,,(none),,(none),riggj801,Jim Riggleman,greea001,Andy Green,lauee001,Eric Lauer,harvm001,Matt Harvey,,(none),margm001,Manuel Margot,harvm001,Matt Harvey,lauee001,Eric Lauer,peraj003,Jose Peraza,6,genns001,Scooter Gennett,4,vottj001,Joey Votto,3,suare001,Eugenio Suarez,5,duvaa001,Adam Duvall,7,sches001,Scott Schebler,9,casac001,Curt Casali,2,harvm001,Matt Harvey,1,hamib001,Billy Hamilton,8,jankt001,Travis Jankowski,7,hosme001,Eric Hosmer,3,pirej001,Jose Pirela,4,villc002,Christian Villanueva,5,reyef001,Franmil Reyes,9,galvf001,Freddy Galvis,6,ellia001,A.J. Ellis,2,margm001,Manuel Margot,8,lauee001,Eric Lauer,1,,Y,2018,6,1,10,201806020,0.236627,0.247241,0.297556,0.32004,0.391159,0.404341,0.688715,0.724381,93.0,87.0,35.0,31.0,107.0,88.0,0.228718,0.247544,0.291235,0.316682,0.363077,0.397839,0.654312,0.71452,21.0,13.0,7.0,5.0,13.0,17.0,0.0,0.0,0.5,0.0,,1.0,1.0,5.0,5.0,5.0,6.0,21.0,22.0,1.0,0.0,1.0,5.0,1.0,4.0,2.0,1.0,0.0,0.0,4.0,3.0,0.0,0.0,0.0,2.0,0.0,1.0,0.0,0.0,0.0,0.0,2.0,1.0,0.0,0.0,5.0,5.0,26.333333,22.333333,40.0,24.0,128.0,98.0,5.0,5.0,19.0,13.0,19.0,13.0,11.0,7.0,0.0,0.0,25.0,17.0,2.0,1.0,1.0,2.0,2.0,0.0,0.0,0.0,0.0,0.0,7.0,5.0,1.0,1.0,29.333333,58.333333,46.0,76.0,147.0,269.0,6.0,14.0,26.0,43.0,25.0,43.0,15.0,20.0,0.0,1.0,28.0,43.0,3.0,3.0,1.0,4.0,2.0,2.0,0.0,2.0,0.0,1.0,7.0,16.0,1.0,1.0,29.333333,132.333333,46.0,160.0,147.0,614.0,6.0,29.0,26.0,97.0,25.0,96.0,15.0,60.0,0.0,3.0,28.0,99.0,3.0,6.0,1.0,5.0,2.0,7.0,0.0,7.0,0.0,1.0,7.0,28.0,1.0,2.0,51.0,31.0,24.0,22.0,64.0,46.0,26.333333,22.333333,128.0,98.0,19.0,13.0,168.0,124.0,168.0,124.0,168.0,124.0,51.0,31.0,51.0,31.0,25.0,17.0,75.0,53.0,6.493671,5.238806,6.379747,5.552239,1.3125,1.265306,1.936709,1.38806,0.195312,0.173469,0.585938,0.540816,0.398438,0.316327,61.0,96.0,27.0,60.0,73.0,136.0,45.0,58.333333,180.0,269.0,33.703704,43.0,205.0,384.0,275.688,384.0,241.3,384.0,84.5,96.0,73.21,96.0,34.6,43.0,102.85,156.0,6.740741,6.634286,6.1264,6.582857,1.5316,1.427509,1.877778,1.645714,0.192222,0.159851,0.571389,0.579926,0.406722,0.356877,61.0,220.0,27.0,119.0,73.0,279.0,90.0,132.333333,360.0,614.0,58.703704,96.0,205.0,839.0,478.728,839.0,439.3,839.0,152.0,220.0,139.81,220.0,70.6,99.0,183.85,339.0,5.87037,6.528967,5.3192,6.34005,1.3298,1.36645,1.688889,1.662469,0.196111,0.161238,0.510694,0.552117,0.388361,0.358306
17138,20070413,0,Fri,WAS,NL,11,NYN,NL,10,2,3,51,N,,,,NYC17,47311.0,167,20000000,10000110x,31,7,0,0,0,1,0,0,0,5,0,2,0,0,3,0,7,4,3,3,1,0,24,6,0,0,1,0,27,5,0,0,0,3,0,0,0,4,0,5,3,0,1,0,4,5,2,2,0,0,27,16,0,0,3,0,rungb901,Brian Runge,wintm901,Mike Winters,wegnm901,Mark Wegner,froeb901,Bruce Froemming,,(none),,(none),actam801,Manny Acta,randw001,Willie Randolph,heila001,Aaron Heilman,wagnr001,Ryan Wagner,wagnb001,Billy Wagner,franj002,Julio Franco,pattj004,John Patterson,pelfm001,Mike Pelfrey,lopef001,Felipe Lopez,6,bellr002,Ronnie Belliard,4,zimmr001,Ryan Zimmerman,5,yound001,Dmitri Young,3,keara001,Austin Kearns,9,churr001,Ryan Church,8,schnb001,Brian Schneider,2,snelc001,Chris Snelling,7,pattj004,John Patterson,1,reyej001,Jose Reyes,6,lodup001,Paul Lo Duca,2,beltc001,Carlos Beltran,8,delgc001,Carlos Delgado,3,wrigd002,David Wright,5,aloum001,Moises Alou,7,grees001,Shawn Green,9,valej003,Jose Valentin,4,pelfm001,Mike Pelfrey,1,,Y,2007,1,1,5,200704130,0.262826,0.260997,0.330226,0.333827,0.438704,0.414492,0.76893,0.748319,148.0,118.0,36.0,60.0,101.0,136.0,0.261811,0.252704,0.337456,0.322034,0.394685,0.362832,0.732141,0.684866,24.0,21.0,6.0,10.0,21.0,19.0,0.0,0.0,0.5,0.0,,1.0,1.0,5.2,5.1,6.0,2.0,24.0,20.0,0.0,0.0,2.0,2.0,2.0,2.0,4.0,3.0,0.0,0.0,2.0,3.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.666667,5.333333,21.333333,23.666667,25.0,30.0,99.0,114.0,1.0,1.0,14.0,19.0,13.0,18.0,12.0,11.0,0.0,0.0,13.0,14.0,1.0,3.0,1.0,3.0,2.0,1.0,3.0,1.0,0.0,0.0,6.0,8.0,0.0,1.0,21.333333,81.666667,25.0,80.0,99.0,355.0,1.0,13.0,14.0,54.0,13.0,53.0,12.0,29.0,0.0,5.0,13.0,76.0,1.0,4.0,1.0,5.0,2.0,1.0,3.0,4.0,0.0,0.0,6.0,18.0,0.0,3.0,21.333333,182.333333,25.0,162.0,99.0,759.0,1.0,22.0,14.0,80.0,13.0,77.0,12.0,57.0,0.0,8.0,13.0,175.0,1.0,5.0,1.0,8.0,2.0,7.0,3.0,7.0,0.0,0.0,6.0,34.0,0.0,3.0,37.0,41.0,9.0,13.0,34.0,43.0,21.333333,23.666667,99.0,114.0,13.0,18.0,98.0,108.0,98.0,108.0,98.0,108.0,37.0,41.0,37.0,41.0,13.0,14.0,46.0,54.0,5.484375,6.84507,4.59375,4.56338,0.989899,0.947368,1.734375,1.732394,0.131313,0.122807,0.464646,0.473684,0.373737,0.359649,37.0,109.0,9.0,63.0,34.0,143.0,45.0,81.666667,180.0,355.0,26.148148,53.0,98.0,344.0,204.784,344.0,187.1,344.0,72.5,109.0,66.97,109.0,29.2,76.0,82.45,172.0,5.22963,5.840816,4.550756,4.212245,1.137689,0.969014,1.611111,1.334694,0.162222,0.214085,0.458056,0.484507,0.372056,0.307042,37.0,219.0,9.0,106.0,34.0,268.0,90.0,182.333333,360.0,759.0,51.148148,77.0,98.0,593.0,407.824,593.0,385.1,593.0,140.0,219.0,133.57,219.0,65.2,175.0,163.45,325.0,5.114815,3.800731,4.531378,3.252285,1.132844,0.781291,1.555556,1.201097,0.181111,0.230567,0.454028,0.428195,0.371028,0.288538
23475,20090806,0,Thu,MIN,AL,108,CLE,AL,108,1,2,51,D,,,,CLE08,21657.0,157,100000,00010010x,33,7,2,0,0,0,1,0,0,3,0,5,1,0,0,0,9,2,2,2,0,0,24,10,0,0,2,0,28,8,2,0,0,2,0,1,0,2,0,2,1,0,1,0,5,4,1,1,1,0,27,15,0,0,0,0,barrt901,Ted Barrett,hoyej901,James Hoye,holbs901,Sam Holbrook,vanol901,Larry Vanover,,(none),,(none),gardr001,Ron Gardenhire,wedge001,Eric Wedge,sippt001,Tony Sipp,blacn001,Nick Blackburn,woodk002,Kerry Wood,crowt001,Trevor Crowe,blacn001,Nick Blackburn,carmf001,Fausto Carmona,spand001,Denard Span,8,cabro001,Orlando Cabrera,6,mauej001,Joe Mauer,10,mornj001,Justin Morneau,3,kubej002,Jason Kubel,7,cuddm001,Michael Cuddyer,9,credj001,Joe Crede,5,redmm001,Mike Redmond,2,casia001,Alexi Casilla,4,sizeg001,Grady Sizemore,8,cabra002,Asdrubal Cabrera,6,choos001,Shin-Soo Choo,9,peraj001,Jhonny Peralta,5,hafnt001,Travis Hafner,10,gimec001,Chris Gimenez,3,valbl001,Luis Valbuena,4,crowt001,Trevor Crowe,7,torew001,Wyatt Toregas,2,,Y,2009,1,1,3,200908060,0.270227,0.271314,0.344457,0.341782,0.433113,0.417337,0.77757,0.759119,80.0,99.0,35.0,31.0,97.0,84.0,0.273166,0.256291,0.344077,0.324301,0.451737,0.420317,0.795814,0.744618,14.0,17.0,9.0,6.0,13.0,17.0,0.0,0.0,0.5,0.0,,1.0,1.0,6.0,6.1,6.0,7.0,27.0,26.0,0.0,0.0,1.0,2.0,1.0,2.0,3.0,2.0,0.0,0.0,2.0,2.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,0.0,0.0,6.0,6.333333,23.666667,37.333333,30.0,57.0,123.0,172.0,4.0,7.0,30.0,26.0,26.0,24.0,22.0,4.0,0.0,0.0,12.0,17.0,1.0,0.0,0.0,2.0,3.0,0.0,0.0,0.0,1.0,0.0,4.0,12.0,0.0,0.0,73.0,104.0,83.0,116.0,348.0,436.0,11.0,11.0,65.0,43.0,60.0,39.0,46.0,20.0,0.0,0.0,43.0,45.0,2.0,1.0,1.0,2.0,4.0,1.0,5.0,1.0,1.0,0.0,17.0,28.0,1.0,1.0,158.333333,187.333333,173.0,220.0,739.0,807.0,15.0,23.0,127.0,98.0,116.0,86.0,93.0,45.0,0.0,4.0,84.0,78.0,3.0,4.0,4.0,4.0,11.0,1.0,10.0,1.0,2.0,0.0,38.0,45.0,3.0,3.0,52.0,61.0,16.0,33.0,46.0,90.0,23.666667,37.333333,123.0,172.0,26.0,24.0,184.0,240.0,184.0,240.0,184.0,240.0,52.0,61.0,52.0,61.0,12.0,17.0,68.0,94.0,9.887324,5.785714,7.774648,6.428571,1.495935,1.395349,2.197183,1.633929,0.097561,0.098837,0.552846,0.546512,0.422764,0.354651,129.0,136.0,52.0,63.0,135.0,179.0,73.0,104.0,348.0,436.0,60.0,39.0,444.0,461.0,444.0,461.0,444.0,461.0,129.0,136.0,129.0,136.0,43.0,45.0,181.0,199.0,7.39726,3.375,6.082192,4.432692,1.275862,1.057339,1.767123,1.307692,0.123563,0.103211,0.520115,0.456422,0.37069,0.311927,266.0,265.0,89.0,120.0,262.0,340.0,158.333333,187.333333,739.0,807.0,116.0,86.0,825.0,938.0,825.0,938.0,825.0,938.0,266.0,265.0,266.0,265.0,84.0,78.0,355.0,385.0,6.593684,4.131673,5.210526,5.007117,1.116373,1.16233,1.68,1.414591,0.113667,0.096654,0.480379,0.477076,0.359946,0.328377
54403,20230403,0,Mon,PHI,NL,4,NYA,AL,4,1,8,51,N,,,,NYC21,37202.0,161,100000,20105000x,37,11,2,0,0,1,0,0,0,0,0,7,0,0,0,0,9,4,8,8,0,1,24,8,0,0,0,0,33,9,1,1,2,8,0,0,0,9,0,7,1,0,0,0,10,4,1,1,0,0,27,9,0,0,0,0,emmep901,Paul Emmel,fairc901,Chad Fairchild,lentn901,Nic Lentz,rehaj901,Jeremie Rehak,,(none),,(none),giraj001,Joe Girardi,boona001,Aaron Boone,cortn001,Nestor Cortes,walkt004,Taijuan Walker,,(none),stanm004,Giancarlo Stanton,walkt004,Taijuan Walker,cortn001,Nestor Cortes,turnt001,Trea Turner,6,schwk001,Kyle Schwarber,7,realj001,J.T. Realmuto,2,castn001,Nick Castellanos,9,bohma001,Alec Bohm,10,halld003,Darick Hall,3,sosae001,Edmundo Sosa,5,stotb001,Bryson Stott,4,marsb002,Brandon Marsh,8,lemad001,DJ LeMahieu,5,judga001,Aaron Judge,8,rizza001,Anthony Rizzo,3,stanm004,Giancarlo Stanton,10,torrg001,Gleyber Torres,4,cordf003,Franchy Cordero,9,hicka001,Aaron Hicks,7,trevj001,Jose Trevino,2,volpa001,Anthony Volpe,6,,Y,2023,7,1,9,202304030,0.241602,0.254219,0.319364,0.313283,0.427649,0.422609,0.747013,0.735893,106.0,107.0,34.0,28.0,74.0,68.0,0.258193,0.252725,0.337178,0.315168,0.449851,0.435084,0.787029,0.750252,28.0,19.0,7.0,7.0,10.0,10.0,0.636364,0.409836,0.613264,7.5,O,1.0,1.0,5.0,4.1,7.0,4.0,21.0,20.0,0.0,1.0,1.0,4.0,1.0,4.0,0.0,3.0,0.0,0.0,3.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,1.0,5.0,4.333333,33.333333,34.666667,15.0,32.0,123.0,142.0,1.0,5.0,5.0,15.0,5.0,14.0,9.0,7.0,0.0,0.0,35.0,39.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,4.0,6.0,0.0,0.0,84.333333,78.666667,54.0,75.0,326.0,333.0,7.0,11.0,24.0,37.0,24.0,36.0,21.0,23.0,0.0,0.0,85.0,71.0,0.0,0.0,3.0,2.0,1.0,0.0,1.0,5.0,0.0,0.0,9.0,16.0,0.0,0.0,167.333333,164.666667,117.0,145.0,650.0,674.0,18.0,15.0,48.0,65.0,47.0,63.0,38.0,48.0,0.0,1.0,172.0,137.0,0.0,0.0,3.0,2.0,1.0,0.0,2.0,6.0,0.0,0.0,23.0,28.0,1.0,1.0,24.0,39.0,7.0,21.0,22.0,53.0,33.333333,34.666667,123.0,142.0,5.0,14.0,15.0,104.0,15.0,104.0,15.0,104.0,24.0,39.0,24.0,39.0,35.0,39.0,31.0,60.0,1.35,3.634615,0.45,3.0,0.121951,0.732394,0.72,1.125,0.284553,0.274648,0.252033,0.422535,0.195122,0.274648,75.0,98.0,30.0,49.0,84.0,124.0,84.333333,78.666667,326.0,333.0,24.0,36.0,146.0,295.0,146.0,295.0,146.0,295.0,75.0,98.0,75.0,98.0,85.0,71.0,105.0,147.0,2.561265,4.118644,1.731225,3.75,0.447853,0.885886,0.889328,1.245763,0.260736,0.213213,0.322086,0.441441,0.230061,0.294294,155.0,193.0,79.0,75.0,196.0,220.0,167.333333,164.666667,650.0,674.0,47.0,63.0,355.0,500.0,355.0,500.0,355.0,500.0,155.0,193.0,155.0,193.0,172.0,137.0,234.0,268.0,2.527888,3.44332,2.121514,3.036437,0.546154,0.74184,0.926295,1.172065,0.264615,0.203264,0.36,0.397626,0.238462,0.28635
28608,20110821,0,Sun,CIN,NL,127,PIT,NL,125,5,4,54,D,,,,PIT08,29967.0,173,3002,200002000,32,7,1,0,1,5,0,0,1,6,0,9,1,0,2,0,7,3,4,4,0,0,27,9,0,0,0,0,33,7,2,1,2,4,0,0,0,1,0,7,0,1,0,0,3,5,5,5,0,0,27,8,0,0,2,0,davib902,Bob Davidson,wendh902,Hunter Wendelstedt,knigb901,Brian Knight,laynj901,Jerry Layne,,(none),,(none),baked002,Dusty Baker,hurdc001,Clint Hurdle,arrej001,Jose Arredondo,hanrj001,Joel Hanrahan,cordf002,Francisco Cordero,philb001,Brandon Phillips,leakm001,Mike Leake,mcdoj004,James McDonald,philb001,Brandon Phillips,4,lewif001,Fred Lewis,7,vottj001,Joey Votto,3,brucj001,Jay Bruce,9,frazt001,Todd Frazier,5,stubd001,Drew Stubbs,8,hanir001,Ryan Hanigan,2,janip001,Paul Janish,6,leakm001,Mike Leake,1,tabaj002,Jose Tabata,9,joneg002,Garrett Jones,3,mccua001,Andrew McCutchen,8,doumr001,Ryan Doumit,2,walkn001,Neil Walker,4,ludwr001,Ryan Ludwick,7,woodb003,Brandon Wood,5,ceder002,Ronny Cedeno,6,mcdoj004,James McDonald,1,,Y,2011,-1,0,9,201108210,0.245788,0.261676,0.309987,0.326614,0.371062,0.418538,0.681049,0.745152,104.0,92.0,47.0,49.0,131.0,92.0,0.236538,0.258383,0.297345,0.324349,0.348077,0.42998,0.645422,0.754329,18.0,15.0,11.0,8.0,27.0,21.0,0.0,0.0,0.5,0.0,,1.0,1.0,6.0,6.0,3.0,5.0,23.0,24.0,1.0,2.0,3.0,4.0,3.0,4.0,3.0,1.0,0.0,0.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,6.0,6.0,35.333333,38.0,36.0,42.0,152.0,164.0,7.0,6.0,14.0,16.0,14.0,14.0,10.0,9.0,2.0,2.0,32.0,29.0,2.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,7.0,9.0,0.0,0.0,85.666667,96.333333,90.0,95.0,376.0,401.0,12.0,12.0,35.0,38.0,33.0,36.0,36.0,20.0,3.0,2.0,71.0,66.0,3.0,1.0,3.0,4.0,3.0,1.0,3.0,6.0,1.0,1.0,17.0,20.0,0.0,1.0,168.0,156.333333,172.0,171.0,733.0,675.0,22.0,24.0,74.0,90.0,71.0,80.0,72.0,42.0,8.0,3.0,140.0,116.0,7.0,3.0,5.0,6.0,6.0,2.0,5.0,8.0,1.0,1.0,36.0,34.0,0.0,2.0,46.0,51.0,28.0,27.0,64.0,69.0,35.333333,38.0,152.0,164.0,14.0,14.0,165.0,173.0,165.0,173.0,165.0,173.0,46.0,51.0,46.0,51.0,32.0,29.0,74.0,78.0,3.566038,3.315789,4.669811,4.552632,1.085526,1.054878,1.301887,1.342105,0.210526,0.176829,0.486842,0.47561,0.302632,0.310976,126.0,115.0,53.0,58.0,143.0,153.0,85.666667,96.333333,376.0,401.0,33.0,36.0,392.0,369.0,392.0,369.0,392.0,369.0,126.0,115.0,126.0,115.0,71.0,66.0,179.0,173.0,3.466926,3.363322,4.575875,3.83045,1.042553,0.9202,1.470817,1.193772,0.18883,0.164589,0.476064,0.431421,0.335106,0.286783,244.0,213.0,102.0,110.0,274.0,281.0,168.0,156.333333,733.0,675.0,71.0,80.0,738.0,719.0,738.0,719.0,738.0,719.0,244.0,213.0,244.0,213.0,140.0,116.0,346.0,323.0,3.803571,4.605544,4.392857,4.599147,1.006821,1.065185,1.452381,1.362473,0.190996,0.171852,0.472033,0.478519,0.332879,0.315556
19486,20080404,0,Fri,LAN,NL,4,SDN,NL,5,7,1,54,N,,,,SAN02,42474.0,180,100600,000001000,34,8,1,0,0,6,0,2,0,7,0,7,0,0,0,0,9,2,1,1,0,0,27,10,0,0,0,0,31,4,0,1,1,1,0,0,0,1,0,6,0,0,0,0,4,4,6,6,1,0,27,11,1,0,0,0,tscht901,Tim Tschida,joycj901,Jim Joyce,nelsj901,Jeff Nelson,ticht901,Todd Tichenor,,(none),,(none),torrj101,Joe Torre,blacb001,Buddy Black,kuroh001,Hiroki Kuroda,thatj001,Joe Thatcher,,(none),martr004,Russell Martin,kuroh001,Hiroki Kuroda,germj001,Justin Germano,furcr001,Rafael Furcal,6,martr004,Russell Martin,2,lonej001,James Loney,3,kentj001,Jeff Kent,4,ethia001,Andre Ethier,7,jonea002,Andruw Jones,8,kempm001,Matt Kemp,9,dewib001,Blake DeWitt,5,kuroh001,Hiroki Kuroda,1,gileb002,Brian Giles,9,iguct001,Tadahito Iguchi,4,kouzk001,Kevin Kouzmanoff,5,gonza003,Adrian Gonzalez,3,hairs001,Scott Hairston,8,greek002,Khalil Greene,6,barrm003,Michael Barrett,2,mcanp001,Paul McAnulty,7,germj001,Justin Germano,1,,Y,2008,-6,0,8,200804040,0.252378,0.27666,0.320333,0.33741,0.411596,0.406445,0.731929,0.743855,55.0,141.0,24.0,51.0,91.0,116.0,0.26558,0.289549,0.335646,0.343085,0.430489,0.440077,0.766135,0.783162,4.0,32.0,3.0,11.0,12.0,18.0,0.0,0.0,0.5,0.0,,1.0,1.0,6.0,7.0,3.0,3.0,24.0,24.0,0.0,1.0,1.0,1.0,0.0,1.0,2.0,0.0,0.0,0.0,3.0,4.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,6.0,7.0,19.0,0.0,28.0,0.0,91.0,0.0,3.0,0.0,16.0,0.0,12.0,0.0,6.0,0.0,0.0,0.0,13.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,9.0,0.0,1.0,0.0,68.666667,0.0,73.0,0.0,307.0,0.0,7.0,0.0,43.0,0.0,38.0,0.0,27.0,0.0,3.0,0.0,45.0,0.0,3.0,0.0,0.0,0.0,1.0,0.0,5.0,0.0,0.0,0.0,20.0,0.0,1.0,0.0,140.0,0.0,145.0,0.0,601.0,0.0,15.0,0.0,78.0,0.0,72.0,0.0,43.0,0.0,4.0,0.0,86.0,0.0,4.0,0.0,0.0,0.0,1.0,0.0,9.0,0.0,0.0,0.0,35.0,0.0,2.0,0.0,34.0,0.0,20.0,0.0,48.0,0.0,19.0,18.0,91.0,72.0,12.0,10.0,115.0,0.0,115.0,81.216,115.0,79.2,34.0,27.0,34.0,26.64,13.0,14.4,54.0,32.4,5.684211,5.0,6.052632,4.512,1.263736,1.128,1.789474,1.5,0.142857,0.2,0.593407,0.45,0.373626,0.37,100.0,0.0,43.0,0.0,116.0,0.0,68.666667,45.0,307.0,180.0,38.0,25.0,301.0,0.0,301.0,203.04,301.0,198.0,100.0,67.5,100.0,66.6,45.0,36.0,143.0,81.0,4.980583,5.0,4.383495,4.512,0.980456,1.128,1.456311,1.5,0.14658,0.2,0.465798,0.45,0.325733,0.37,188.0,0.0,84.0,0.0,229.0,0.0,140.0,90.0,601.0,360.0,72.0,50.0,587.0,0.0,587.0,406.08,587.0,396.0,188.0,135.0,188.0,133.2,86.0,72.0,272.0,162.0,4.628571,5.0,4.192857,4.512,0.976705,1.128,1.342857,1.5,0.143095,0.2,0.452579,0.45,0.312812,0.37


In [95]:
df.shape

(56771, 451)

In [96]:
(df.Strt_IP_mod_6_h==0).sum()

0

In [97]:
(df.Strt_IP_mod_6_v==0).sum()

0

In [98]:
df.loc[df.Strt_IP_mod_6_v==0]

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,Strt_GS_h,Strt_GS_v,Strt_IP_h,Strt_IP_v,Strt_H_h,Strt_H_v,Strt_BFP_h,Strt_BFP_v,Strt_HR_h,Strt_HR_v,Strt_R_h,Strt_R_v,Strt_ER_h,Strt_ER_v,Strt_BB_h,Strt_BB_v,Strt_IB_h,Strt_IB_v,Strt_SO_h,Strt_SO_v,Strt_SH_h,Strt_SH_v,Strt_SF_h,Strt_SF_v,Strt_WP_h,Strt_WP_v,Strt_HBP_h,Strt_HBP_v,Strt_BK_h,Strt_BK_v,Strt_2B_h,Strt_2B_v,Strt_3B_h,Strt_3B_v,Strt_IP_real_h,Strt_IP_real_v,Strt_rollsum_IP_real_6_h,Strt_rollsum_IP_real_6_v,Strt_rollsum_H_6_h,Strt_rollsum_H_6_v,Strt_rollsum_BFP_6_h,Strt_rollsum_BFP_6_v,Strt_rollsum_HR_6_h,Strt_rollsum_HR_6_v,Strt_rollsum_R_6_h,Strt_rollsum_R_6_v,Strt_rollsum_ER_6_h,Strt_rollsum_ER_6_v,Strt_rollsum_BB_6_h,Strt_rollsum_BB_6_v,Strt_rollsum_IB_6_h,Strt_rollsum_IB_6_v,Strt_rollsum_SO_6_h,Strt_rollsum_SO_6_v,Strt_rollsum_SH_6_h,Strt_rollsum_SH_6_v,Strt_rollsum_SF_6_h,Strt_rollsum_SF_6_v,Strt_rollsum_WP_6_h,Strt_rollsum_WP_6_v,Strt_rollsum_HBP_6_h,Strt_rollsum_HBP_6_v,Strt_rollsum_BK_6_h,Strt_rollsum_BK_6_v,Strt_rollsum_2B_6_h,Strt_rollsum_2B_6_v,Strt_rollsum_3B_6_h,Strt_rollsum_3B_6_v,Strt_rollsum_IP_real_15_h,Strt_rollsum_IP_real_15_v,Strt_rollsum_H_15_h,Strt_rollsum_H_15_v,Strt_rollsum_BFP_15_h,Strt_rollsum_BFP_15_v,Strt_rollsum_HR_15_h,Strt_rollsum_HR_15_v,Strt_rollsum_R_15_h,Strt_rollsum_R_15_v,Strt_rollsum_ER_15_h,Strt_rollsum_ER_15_v,Strt_rollsum_BB_15_h,Strt_rollsum_BB_15_v,Strt_rollsum_IB_15_h,Strt_rollsum_IB_15_v,Strt_rollsum_SO_15_h,Strt_rollsum_SO_15_v,Strt_rollsum_SH_15_h,Strt_rollsum_SH_15_v,Strt_rollsum_SF_15_h,Strt_rollsum_SF_15_v,Strt_rollsum_WP_15_h,Strt_rollsum_WP_15_v,Strt_rollsum_HBP_15_h,Strt_rollsum_HBP_15_v,Strt_rollsum_BK_15_h,Strt_rollsum_BK_15_v,Strt_rollsum_2B_15_h,Strt_rollsum_2B_15_v,Strt_rollsum_3B_15_h,Strt_rollsum_3B_15_v,Strt_rollsum_IP_real_30_h,Strt_rollsum_IP_real_30_v,Strt_rollsum_H_30_h,Strt_rollsum_H_30_v,Strt_rollsum_BFP_30_h,Strt_rollsum_BFP_30_v,Strt_rollsum_HR_30_h,Strt_rollsum_HR_30_v,Strt_rollsum_R_30_h,Strt_rollsum_R_30_v,Strt_rollsum_ER_30_h,Strt_rollsum_ER_30_v,Strt_rollsum_BB_30_h,Strt_rollsum_BB_30_v,Strt_rollsum_IB_30_h,Strt_rollsum_IB_30_v,Strt_rollsum_SO_30_h,Strt_rollsum_SO_30_v,Strt_rollsum_SH_30_h,Strt_rollsum_SH_30_v,Strt_rollsum_SF_30_h,Strt_rollsum_SF_30_v,Strt_rollsum_WP_30_h,Strt_rollsum_WP_30_v,Strt_rollsum_HBP_30_h,Strt_rollsum_HBP_30_v,Strt_rollsum_BK_30_h,Strt_rollsum_BK_30_v,Strt_rollsum_2B_30_h,Strt_rollsum_2B_30_v,Strt_rollsum_3B_30_h,Strt_rollsum_3B_30_v,Strt_H_BB_roll_6_h,Strt_H_BB_roll_6_v,Strt_XB_roll_6_h,Strt_XB_roll_6_v,Strt_TB_roll_6_h,Strt_TB_roll_6_v,Strt_IP_mod_6_h,Strt_IP_mod_6_v,Strt_BF_mod_6_h,Strt_BF_mod_6_v,Strt_ER_mod_6_h,Strt_ER_mod_6_v,Strt_FIP_numer_6_h,Strt_FIP_numer_6_v,Strt_FIP_numer_mod_6_h,Strt_FIP_numer_mod_6_v,Strt_FIP_numer_mod2_6_h,Strt_FIP_numer_mod2_6_v,Strt_H_BB_mod_6_h,Strt_H_BB_mod_6_v,Strt_H_BB_mod2_6_h,Strt_H_BB_mod2_6_v,Strt_SO_mod_6_h,Strt_SO_mod_6_v,Strt_TB_BB_mod_6_h,Strt_TB_BB_mod_6_v,Strt_ERA_6_h,Strt_ERA_6_v,Strt_FIP_6_h,Strt_FIP_6_v,Strt_FIP_perc_6_h,Strt_FIP_perc_6_v,Strt_WHIP_6_h,Strt_WHIP_6_v,Strt_SO_perc_6_h,Strt_SO_perc_6_v,Strt_TB_BB_perc_6_h,Strt_TB_BB_perc_6_v,Strt_H_BB_perc_6_h,Strt_H_BB_perc_6_v,Strt_H_BB_roll_15_h,Strt_H_BB_roll_15_v,Strt_XB_roll_15_h,Strt_XB_roll_15_v,Strt_TB_roll_15_h,Strt_TB_roll_15_v,Strt_IP_mod_15_h,Strt_IP_mod_15_v,Strt_BF_mod_15_h,Strt_BF_mod_15_v,Strt_ER_mod_15_h,Strt_ER_mod_15_v,Strt_FIP_numer_15_h,Strt_FIP_numer_15_v,Strt_FIP_numer_mod_15_h,Strt_FIP_numer_mod_15_v,Strt_FIP_numer_mod2_15_h,Strt_FIP_numer_mod2_15_v,Strt_H_BB_mod_15_h,Strt_H_BB_mod_15_v,Strt_H_BB_mod2_15_h,Strt_H_BB_mod2_15_v,Strt_SO_mod_15_h,Strt_SO_mod_15_v,Strt_TB_BB_mod_15_h,Strt_TB_BB_mod_15_v,Strt_ERA_15_h,Strt_ERA_15_v,Strt_FIP_15_h,Strt_FIP_15_v,Strt_FIP_perc_15_h,Strt_FIP_perc_15_v,Strt_WHIP_15_h,Strt_WHIP_15_v,Strt_SO_perc_15_h,Strt_SO_perc_15_v,Strt_TB_BB_perc_15_h,Strt_TB_BB_perc_15_v,Strt_H_BB_perc_15_h,Strt_H_BB_perc_15_v,Strt_H_BB_roll_30_h,Strt_H_BB_roll_30_v,Strt_XB_roll_30_h,Strt_XB_roll_30_v,Strt_TB_roll_30_h,Strt_TB_roll_30_v,Strt_IP_mod_30_h,Strt_IP_mod_30_v,Strt_BF_mod_30_h,Strt_BF_mod_30_v,Strt_ER_mod_30_h,Strt_ER_mod_30_v,Strt_FIP_numer_30_h,Strt_FIP_numer_30_v,Strt_FIP_numer_mod_30_h,Strt_FIP_numer_mod_30_v,Strt_FIP_numer_mod2_30_h,Strt_FIP_numer_mod2_30_v,Strt_H_BB_mod_30_h,Strt_H_BB_mod_30_v,Strt_H_BB_mod2_30_h,Strt_H_BB_mod2_30_v,Strt_SO_mod_30_h,Strt_SO_mod_30_v,Strt_TB_BB_mod_30_h,Strt_TB_BB_mod_30_v,Strt_ERA_30_h,Strt_ERA_30_v,Strt_FIP_30_h,Strt_FIP_30_v,Strt_FIP_perc_30_h,Strt_FIP_perc_30_v,Strt_WHIP_30_h,Strt_WHIP_30_v,Strt_SO_perc_30_h,Strt_SO_perc_30_v,Strt_TB_BB_perc_30_h,Strt_TB_BB_perc_30_v,Strt_H_BB_perc_30_h,Strt_H_BB_perc_30_v


In [99]:
df.loc[df.Strt_IP_mod_6_h==0]

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,Strt_GS_h,Strt_GS_v,Strt_IP_h,Strt_IP_v,Strt_H_h,Strt_H_v,Strt_BFP_h,Strt_BFP_v,Strt_HR_h,Strt_HR_v,Strt_R_h,Strt_R_v,Strt_ER_h,Strt_ER_v,Strt_BB_h,Strt_BB_v,Strt_IB_h,Strt_IB_v,Strt_SO_h,Strt_SO_v,Strt_SH_h,Strt_SH_v,Strt_SF_h,Strt_SF_v,Strt_WP_h,Strt_WP_v,Strt_HBP_h,Strt_HBP_v,Strt_BK_h,Strt_BK_v,Strt_2B_h,Strt_2B_v,Strt_3B_h,Strt_3B_v,Strt_IP_real_h,Strt_IP_real_v,Strt_rollsum_IP_real_6_h,Strt_rollsum_IP_real_6_v,Strt_rollsum_H_6_h,Strt_rollsum_H_6_v,Strt_rollsum_BFP_6_h,Strt_rollsum_BFP_6_v,Strt_rollsum_HR_6_h,Strt_rollsum_HR_6_v,Strt_rollsum_R_6_h,Strt_rollsum_R_6_v,Strt_rollsum_ER_6_h,Strt_rollsum_ER_6_v,Strt_rollsum_BB_6_h,Strt_rollsum_BB_6_v,Strt_rollsum_IB_6_h,Strt_rollsum_IB_6_v,Strt_rollsum_SO_6_h,Strt_rollsum_SO_6_v,Strt_rollsum_SH_6_h,Strt_rollsum_SH_6_v,Strt_rollsum_SF_6_h,Strt_rollsum_SF_6_v,Strt_rollsum_WP_6_h,Strt_rollsum_WP_6_v,Strt_rollsum_HBP_6_h,Strt_rollsum_HBP_6_v,Strt_rollsum_BK_6_h,Strt_rollsum_BK_6_v,Strt_rollsum_2B_6_h,Strt_rollsum_2B_6_v,Strt_rollsum_3B_6_h,Strt_rollsum_3B_6_v,Strt_rollsum_IP_real_15_h,Strt_rollsum_IP_real_15_v,Strt_rollsum_H_15_h,Strt_rollsum_H_15_v,Strt_rollsum_BFP_15_h,Strt_rollsum_BFP_15_v,Strt_rollsum_HR_15_h,Strt_rollsum_HR_15_v,Strt_rollsum_R_15_h,Strt_rollsum_R_15_v,Strt_rollsum_ER_15_h,Strt_rollsum_ER_15_v,Strt_rollsum_BB_15_h,Strt_rollsum_BB_15_v,Strt_rollsum_IB_15_h,Strt_rollsum_IB_15_v,Strt_rollsum_SO_15_h,Strt_rollsum_SO_15_v,Strt_rollsum_SH_15_h,Strt_rollsum_SH_15_v,Strt_rollsum_SF_15_h,Strt_rollsum_SF_15_v,Strt_rollsum_WP_15_h,Strt_rollsum_WP_15_v,Strt_rollsum_HBP_15_h,Strt_rollsum_HBP_15_v,Strt_rollsum_BK_15_h,Strt_rollsum_BK_15_v,Strt_rollsum_2B_15_h,Strt_rollsum_2B_15_v,Strt_rollsum_3B_15_h,Strt_rollsum_3B_15_v,Strt_rollsum_IP_real_30_h,Strt_rollsum_IP_real_30_v,Strt_rollsum_H_30_h,Strt_rollsum_H_30_v,Strt_rollsum_BFP_30_h,Strt_rollsum_BFP_30_v,Strt_rollsum_HR_30_h,Strt_rollsum_HR_30_v,Strt_rollsum_R_30_h,Strt_rollsum_R_30_v,Strt_rollsum_ER_30_h,Strt_rollsum_ER_30_v,Strt_rollsum_BB_30_h,Strt_rollsum_BB_30_v,Strt_rollsum_IB_30_h,Strt_rollsum_IB_30_v,Strt_rollsum_SO_30_h,Strt_rollsum_SO_30_v,Strt_rollsum_SH_30_h,Strt_rollsum_SH_30_v,Strt_rollsum_SF_30_h,Strt_rollsum_SF_30_v,Strt_rollsum_WP_30_h,Strt_rollsum_WP_30_v,Strt_rollsum_HBP_30_h,Strt_rollsum_HBP_30_v,Strt_rollsum_BK_30_h,Strt_rollsum_BK_30_v,Strt_rollsum_2B_30_h,Strt_rollsum_2B_30_v,Strt_rollsum_3B_30_h,Strt_rollsum_3B_30_v,Strt_H_BB_roll_6_h,Strt_H_BB_roll_6_v,Strt_XB_roll_6_h,Strt_XB_roll_6_v,Strt_TB_roll_6_h,Strt_TB_roll_6_v,Strt_IP_mod_6_h,Strt_IP_mod_6_v,Strt_BF_mod_6_h,Strt_BF_mod_6_v,Strt_ER_mod_6_h,Strt_ER_mod_6_v,Strt_FIP_numer_6_h,Strt_FIP_numer_6_v,Strt_FIP_numer_mod_6_h,Strt_FIP_numer_mod_6_v,Strt_FIP_numer_mod2_6_h,Strt_FIP_numer_mod2_6_v,Strt_H_BB_mod_6_h,Strt_H_BB_mod_6_v,Strt_H_BB_mod2_6_h,Strt_H_BB_mod2_6_v,Strt_SO_mod_6_h,Strt_SO_mod_6_v,Strt_TB_BB_mod_6_h,Strt_TB_BB_mod_6_v,Strt_ERA_6_h,Strt_ERA_6_v,Strt_FIP_6_h,Strt_FIP_6_v,Strt_FIP_perc_6_h,Strt_FIP_perc_6_v,Strt_WHIP_6_h,Strt_WHIP_6_v,Strt_SO_perc_6_h,Strt_SO_perc_6_v,Strt_TB_BB_perc_6_h,Strt_TB_BB_perc_6_v,Strt_H_BB_perc_6_h,Strt_H_BB_perc_6_v,Strt_H_BB_roll_15_h,Strt_H_BB_roll_15_v,Strt_XB_roll_15_h,Strt_XB_roll_15_v,Strt_TB_roll_15_h,Strt_TB_roll_15_v,Strt_IP_mod_15_h,Strt_IP_mod_15_v,Strt_BF_mod_15_h,Strt_BF_mod_15_v,Strt_ER_mod_15_h,Strt_ER_mod_15_v,Strt_FIP_numer_15_h,Strt_FIP_numer_15_v,Strt_FIP_numer_mod_15_h,Strt_FIP_numer_mod_15_v,Strt_FIP_numer_mod2_15_h,Strt_FIP_numer_mod2_15_v,Strt_H_BB_mod_15_h,Strt_H_BB_mod_15_v,Strt_H_BB_mod2_15_h,Strt_H_BB_mod2_15_v,Strt_SO_mod_15_h,Strt_SO_mod_15_v,Strt_TB_BB_mod_15_h,Strt_TB_BB_mod_15_v,Strt_ERA_15_h,Strt_ERA_15_v,Strt_FIP_15_h,Strt_FIP_15_v,Strt_FIP_perc_15_h,Strt_FIP_perc_15_v,Strt_WHIP_15_h,Strt_WHIP_15_v,Strt_SO_perc_15_h,Strt_SO_perc_15_v,Strt_TB_BB_perc_15_h,Strt_TB_BB_perc_15_v,Strt_H_BB_perc_15_h,Strt_H_BB_perc_15_v,Strt_H_BB_roll_30_h,Strt_H_BB_roll_30_v,Strt_XB_roll_30_h,Strt_XB_roll_30_v,Strt_TB_roll_30_h,Strt_TB_roll_30_v,Strt_IP_mod_30_h,Strt_IP_mod_30_v,Strt_BF_mod_30_h,Strt_BF_mod_30_v,Strt_ER_mod_30_h,Strt_ER_mod_30_v,Strt_FIP_numer_30_h,Strt_FIP_numer_30_v,Strt_FIP_numer_mod_30_h,Strt_FIP_numer_mod_30_v,Strt_FIP_numer_mod2_30_h,Strt_FIP_numer_mod2_30_v,Strt_H_BB_mod_30_h,Strt_H_BB_mod_30_v,Strt_H_BB_mod2_30_h,Strt_H_BB_mod2_30_v,Strt_SO_mod_30_h,Strt_SO_mod_30_v,Strt_TB_BB_mod_30_h,Strt_TB_BB_mod_30_v,Strt_ERA_30_h,Strt_ERA_30_v,Strt_FIP_30_h,Strt_FIP_30_v,Strt_FIP_perc_30_h,Strt_FIP_perc_30_v,Strt_WHIP_30_h,Strt_WHIP_30_v,Strt_SO_perc_30_h,Strt_SO_perc_30_v,Strt_TB_BB_perc_30_h,Strt_TB_BB_perc_30_v,Strt_H_BB_perc_30_h,Strt_H_BB_perc_30_v


In [100]:
df.drop(df.index[df.Strt_IP_mod_6_v==0],inplace=True)
df.drop(df.index[df.Strt_IP_mod_6_h==0],inplace=True)
df.shape

(56771, 451)

In [101]:
df.reset_index(drop=True, inplace=True)

In [102]:
df.to_csv('df_bp5.csv', index=False)