## Baseball Prediction: 5b - Adding Starting Pitching Features
Now that we have raw game-level data for each pitcher, we can derive features based on the starting pitchers to help our prediction model for individual games.

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline

pd.set_option('display.max_columns',1000)
pd.set_option('display.max_rows',1000)



## Overall Plan of Attack
- For each starting pitcher we will load their raw data, create features for each game based on their previous performance, and then save the dataframe in a dictionary structure for easy lookup
- Then we can iterate through our game-level dataframe, add in the features for each starting pitcher, and use those to improve our model


In [2]:
df_gooden = pd.read_csv('data/pitcher_data/pitching_data_goodd001.csv')

In [3]:
df_gooden.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 430 entries, 0 to 429
Data columns (total 31 columns):
 #   Column       Non-Null Count  Dtype  
---  ------       --------------  -----  
 0   at_vs        430 non-null    object 
 1   Opponent     430 non-null    object 
 2   League       430 non-null    object 
 3   GS           430 non-null    int64  
 4   CG           430 non-null    int64  
 5   SHO          430 non-null    int64  
 6   GF           430 non-null    int64  
 7   SV           430 non-null    int64  
 8   IP           430 non-null    float64
 9   H            430 non-null    int64  
 10  BFP          430 non-null    int64  
 11  HR           430 non-null    int64  
 12  R            430 non-null    int64  
 13  ER           430 non-null    int64  
 14  BB           430 non-null    int64  
 15  IB           430 non-null    int64  
 16  SO           430 non-null    int64  
 17  SH           430 non-null    int64  
 18  SF           430 non-null    int64  
 19  WP      

In [4]:
df_gooden.head(20)

Unnamed: 0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,Date,dblhead_num
0,AT,HOU,N,1,0,0,0,0,5.0,3,20,0,1,1,2,0,5,0,0,0,0,0,0,0,0,0,1,0,1.8,4- 7-1984,
1,AT,CHI,N,1,0,0,0,0,3.1,7,20,0,6,6,3,0,4,0,0,0,0,0,1,0,0,0,0,1,7.56,4-13-1984,
2,VS,MON,N,1,0,0,0,0,5.0,5,26,0,4,0,4,0,7,0,0,0,1,0,0,0,0,1,0,0,4.72,4-19-1984,
3,AT,MON,N,1,0,0,0,0,7.0,2,24,0,1,0,1,0,10,0,0,0,0,1,0,0,0,1,0,0,3.1,4-25-1984,
4,VS,CHI,N,1,0,0,0,0,7.0,4,30,0,1,1,5,0,10,0,0,1,0,0,2,0,0,0,1,0,2.63,5- 1-1984,
5,VS,HOU,N,1,0,0,0,0,2.1,6,15,0,8,8,2,0,4,0,0,0,0,1,0,0,0,0,0,1,4.85,5- 6-1984,
6,AT,LA,N,1,1,1,0,0,9.0,4,32,0,0,0,2,0,11,0,0,0,0,1,0,0,0,0,1,0,3.72,5-11-1984,
7,AT,SD,N,1,0,0,0,0,4.2,5,22,0,4,4,3,0,8,0,0,0,0,0,1,1,0,0,0,1,4.15,5-18-1984,
8,VS,LA,N,1,0,0,0,0,8.0,3,30,1,1,1,3,0,14,0,0,0,0,0,1,0,0,0,1,0,3.68,5-25-1984,
9,VS,STL,N,1,0,0,0,0,7.0,4,28,0,1,1,3,0,7,1,1,0,0,0,0,0,0,0,0,0,3.39,6- 1-1984,


In [5]:
df_gooden['IP_real'] = df_gooden['IP_real'] = (df_gooden.IP - (df_gooden.IP % 1)) + (df_gooden.IP % 1) * (10/3)
df_gooden.head(10)

Unnamed: 0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,Date,dblhead_num,IP_real
0,AT,HOU,N,1,0,0,0,0,5.0,3,20,0,1,1,2,0,5,0,0,0,0,0,0,0,0,0,1,0,1.8,4- 7-1984,,5.0
1,AT,CHI,N,1,0,0,0,0,3.1,7,20,0,6,6,3,0,4,0,0,0,0,0,1,0,0,0,0,1,7.56,4-13-1984,,3.333333
2,VS,MON,N,1,0,0,0,0,5.0,5,26,0,4,0,4,0,7,0,0,0,1,0,0,0,0,1,0,0,4.72,4-19-1984,,5.0
3,AT,MON,N,1,0,0,0,0,7.0,2,24,0,1,0,1,0,10,0,0,0,0,1,0,0,0,1,0,0,3.1,4-25-1984,,7.0
4,VS,CHI,N,1,0,0,0,0,7.0,4,30,0,1,1,5,0,10,0,0,1,0,0,2,0,0,0,1,0,2.63,5- 1-1984,,7.0
5,VS,HOU,N,1,0,0,0,0,2.1,6,15,0,8,8,2,0,4,0,0,0,0,1,0,0,0,0,0,1,4.85,5- 6-1984,,2.333333
6,AT,LA,N,1,1,1,0,0,9.0,4,32,0,0,0,2,0,11,0,0,0,0,1,0,0,0,0,1,0,3.72,5-11-1984,,9.0
7,AT,SD,N,1,0,0,0,0,4.2,5,22,0,4,4,3,0,8,0,0,0,0,0,1,1,0,0,0,1,4.15,5-18-1984,,4.666667
8,VS,LA,N,1,0,0,0,0,8.0,3,30,1,1,1,3,0,14,0,0,0,0,0,1,0,0,0,1,0,3.68,5-25-1984,,8.0
9,VS,STL,N,1,0,0,0,0,7.0,4,28,0,1,1,3,0,7,1,1,0,0,0,0,0,0,0,0,0,3.39,6- 1-1984,,7.0


In [6]:
df_gooden.columns

Index(['at_vs', 'Opponent', 'League', 'GS', 'CG', 'SHO', 'GF', 'SV', 'IP', 'H',
       'BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP', 'HBP', 'BK',
       '2B', '3B', 'GDP', 'ROE', 'W', 'L', 'ERA', 'Date', 'dblhead_num',
       'IP_real'],
      dtype='object')

### Generating Features for a Starting Pitcher
- Want to creature features based on a lookback across $n$ games for each pitcher
- Need to aggregate statistics like innings pitched (IP), runs or earned runs given up, hits and walks given up, strikeouts, and so on
- We will also need to decide how to handle pitchers early in their career when they have relatively few games on which to base their performance.

In [7]:
def roll_column(df, col, winsize):
    # do the standard Pandas rolling calc
    t_col = df[col].rolling(winsize, closed='left').sum().to_numpy()
    
    # for the early columns, just do a rolling sum from the beginning
    t_col[:winsize] = np.concatenate(([0],df[col].iloc[:(winsize)].cumsum().to_numpy()[:-1]))

    return(t_col)

In [8]:
def load_and_process_pitch_df(p_id, filepath=''):
    fname = filepath+'pitching_data_'+p_id+'.csv'
    pitch_df = pd.read_csv(fname)
    
    # Convert date, fix dblhead_num to be 0,1,2
    pitch_df['Date'] = (pd.to_datetime(pitch_df.Date).astype(str).str.replace('-','')).astype(int)
    pitch_df.dblhead_num.fillna(0, inplace=True)
    pitch_df['dblhead_num'] = pitch_df['dblhead_num'].astype(int)
    
    # Convert IP to proper mathematical format
    pitch_df['IP_real'] = (pitch_df.IP - (pitch_df.IP % 1)) + (pitch_df.IP % 1) * (10/3)
    
    cols_to_agg = ['IP_real', 'H','BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP', 'HBP', 'BK',
       '2B', '3B']
    winsizes = [10,35]
    for winsize in winsizes:
        for raw_col in cols_to_agg:
            new_colname = 'rollsum_'+raw_col+'_'+str(winsize)        
            pitch_df[new_colname] = roll_column(pitch_df, raw_col, winsize)

    
    er_per_ip_def = (5/9)
    h_bb_per_ip_def = 1.5
    h_bb_per_bf_def = .37
    so_per_bf_def = .2
    ip_per_game_def = 3
    bf_per_game_def = 12
    tb_bb_perc_def = .45
    for winsize in winsizes:
        hit_col = 'rollsum_H_'+str(winsize)
        bb_col = 'rollsum_BB_'+str(winsize)
        h_bb_col = 'H_BB_roll_'+str(winsize)
        double_col = 'rollsum_2B_'+str(winsize)
        triple_col = 'rollsum_3B_'+str(winsize)
        hr_col = 'rollsum_HR_'+str(winsize)
        xb_col = 'XB_roll_'+str(winsize)
        tb_col = 'TB_roll_'+str(winsize)
        so_col = 'rollsum_SO_'+str(winsize)
        so_mod_col = 'SO_mod_'+str(winsize)
        ip_col = 'rollsum_IP_real_'+str(winsize)
        ip_mod_col = 'IP_mod_'+str(winsize)
        er_col = 'rollsum_ER_'+str(winsize)
        er_mod_col = 'ER_mod_'+str(winsize)
        bf_col = 'rollsum_BFP_'+str(winsize)
        bf_mod_col = 'BF_mod_'+str(winsize)
        era_col = 'ERA_'+str(winsize)
        whip_col = 'WHIP_'+str(winsize)
        so_perc_col = 'SO_perc_'+str(winsize)
        h_bb_perc_col = 'H_BB_perc_'+str(winsize)
        h_bb_mod_col = 'H_BB_mod_'+str(winsize)
        h_bb_mod2_col = 'H_BB_mod2_'+str(winsize)
        tb_bb_mod_col = 'TB_BB_mod_'+str(winsize)
        tb_bb_perc_col = 'TB_BB_perc_'+str(winsize)
        pitch_df[h_bb_col] = pitch_df[hit_col]+pitch_df[bb_col]
        pitch_df[xb_col] = pitch_df[double_col]+2*pitch_df[triple_col]+2*pitch_df[hr_col]
        pitch_df[tb_col] = pitch_df[hit_col]+pitch_df[xb_col]
        pitch_df[ip_mod_col] = np.maximum(pitch_df[ip_col], winsize*ip_per_game_def)
        pitch_df[bf_mod_col] = np.maximum(pitch_df[bf_col], winsize*bf_per_game_def)
        pitch_df[er_mod_col] = pitch_df[er_col] + er_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[h_bb_mod_col] = pitch_df[h_bb_col] + h_bb_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[h_bb_mod2_col] = pitch_df[h_bb_col] + h_bb_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[so_mod_col] = pitch_df[so_col] + so_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[tb_bb_mod_col] = (pitch_df[tb_col] + pitch_df[bb_col])+ tb_bb_perc_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[era_col] = (pitch_df[er_mod_col]/pitch_df[ip_mod_col])*9
        pitch_df[whip_col] = pitch_df[h_bb_mod_col]/pitch_df[ip_mod_col]
        pitch_df[so_perc_col] = pitch_df[so_mod_col]/pitch_df[bf_mod_col]
        pitch_df[tb_bb_perc_col] = pitch_df[tb_bb_mod_col]/pitch_df[bf_mod_col]
        pitch_df[h_bb_perc_col] = pitch_df[h_bb_mod2_col]/pitch_df[bf_mod_col]
    pitch_df['date_dblhead'] = (pitch_df['Date'].astype(str) + pitch_df['dblhead_num'].astype(str)).astype(int)
    pitch_df.set_index('date_dblhead', inplace=True)
    return(pitch_df)

In [9]:
df_good = load_and_process_pitch_df('goodd001','data/pitcher_data/')

In [10]:
df_good.head(50)

Unnamed: 0_level_0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,Date,dblhead_num,IP_real,rollsum_IP_real_10,rollsum_H_10,rollsum_BFP_10,rollsum_HR_10,rollsum_R_10,rollsum_ER_10,rollsum_BB_10,rollsum_IB_10,rollsum_SO_10,rollsum_SH_10,rollsum_SF_10,rollsum_WP_10,rollsum_HBP_10,rollsum_BK_10,rollsum_2B_10,rollsum_3B_10,rollsum_IP_real_35,rollsum_H_35,rollsum_BFP_35,rollsum_HR_35,rollsum_R_35,rollsum_ER_35,rollsum_BB_35,rollsum_IB_35,rollsum_SO_35,rollsum_SH_35,rollsum_SF_35,rollsum_WP_35,rollsum_HBP_35,rollsum_BK_35,rollsum_2B_35,rollsum_3B_35,H_BB_roll_10,XB_roll_10,TB_roll_10,IP_mod_10,BF_mod_10,ER_mod_10,H_BB_mod_10,H_BB_mod2_10,SO_mod_10,TB_BB_mod_10,ERA_10,WHIP_10,SO_perc_10,TB_BB_perc_10,H_BB_perc_10,H_BB_roll_35,XB_roll_35,TB_roll_35,IP_mod_35,BF_mod_35,ER_mod_35,H_BB_mod_35,H_BB_mod2_35,SO_mod_35,TB_BB_mod_35,ERA_35,WHIP_35,SO_perc_35,TB_BB_perc_35,H_BB_perc_35
date_dblhead,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1
198404070,AT,HOU,N,1,0,0,0,0,5.0,3,20,0,1,1,2,0,5,0,0,0,0,0,0,0,0,0,1,0,1.8,19840407,0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30.0,120.0,16.666667,45.0,44.4,24.0,54.0,5.0,1.5,0.2,0.45,0.37,0.0,0.0,0.0,105.0,420.0,58.333333,157.5,155.4,84.0,189.0,5.0,1.5,0.2,0.45,0.37
198404130,AT,CHI,N,1,0,0,0,0,3.1,7,20,0,6,6,3,0,4,0,0,0,0,0,1,0,0,0,0,1,7.56,19840413,0,3.333333,5.0,3.0,20.0,0.0,1.0,1.0,2.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,3.0,20.0,0.0,1.0,1.0,2.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,3.0,30.0,120.0,14.888889,42.5,42.0,25.0,50.0,4.466667,1.416667,0.208333,0.416667,0.35,5.0,0.0,3.0,105.0,420.0,56.555556,155.0,153.0,85.0,185.0,4.847619,1.47619,0.202381,0.440476,0.364286
198404190,VS,MON,N,1,0,0,0,0,5.0,5,26,0,4,0,4,0,7,0,0,0,1,0,0,0,0,1,0,0,4.72,19840419,0,5.0,8.333333,10.0,40.0,0.0,7.0,7.0,5.0,0.0,9.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,8.333333,10.0,40.0,0.0,7.0,7.0,5.0,0.0,9.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,15.0,1.0,11.0,30.0,120.0,19.037037,47.5,44.6,25.0,52.0,5.711111,1.583333,0.208333,0.433333,0.371667,15.0,1.0,11.0,105.0,420.0,60.703704,160.0,155.6,85.0,187.0,5.203175,1.52381,0.202381,0.445238,0.370476
198404250,AT,MON,N,1,0,0,0,0,7.0,2,24,0,1,0,1,0,10,0,0,0,0,1,0,0,0,1,0,0,3.1,19840425,0,7.0,13.333333,15.0,66.0,0.0,11.0,7.0,9.0,0.0,16.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,13.333333,15.0,66.0,0.0,11.0,7.0,9.0,0.0,16.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,24.0,1.0,16.0,30.0,120.0,16.259259,49.0,43.98,26.8,49.3,4.877778,1.633333,0.223333,0.410833,0.3665,24.0,1.0,16.0,105.0,420.0,57.925926,161.5,154.98,86.8,184.3,4.965079,1.538095,0.206667,0.43881,0.369
198405010,VS,CHI,N,1,0,0,0,0,7.0,4,30,0,1,1,5,0,10,0,0,1,0,0,2,0,0,0,1,0,2.63,19840501,0,7.0,20.333333,17.0,90.0,0.0,12.0,7.0,10.0,0.0,26.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,20.333333,17.0,90.0,0.0,12.0,7.0,10.0,0.0,26.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,27.0,1.0,18.0,30.0,120.0,12.37037,41.5,38.1,32.0,41.5,3.711111,1.383333,0.266667,0.345833,0.3175,27.0,1.0,18.0,105.0,420.0,54.037037,154.0,149.1,92.0,176.5,4.631746,1.466667,0.219048,0.420238,0.355
198405060,VS,HOU,N,1,0,0,0,0,2.1,6,15,0,8,8,2,0,4,0,0,0,0,1,0,0,0,0,0,1,4.85,19840506,0,2.333333,27.333333,21.0,120.0,0.0,13.0,8.0,15.0,0.0,36.0,0.0,0.0,1.0,1.0,1.0,3.0,0.0,27.333333,21.0,120.0,0.0,13.0,8.0,15.0,0.0,36.0,0.0,0.0,1.0,1.0,1.0,3.0,0.0,36.0,3.0,24.0,30.0,120.0,9.481481,40.0,36.0,36.0,39.0,2.844444,1.333333,0.3,0.325,0.3,36.0,3.0,24.0,105.0,420.0,51.148148,152.5,147.0,96.0,174.0,4.384127,1.452381,0.228571,0.414286,0.35
198405110,AT,LA,N,1,1,1,0,0,9.0,4,32,0,0,0,2,0,11,0,0,0,0,1,0,0,0,0,1,0,3.72,19840511,0,9.0,29.666667,27.0,135.0,0.0,21.0,16.0,17.0,0.0,40.0,0.0,0.0,1.0,1.0,2.0,3.0,0.0,29.666667,27.0,135.0,0.0,21.0,16.0,17.0,0.0,40.0,0.0,0.0,1.0,1.0,2.0,3.0,0.0,44.0,3.0,30.0,30.0,135.0,16.185185,44.5,44.0,40.0,47.0,4.855556,1.483333,0.296296,0.348148,0.325926,44.0,3.0,30.0,105.0,420.0,57.851852,157.0,149.45,97.0,175.25,4.95873,1.495238,0.230952,0.417262,0.355833
198405180,AT,SD,N,1,0,0,0,0,4.2,5,22,0,4,4,3,0,8,0,0,0,0,0,1,1,0,0,0,1,4.15,19840518,0,4.666667,38.666667,31.0,167.0,0.0,21.0,16.0,19.0,0.0,51.0,0.0,0.0,1.0,1.0,3.0,3.0,0.0,38.666667,31.0,167.0,0.0,21.0,16.0,19.0,0.0,51.0,0.0,0.0,1.0,1.0,3.0,3.0,0.0,50.0,3.0,34.0,38.666667,167.0,16.0,50.0,50.0,51.0,53.0,3.724138,1.293103,0.305389,0.317365,0.299401,50.0,3.0,34.0,105.0,420.0,52.851852,149.5,143.61,101.6,166.85,4.530159,1.42381,0.241905,0.397262,0.341929
198405250,VS,LA,N,1,0,0,0,0,8.0,3,30,1,1,1,3,0,14,0,0,0,0,0,1,0,0,0,1,0,3.68,19840525,0,8.0,43.333333,36.0,189.0,0.0,25.0,20.0,22.0,0.0,59.0,0.0,0.0,1.0,1.0,3.0,4.0,1.0,43.333333,36.0,189.0,0.0,25.0,20.0,22.0,0.0,59.0,0.0,0.0,1.0,1.0,3.0,4.0,1.0,58.0,6.0,42.0,43.333333,189.0,20.0,58.0,58.0,59.0,64.0,4.153846,1.338462,0.312169,0.338624,0.306878,58.0,6.0,42.0,105.0,420.0,54.259259,150.5,143.47,105.2,167.95,4.650794,1.433333,0.250476,0.399881,0.341595
198406010,VS,STL,N,1,0,0,0,0,7.0,4,28,0,1,1,3,0,7,1,1,0,0,0,0,0,0,0,0,0,3.39,19840601,0,7.0,51.333333,39.0,219.0,1.0,26.0,21.0,25.0,0.0,73.0,0.0,0.0,1.0,1.0,3.0,5.0,1.0,51.333333,39.0,219.0,1.0,26.0,21.0,25.0,0.0,73.0,0.0,0.0,1.0,1.0,3.0,5.0,1.0,64.0,9.0,48.0,51.333333,219.0,21.0,64.0,64.0,73.0,73.0,3.681818,1.246753,0.333333,0.333333,0.292237,64.0,9.0,48.0,105.0,420.0,50.814815,144.5,138.37,113.2,163.45,4.355556,1.37619,0.269524,0.389167,0.329452


## Load in our game level data

In [11]:
df=pd.read_csv('df_bp3.csv')

  exec(code_obj, self.user_global_ns, self.user_ns)


In [12]:
start_pitchers_h = df.pitcher_start_id_h.unique()
start_pitchers_v = df.pitcher_start_id_v.unique()
start_pitchers_all = np.union1d(start_pitchers_h, start_pitchers_v)


In [13]:
pitcher_data_dict = {}
for i, p_id in enumerate(start_pitchers_all):
    if i%100==0:
        print(i)
    pitcher_data_dict[p_id] = load_and_process_pitch_df(p_id,'data/pitcher_data/')

0
100
200
300
400
500
600
700
800
900
1000
1100
1200
1300
1400
1500
1600
1700
1800
1900
2000
2100
2200
2300
2400
2500
2600
2700
2800
2900
3000


In [14]:
raw_cols_to_add = ['IP_real', 'rollsum_IP_real_10', 'rollsum_H_10',
       'rollsum_BFP_10', 'rollsum_HR_10', 'rollsum_R_10', 'rollsum_ER_10',
       'rollsum_BB_10', 'rollsum_IB_10', 'rollsum_SO_10', 'rollsum_SH_10',
       'rollsum_SF_10', 'rollsum_WP_10', 'rollsum_HBP_10',
       'rollsum_BK_10', 'rollsum_2B_10', 'rollsum_3B_10',
       'rollsum_IP_real_35', 'rollsum_H_35', 'rollsum_BFP_35',
       'rollsum_HR_35', 'rollsum_R_35', 'rollsum_ER_35', 'rollsum_BB_35',
       'rollsum_IB_35', 'rollsum_SO_35', 'rollsum_SH_35', 'rollsum_SF_35',
       'rollsum_WP_35', 'rollsum_HBP_35', 'rollsum_BK_35',
       'rollsum_2B_35', 'rollsum_3B_35', 'H_BB_roll_10', 'XB_roll_10',
       'TB_roll_10', 'IP_mod_10', 'BF_mod_10', 'ER_mod_10', 'H_BB_mod_10', 'H_BB_perc_10',
       'SO_mod_10', 'TB_BB_mod_10', 'ERA_10', 'WHIP_10', 'SO_perc_10',
       'TB_BB_perc_10', 'H_BB_roll_35', 'XB_roll_35', 'TB_roll_35',
       'IP_mod_35', 'BF_mod_35', 'ER_mod_35', 'H_BB_mod_35','H_BB_perc_35', 'SO_mod_35',
       'TB_BB_mod_35', 'ERA_35', 'WHIP_35', 'SO_perc_35', 'TB_BB_perc_35']
cols_to_add = [col+suff for col in raw_cols_to_add for suff in ['_h','_v']]

col_add_dict = {col:np.zeros(df.shape[0]) for col in cols_to_add}

In [15]:
for i in range(df.shape[0]):
    row = df.iloc[i,:]
    if i%1000==0:
        print(i)
    sp_id_v = row['pitcher_start_id_v']
    sp_id_h = row['pitcher_start_id_h']
    date_dblhead = row['date_dblhead']
    if sp_id_v in pitcher_data_dict.keys():
        curr_df = pitcher_data_dict[sp_id_v]
        if date_dblhead in curr_df.index:
            for col in raw_cols_to_add:
                col_add_dict[col+'_v'][i] = curr_df.loc[date_dblhead,col]
        else:
            print(f'no match for {sp_id_v} date {date_dblhead}')
    if sp_id_h in pitcher_data_dict.keys():
        curr_df = pitcher_data_dict[sp_id_h]
        if date_dblhead in curr_df.index:
            for col in raw_cols_to_add:
                col_add_dict[col+'_h'][i] = curr_df.loc[date_dblhead,col]
        else:
            print(f'no match for {sp_id_h} date {date_dblhead}')

0
1000
2000
3000
4000
no match for wilcm001 date 198206020
5000
6000
7000
no match for laskb001 date 198308280
8000
9000
10000
11000
12000
no match for sotom001 date 198605260
13000
14000
15000
no match for ferns001 date 198708030
16000
17000
18000
19000
20000
21000
no match for jackd001 date 199008130
22000
no match for candt001 date 199009160
23000
24000
25000
26000
no match for harkm001 date 199208250
no match for tewkb001 date 199304150
27000
28000
29000
no match for cormr001 date 199405200
30000
no match for herso001 date 199407160
31000
32000
33000
34000
35000
36000
37000
38000
39000
no match for merck001 date 199809200
40000
41000
42000
43000
44000
45000
46000
47000
48000
no match for milte001 date 200208060
49000
50000
51000
52000
53000
no match for armat002 date 200408030
54000
55000
56000
57000
no match for mitrs001 date 200605120
58000
59000
60000
61000
62000
63000
64000
65000
66000
67000
68000
no match for volqe001 date 201104220
69000
70000
no match for oswar001 date 20110

In [16]:
for col in cols_to_add:
    df[col] = col_add_dict[col]

  df[col] = col_add_dict[col]


In [17]:
df.sample(5)

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SObat_perc_162_h,SObat_perc_162_v,SLGmod_162_h,SLGmod_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SObat_perc_30_h,SObat_perc_30_v,SLGmod_30_h,SLGmod_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,IP_real_h,IP_real_v,rollsum_IP_real_10_h,rollsum_IP_real_10_v,rollsum_H_10_h,rollsum_H_10_v,rollsum_BFP_10_h,rollsum_BFP_10_v,rollsum_HR_10_h,rollsum_HR_10_v,rollsum_R_10_h,rollsum_R_10_v,rollsum_ER_10_h,rollsum_ER_10_v,rollsum_BB_10_h,rollsum_BB_10_v,rollsum_IB_10_h,rollsum_IB_10_v,rollsum_SO_10_h,rollsum_SO_10_v,rollsum_SH_10_h,rollsum_SH_10_v,rollsum_SF_10_h,rollsum_SF_10_v,rollsum_WP_10_h,rollsum_WP_10_v,rollsum_HBP_10_h,rollsum_HBP_10_v,rollsum_BK_10_h,rollsum_BK_10_v,rollsum_2B_10_h,rollsum_2B_10_v,rollsum_3B_10_h,rollsum_3B_10_v,rollsum_IP_real_35_h,rollsum_IP_real_35_v,rollsum_H_35_h,rollsum_H_35_v,rollsum_BFP_35_h,rollsum_BFP_35_v,rollsum_HR_35_h,rollsum_HR_35_v,rollsum_R_35_h,rollsum_R_35_v,rollsum_ER_35_h,rollsum_ER_35_v,rollsum_BB_35_h,rollsum_BB_35_v,rollsum_IB_35_h,rollsum_IB_35_v,rollsum_SO_35_h,rollsum_SO_35_v,rollsum_SH_35_h,rollsum_SH_35_v,rollsum_SF_35_h,rollsum_SF_35_v,rollsum_WP_35_h,rollsum_WP_35_v,rollsum_HBP_35_h,rollsum_HBP_35_v,rollsum_BK_35_h,rollsum_BK_35_v,rollsum_2B_35_h,rollsum_2B_35_v,rollsum_3B_35_h,rollsum_3B_35_v,H_BB_roll_10_h,H_BB_roll_10_v,XB_roll_10_h,XB_roll_10_v,TB_roll_10_h,TB_roll_10_v,IP_mod_10_h,IP_mod_10_v,BF_mod_10_h,BF_mod_10_v,ER_mod_10_h,ER_mod_10_v,H_BB_mod_10_h,H_BB_mod_10_v,H_BB_perc_10_h,H_BB_perc_10_v,SO_mod_10_h,SO_mod_10_v,TB_BB_mod_10_h,TB_BB_mod_10_v,ERA_10_h,ERA_10_v,WHIP_10_h,WHIP_10_v,SO_perc_10_h,SO_perc_10_v,TB_BB_perc_10_h,TB_BB_perc_10_v,H_BB_roll_35_h,H_BB_roll_35_v,XB_roll_35_h,XB_roll_35_v,TB_roll_35_h,TB_roll_35_v,IP_mod_35_h,IP_mod_35_v,BF_mod_35_h,BF_mod_35_v,ER_mod_35_h,ER_mod_35_v,H_BB_mod_35_h,H_BB_mod_35_v,H_BB_perc_35_h,H_BB_perc_35_v,SO_mod_35_h,SO_mod_35_v,TB_BB_mod_35_h,TB_BB_mod_35_v,ERA_35_h,ERA_35_v,WHIP_35_h,WHIP_35_v,SO_perc_35_h,SO_perc_35_v,TB_BB_perc_35_h,TB_BB_perc_35_v
90497,20190928,0,Sat,BAL,AL,161,BOS,AL,161,9,4,54,D,,,,BOS07,36414.0,217,211004001,300001000,37,12,3,0,4,9,1,0,0,4,0,10,2,1,0,0,6,6,4,4,0,0,27,12,0,0,2,0,35,9,0,0,2,4,0,0,0,5,0,7,0,0,2,0,9,7,9,9,0,0,27,11,0,0,0,0,onorb901,Brian O'Nora,rippm901,Mark Ripperger,hoyej901,James Hoye,lives901,Shane Livensparger,,(none),,(none),hydeb801,Brandon Hyde,coraa001,Alex Cora,meanj001,John Means,chacj001,Jhoulys Chacin,,(none),nuner001,Renato Nunez,meanj001,John Means,chacj001,Jhoulys Chacin,villj001,Jonathan Villar,4,stewd002,DJ Stewart,9,manct001,Trey Mancini,7,ruizr002,Rio Ruiz,5,nuner001,Renato Nunez,10,davic003,Chris Davis,3,wilks001,Steve Wilkerson,8,wynna001,Austin Wynns,2,martr006,Richie Martin,6,bradj001,Jackie Bradley,8,dever001,Rafael Devers,5,bogax001,Xander Bogaerts,6,martj006,J.D. Martinez,10,travs001,Sam Travis,7,holtb002,Brock Holt,3,herng001,Gorkys Hernandez,9,owinc001,Chris Owings,4,leons001,Sandy Leon,2,,Y,2019,-5,0,13,201909280,0.269437,0.246151,0.337365,0.303737,0.467359,0.41246,0.804724,0.716196,70.0,84.0,30.0,29.0,89.0,107.0,0.218784,0.236276,0.516884,0.457341,0.233083,0.257435,0.302564,0.315338,0.400376,0.428439,0.70294,0.743777,10.0,18.0,7.0,3.0,11.0,16.0,0.218784,0.236276,0.454701,0.473008,0.6,0.416667,0.591667,10.5,O,2.666667,5.0,33.333333,55.333333,41.0,54.0,153.0,230.0,8.0,8.0,24.0,29.0,21.0,28.0,12.0,12.0,1.0,0.0,42.0,42.0,0.0,0.0,2.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,9.0,13.0,1.0,2.0,161.333333,153.333333,154.0,139.0,696.0,631.0,27.0,22.0,90.0,70.0,83.0,64.0,64.0,36.0,3.0,0.0,148.0,120.0,8.0,0.0,6.0,3.0,6.0,5.0,6.0,5.0,0.0,0.0,31.0,36.0,3.0,3.0,53.0,66.0,27.0,33.0,68.0,87.0,33.333333,55.333333,153.0,230.0,21.0,28.0,53.0,66.0,0.346405,0.286957,42.0,42.0,80.0,99.0,5.67,4.554217,1.59,1.192771,0.27451,0.182609,0.522876,0.430435,218.0,175.0,91.0,86.0,245.0,225.0,161.333333,153.333333,696.0,631.0,83.0,64.0,218.0,175.0,0.313218,0.277338,148.0,120.0,309.0,261.0,4.630165,3.756522,1.35124,1.141304,0.212644,0.190174,0.443966,0.413629
11391,19850824,0,Sat,SDN,NL,123,NYN,NL,122,1,5,51,N,,,,NYC17,40863.0,152,10000000,02000102x,30,7,1,0,0,1,1,0,0,4,0,6,0,1,2,0,7,2,5,5,0,0,24,9,0,0,0,0,33,11,2,0,0,5,2,0,0,0,0,3,0,0,0,0,6,2,1,1,0,0,27,11,0,0,2,0,kiblj901,John Kibler,steld901,Dick Stello,froeb901,Bruce Froemming,davib902,Bob Davidson,,(none),,(none),willd104,Dick Williams,johnd105,Davey Johnson,darlr001,Ron Darling,dravd001,Dave Dravecky,orosj001,Jesse Orosco,santr001,Rafael Santana,dravd001,Dave Dravecky,darlr001,Ron Darling,tempg001,Garry Templeton,6,gwynt001,Tony Gwynn,9,garvs001,Steve Garvey,3,nettg001,Graig Nettles,5,kennt001,Terry Kennedy,2,martc001,Carmelo Martinez,7,mcrek001,Kevin McReynolds,8,flant001,Tim Flannery,4,dravd001,Dave Dravecky,1,dyksl001,Lenny Dykstra,8,backw001,Wally Backman,4,hernk001,Keith Hernandez,3,cartg001,Gary Carter,2,fostg001,George Foster,7,pacit001,Tom Paciorek,9,knigr001,Ray Knight,5,santr001,Rafael Santana,6,darlr001,Ron Darling,1,,Y,1985,4,1,6,198508240,0.254396,0.25262,0.320934,0.312157,0.380403,0.365739,0.701337,0.677896,116.0,86.0,56.0,43.0,121.0,130.0,0.149791,0.138201,0.435696,0.416265,0.282675,0.253644,0.347465,0.313059,0.420466,0.353741,0.767931,0.666801,24.0,14.0,8.0,8.0,18.0,28.0,0.149791,0.138201,0.472811,0.405188,0.0,0.0,0.5,0.0,,7.0,6.0,58.333333,64.666667,61.0,63.0,270.0,267.0,6.0,4.0,32.0,21.0,23.0,16.0,38.0,14.0,1.0,3.0,35.0,33.0,3.0,5.0,2.0,2.0,3.0,0.0,1.0,1.0,1.0,0.0,13.0,11.0,2.0,0.0,229.333333,203.333333,201.0,170.0,967.0,816.0,22.0,17.0,97.0,63.0,79.0,56.0,105.0,57.0,3.0,5.0,170.0,108.0,9.0,10.0,6.0,3.0,8.0,3.0,3.0,1.0,1.0,1.0,40.0,31.0,4.0,1.0,99.0,77.0,29.0,19.0,90.0,82.0,58.333333,64.666667,270.0,267.0,23.0,16.0,99.0,77.0,0.366667,0.28839,35.0,33.0,128.0,96.0,3.548571,2.226804,1.697143,1.190722,0.12963,0.123596,0.474074,0.359551,306.0,227.0,92.0,67.0,293.0,237.0,229.333333,203.333333,967.0,816.0,79.0,56.0,306.0,227.0,0.316443,0.278186,170.0,108.0,398.0,294.0,3.100291,2.478689,1.334302,1.116393,0.175801,0.132353,0.411582,0.360294
8871,19840715,0,Sun,SFN,NL,88,PIT,NL,89,3,9,51,D,,,,PIT07,13078.0,142,10020000,20006001x,30,3,0,0,1,3,0,1,0,0,0,2,0,0,0,0,1,3,9,9,0,0,24,10,0,0,3,0,38,17,3,1,2,9,0,0,0,2,0,4,0,0,3,0,7,1,2,2,0,0,27,12,1,0,0,0,weyel901,Lee Weyer,rennd901,Dutch Rennert,ripps901,Steve Rippley,grege901,Eric Gregg,,(none),,(none),robif103,Frank Robinson,tannc101,Chuck Tanner,tudoj001,John Tudor,robij001,Jeff Robinson,,(none),madlb001,Bill Madlock,robij001,Jeff Robinson,tudoj001,John Tudor,lemaj001,Johnnie LeMaster,6,trilm001,Manny Trillo,4,baked002,Dusty Baker,9,leonj001,Jeffrey Leonard,8,brenb001,Bob Brenly,3,younj001,Joel Youngblood,5,nicos001,Steve Nicosia,2,rabbj001,John Rabb,7,robij001,Jeff Robinson,1,wynnm001,Marvell Wynne,8,mazzl001,Lee Mazzilli,7,madlb001,Bill Madlock,5,thomj001,Jason Thompson,3,penat001,Tony Pena,2,ray-j001,Johnny Ray,4,frobd001,Doug Frobel,9,berrd001,Dale Berra,6,tudoj001,John Tudor,1,,Y,1984,6,1,12,198407150,0.254342,0.261463,0.312198,0.331632,0.360347,0.380822,0.672545,0.712454,99.0,118.0,74.0,81.0,140.0,166.0,0.138328,0.165816,0.409978,0.439651,0.266167,0.273567,0.32149,0.335025,0.373946,0.384473,0.695436,0.719499,15.0,31.0,15.0,16.0,27.0,30.0,0.138328,0.165816,0.421144,0.436548,0.0,0.0,0.5,0.0,,9.0,4.0,61.666667,46.666667,69.0,56.0,268.0,210.0,8.0,5.0,29.0,32.0,27.0,29.0,13.0,15.0,0.0,2.0,34.0,31.0,4.0,3.0,1.0,1.0,0.0,2.0,0.0,2.0,1.0,1.0,11.0,10.0,3.0,1.0,236.666667,96.333333,250.0,100.0,1024.0,417.0,32.0,8.0,122.0,52.0,108.0,44.0,75.0,29.0,3.0,4.0,123.0,67.0,11.0,3.0,5.0,4.0,4.0,4.0,0.0,4.0,2.0,1.0,48.0,15.0,5.0,2.0,82.0,71.0,33.0,22.0,102.0,78.0,61.666667,46.666667,268.0,210.0,27.0,29.0,82.0,71.0,0.30597,0.338095,34.0,31.0,115.0,93.0,3.940541,5.592857,1.32973,1.521429,0.126866,0.147619,0.429104,0.442857,325.0,129.0,122.0,35.0,372.0,135.0,236.666667,105.0,1024.0,420.0,108.0,48.814815,325.0,142.0,0.317383,0.309786,123.0,67.6,447.0,165.35,4.107042,4.184127,1.373239,1.352381,0.120117,0.160952,0.436523,0.39369
95618,20220819,0,Fri,SLN,NL,118,ARI,NL,119,5,1,54,N,,,,PHO01,32183.0,172,100000400,000000010,37,12,3,0,1,4,0,0,1,2,0,12,0,0,0,0,8,2,1,1,0,0,27,9,0,0,0,0,31,4,3,0,0,1,0,0,1,1,0,7,0,0,0,0,5,4,4,4,0,0,27,7,0,1,0,0,sches901,Stu Scheurwater,nelsj901,Jeff Nelson,buckc901,CB Bucknor,tosia901,Alex Tosi,,(none),,(none),marmo801,Oliver Marmol,lovut001,Tony Lovullo,mikom001,Miles Mikolas,henrt001,Tommy Henry,,(none),goldp001,Paul Goldschmidt,mikom001,Miles Mikolas,henrt001,Tommy Henry,carld002,Dylan Carlson,8,oneit001,Tyler O'Neill,7,goldp001,Paul Goldschmidt,3,arenn001,Nolan Arenado,5,pujoa001,Albert Pujols,10,edmat001,Tommy Edman,4,dejop001,Paul DeJong,6,moliy001,Yadier Molina,2,nootl001,Lars Nootbaar,9,varsd001,Daulton Varsho,8,rivee001,Emmanuel Rivera,3,rojaj001,Josh Rojas,4,walkc002,Christian Walker,10,mccaj003,Jake McCarthy,9,garrs003,Stone Garrett,7,alcas002,Sergio Alcantara,5,kellc002,Carson Kelly,2,perdg001,Gerardo Perdomo,6,,Y,2022,-4,0,6,202208190,0.231755,0.255729,0.301182,0.31902,0.388672,0.429698,0.689855,0.748718,72.0,101.0,25.0,23.0,102.0,66.0,0.230574,0.215532,0.443919,0.478195,0.247214,0.273547,0.314576,0.348022,0.404255,0.483968,0.718831,0.83199,26.0,14.0,8.0,4.0,13.0,10.0,0.230574,0.215532,0.457565,0.536871,0.384615,0.642857,0.370879,8.5,U,5.333333,8.0,17.333333,60.666667,13.0,63.0,73.0,248.0,2.0,9.0,8.0,33.0,8.0,31.0,8.0,9.0,1.0,0.0,9.0,45.0,0.0,0.0,1.0,6.0,1.0,0.0,1.0,0.0,0.0,1.0,2.0,9.0,0.0,0.0,17.333333,207.666667,13.0,190.0,73.0,842.0,2.0,25.0,8.0,90.0,8.0,82.0,8.0,40.0,1.0,1.0,9.0,153.0,0.0,2.0,1.0,9.0,1.0,2.0,1.0,9.0,0.0,1.0,2.0,32.0,0.0,2.0,21.0,72.0,6.0,27.0,19.0,90.0,30.0,60.666667,120.0,248.0,15.037037,31.0,40.0,72.0,0.319917,0.290323,18.4,45.0,48.15,99.0,4.511111,4.598901,1.333333,1.186813,0.153333,0.181452,0.40125,0.399194,21.0,230.0,6.0,86.0,19.0,276.0,105.0,207.666667,420.0,842.0,56.703704,82.0,152.5,230.0,0.35569,0.273159,78.4,153.0,183.15,316.0,4.860317,3.553772,1.452381,1.107544,0.186667,0.18171,0.436071,0.375297
51128,20030822,0,Fri,PIT,NL,126,MIL,NL,127,2,3,51,N,,,,MIL06,22413.0,179,110,00201000x,29,4,1,0,1,2,1,0,3,5,0,10,0,1,1,0,9,3,3,3,0,0,24,10,0,0,0,0,30,7,2,0,2,3,0,0,0,3,0,11,0,1,0,0,6,4,2,2,0,0,27,11,1,0,1,0,kulpr901,Ron Kulpa,eddid901,Doug Eddings,froeb901,Bruce Froemming,wintm901,Mike Winters,,(none),,(none),mccll001,Lloyd McClendon,yoste001,Ned Yost,franw001,Wayne Franklin,wellk001,Kip Wells,kolbd001,Danny Kolb,podss001,Scott Podsednik,wellk001,Kip Wells,franw001,Wayne Franklin,kendj001,Jason Kendall,2,reboj001,Jeff Reboulet,4,gileb002,Brian Giles,8,sandr002,Reggie Sanders,7,wilsc003,Craig Wilson,3,hernj001,Jose Hernandez,5,davij004,J.J. Davis,9,wilsj002,Jack Wilson,6,wellk001,Kip Wells,1,podss001,Scott Podsednik,8,hallb001,Bill Hall,4,jenkg001,Geoff Jenkins,7,sexsr001,Richie Sexson,3,clarb003,Brady Clark,9,helmw001,Wes Helms,5,osikk001,Keith Osik,2,clayr001,Royce Clayton,6,franw001,Wayne Franklin,1,,Y,2003,1,1,5,200308220,0.252163,0.260463,0.320393,0.328495,0.40447,0.413508,0.724863,0.742003,91.0,77.0,42.0,31.0,108.0,113.0,0.195905,0.173055,0.458804,0.46746,0.257085,0.27676,0.329068,0.351211,0.408907,0.486982,0.737975,0.838193,16.0,8.0,8.0,6.0,18.0,16.0,0.195905,0.173055,0.466179,0.539792,0.0,0.0,0.5,0.0,,7.0,5.0,58.333333,65.0,60.0,67.0,255.0,283.0,12.0,7.0,39.0,32.0,39.0,30.0,27.0,22.0,0.0,3.0,33.0,45.0,5.0,7.0,1.0,2.0,0.0,3.0,4.0,4.0,1.0,0.0,14.0,8.0,2.0,1.0,185.0,218.0,172.0,211.0,812.0,936.0,33.0,29.0,110.0,106.0,104.0,93.0,95.0,79.0,2.0,9.0,118.0,153.0,10.0,13.0,1.0,4.0,1.0,8.0,8.0,11.0,4.0,0.0,35.0,31.0,6.0,2.0,87.0,89.0,42.0,24.0,102.0,91.0,58.333333,65.0,255.0,283.0,39.0,30.0,87.0,89.0,0.341176,0.314488,33.0,45.0,129.0,113.0,6.017143,4.153846,1.491429,1.369231,0.129412,0.159011,0.505882,0.399293,267.0,290.0,113.0,93.0,285.0,304.0,185.0,218.0,812.0,936.0,104.0,93.0,267.0,290.0,0.328818,0.309829,118.0,153.0,380.0,383.0,5.059459,3.83945,1.443243,1.330275,0.14532,0.163462,0.46798,0.409188


In [18]:
df.shape

(96273, 329)

In [19]:
(df.IP_mod_10_h==0).sum()

3

In [20]:
(df.IP_mod_10_v==0).sum()

22

In [21]:
df.loc[df.IP_mod_10_v==0]

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SObat_perc_162_h,SObat_perc_162_v,SLGmod_162_h,SLGmod_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SObat_perc_30_h,SObat_perc_30_v,SLGmod_30_h,SLGmod_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,IP_real_h,IP_real_v,rollsum_IP_real_10_h,rollsum_IP_real_10_v,rollsum_H_10_h,rollsum_H_10_v,rollsum_BFP_10_h,rollsum_BFP_10_v,rollsum_HR_10_h,rollsum_HR_10_v,rollsum_R_10_h,rollsum_R_10_v,rollsum_ER_10_h,rollsum_ER_10_v,rollsum_BB_10_h,rollsum_BB_10_v,rollsum_IB_10_h,rollsum_IB_10_v,rollsum_SO_10_h,rollsum_SO_10_v,rollsum_SH_10_h,rollsum_SH_10_v,rollsum_SF_10_h,rollsum_SF_10_v,rollsum_WP_10_h,rollsum_WP_10_v,rollsum_HBP_10_h,rollsum_HBP_10_v,rollsum_BK_10_h,rollsum_BK_10_v,rollsum_2B_10_h,rollsum_2B_10_v,rollsum_3B_10_h,rollsum_3B_10_v,rollsum_IP_real_35_h,rollsum_IP_real_35_v,rollsum_H_35_h,rollsum_H_35_v,rollsum_BFP_35_h,rollsum_BFP_35_v,rollsum_HR_35_h,rollsum_HR_35_v,rollsum_R_35_h,rollsum_R_35_v,rollsum_ER_35_h,rollsum_ER_35_v,rollsum_BB_35_h,rollsum_BB_35_v,rollsum_IB_35_h,rollsum_IB_35_v,rollsum_SO_35_h,rollsum_SO_35_v,rollsum_SH_35_h,rollsum_SH_35_v,rollsum_SF_35_h,rollsum_SF_35_v,rollsum_WP_35_h,rollsum_WP_35_v,rollsum_HBP_35_h,rollsum_HBP_35_v,rollsum_BK_35_h,rollsum_BK_35_v,rollsum_2B_35_h,rollsum_2B_35_v,rollsum_3B_35_h,rollsum_3B_35_v,H_BB_roll_10_h,H_BB_roll_10_v,XB_roll_10_h,XB_roll_10_v,TB_roll_10_h,TB_roll_10_v,IP_mod_10_h,IP_mod_10_v,BF_mod_10_h,BF_mod_10_v,ER_mod_10_h,ER_mod_10_v,H_BB_mod_10_h,H_BB_mod_10_v,H_BB_perc_10_h,H_BB_perc_10_v,SO_mod_10_h,SO_mod_10_v,TB_BB_mod_10_h,TB_BB_mod_10_v,ERA_10_h,ERA_10_v,WHIP_10_h,WHIP_10_v,SO_perc_10_h,SO_perc_10_v,TB_BB_perc_10_h,TB_BB_perc_10_v,H_BB_roll_35_h,H_BB_roll_35_v,XB_roll_35_h,XB_roll_35_v,TB_roll_35_h,TB_roll_35_v,IP_mod_35_h,IP_mod_35_v,BF_mod_35_h,BF_mod_35_v,ER_mod_35_h,ER_mod_35_v,H_BB_mod_35_h,H_BB_mod_35_v,H_BB_perc_35_h,H_BB_perc_35_v,SO_mod_35_h,SO_mod_35_v,TB_BB_mod_35_h,TB_BB_mod_35_v,ERA_35_h,ERA_35_v,WHIP_35_h,WHIP_35_v,SO_perc_35_h,SO_perc_35_v,TB_BB_perc_35_h,TB_BB_perc_35_v
4126,19820602,0,Wed,DET,AL,48,CAL,AL,51,5,4,54,N,,,,ANA01,27396.0,184,110030,001200010,35,10,2,0,2,5,0,0,0,2,0,5,0,1,1,0,5,4,4,4,1,0,27,10,1,0,1,0,34,10,1,0,0,3,2,0,0,4,1,5,1,0,1,0,9,4,5,5,0,0,27,16,0,0,1,0,dimul901,Lou DiMuro,merrd901,Durwood Merrill,reilm901,Mike Reilly,barnl901,Larry Barnett,,(none),,(none),andes101,Sparky Anderson,maucg101,Gene Mauch,lopea001,Aurelio Lopez,corbd001,Doug Corbett,tobid001,Dave Tobik,gibsk001,Kirk Gibson,wilcm001,Milt Wilcox,zahng001,Geoff Zahn,lemoc001,Chet Lemon,9,cabee001,Enos Cabell,5,gibsk001,Kirk Gibson,8,iviem101,Mike Ivie,10,hernl001,Larry Herndon,7,parrl001,Lance Parrish,2,broot001,Tom Brookens,4,wockj001,John Wockenfuss,3,trama001,Alan Trammell,6,downb001,Brian Downing,7,carer001,Rod Carew,3,gricb001,Bobby Grich,4,jackr001,Reggie Jackson,9,bayld001,Don Baylor,10,lynnf001,Fred Lynn,8,decid001,Doug DeCinces,5,folit001,Tim Foli,6,boonb001,Bob Boone,2,,Y,1982,-1,0,9,198206020,0.257573,0.259184,0.331349,0.331715,0.382229,0.377551,0.713578,0.709267,73.0,84.0,52.0,66.0,137.0,106.0,0.133929,0.12569,0.443618,0.438494,0.264471,0.26777,0.33723,0.341506,0.399202,0.409932,0.736432,0.751438,9.0,14.0,8.0,21.0,17.0,27.0,0.133929,0.12569,0.458633,0.469352,0.0,0.0,0.5,0.0,,5.333333,0.0,70.0,0.0,65.0,0.0,283.0,0.0,6.0,0.0,24.0,0.0,22.0,0.0,15.0,0.0,3.0,0.0,22.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17.0,0.0,0.0,0.0,231.333333,0.0,246.0,0.0,972.0,0.0,24.0,0.0,117.0,0.0,101.0,0.0,58.0,0.0,5.0,0.0,74.0,0.0,9.0,0.0,2.0,0.0,2.0,0.0,0.0,0.0,2.0,0.0,42.0,0.0,0.0,0.0,80.0,0.0,29.0,0.0,94.0,0.0,70.0,0.0,283.0,0.0,22.0,0.0,80.0,0.0,0.282686,0.0,22.0,0.0,109.0,0.0,2.828571,0.0,1.142857,0.0,0.077739,0.0,0.385159,0.0,304.0,0.0,90.0,0.0,336.0,0.0,231.333333,0.0,972.0,0.0,101.0,0.0,304.0,0.0,0.312757,0.0,74.0,0.0,394.0,0.0,3.929395,0.0,1.314121,0.0,0.076132,0.0,0.40535,0.0
7282,19830828,0,Sun,SFN,NL,130,NYN,NL,128,7,2,54,D,,,,NYC17,14163.0,180,120100201,011000000,37,13,3,1,1,7,0,1,1,4,1,5,0,2,1,0,9,3,2,2,0,2,27,11,0,0,0,0,31,5,1,0,0,2,1,0,1,3,1,6,0,0,0,0,7,5,6,6,0,0,27,12,1,0,1,0,willc901,Charlie Williams,davig901,Gerry Davis,froeb901,Bruce Froemming,tatat901,Terry Tata,,(none),,(none),robif103,Frank Robinson,howaf102,Frank Howard,barrj101,Jim Barr,swanc001,Craig Swan,laveg001,Gary Lavelle,evand001,Darrell Evans,laskb001,Bill Laskey,swanc001,Craig Swan,lemaj001,Johnnie LeMaster,6,venam001,Max Venable,8,clarj001,Jack Clark,9,evand001,Darrell Evans,5,leonj001,Jeffrey Leonard,7,younj001,Joel Youngblood,4,bergd001,Dave Bergman,3,brenb001,Bob Brenly,2,laskb001,Bill Laskey,1,wilsm001,Mookie Wilson,8,bailb001,Bob Bailor,5,hernk001,Keith Hernandez,3,fostg001,George Foster,7,strad001,Darryl Strawberry,9,hodgr001,Ron Hodges,2,gileb001,Brian Giles,4,oquej001,Jose Oquendo,6,swanc001,Craig Swan,1,,Y,1983,-5,0,9,198308280,0.239867,0.247876,0.297463,0.325605,0.341562,0.377724,0.639025,0.703329,136.0,146.0,66.0,64.0,143.0,169.0,0.177763,0.162637,0.391452,0.442034,0.252456,0.260958,0.299263,0.326208,0.357564,0.373089,0.656827,0.699297,29.0,21.0,12.0,14.0,19.0,27.0,0.177763,0.162637,0.39779,0.428439,0.0,0.0,0.5,0.0,,1.666667,0.0,41.666667,0.0,49.0,0.0,182.0,0.0,6.0,0.0,27.0,0.0,27.0,0.0,17.0,0.0,3.0,0.0,16.0,0.0,1.0,0.0,3.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,14.0,0.0,2.0,0.0,155.333333,0.0,163.0,0.0,661.0,0.0,18.0,0.0,83.0,0.0,78.0,0.0,53.0,0.0,3.0,0.0,70.0,0.0,4.0,0.0,6.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,32.0,0.0,5.0,0.0,66.0,0.0,30.0,0.0,79.0,0.0,41.666667,0.0,182.0,0.0,27.0,0.0,66.0,0.0,0.362637,0.0,16.0,0.0,96.0,0.0,5.832,0.0,1.584,0.0,0.087912,0.0,0.527473,0.0,216.0,0.0,78.0,0.0,241.0,0.0,155.333333,0.0,661.0,0.0,78.0,0.0,216.0,0.0,0.326778,0.0,70.0,0.0,294.0,0.0,4.519313,0.0,1.390558,0.0,0.1059,0.0,0.444781,0.0
12469,19860526,0,Mon,CIN,NL,40,CHN,NL,42,6,9,51,D,,,,CHI11,25723.0,167,50000001,50400000x,33,8,1,0,1,6,0,0,0,7,0,6,0,0,2,0,7,3,9,9,0,0,24,9,0,0,1,0,32,9,2,0,2,9,0,0,0,5,0,4,1,0,1,0,4,3,6,6,0,0,27,8,0,0,2,0,froeb901,Bruce Froemming,marsr901,Randy Marsh,davib902,Bob Davidson,kiblj901,John Kibler,,(none),,(none),rosep001,Pete Rose,freyj801,Jim Frey,ecked001,Dennis Eckersley,terrs001,Scott Terry,smitl001,Lee Smith,trilm001,Manny Trillo,sotom001,Mario Soto,ecked001,Dennis Eckersley,milne001,Eddie Milner,8,rosep001,Pete Rose,3,parkd001,Dave Parker,9,esasn001,Nick Esasky,7,bellb001,Buddy Bell,5,concd001,Dave Concepcion,4,stilk001,Kurt Stillwell,6,diazb001,Bo Diaz,2,sotom001,Mario Soto,1,dunss001,Shawon Dunston,6,loped001,Davey Lopes,7,sandr001,Ryne Sandberg,4,morek001,Keith Moreland,9,durhl001,Leon Durham,3,mumpj001,Jerry Mumphrey,8,davij001,Jody Davis,2,trilm001,Manny Trillo,5,ecked001,Dennis Eckersley,1,,Y,1986,3,1,15,198605260,0.256001,0.251192,0.323616,0.324624,0.391795,0.372387,0.715411,0.697011,151.0,157.0,59.0,69.0,128.0,118.0,0.154723,0.144038,0.447068,0.433934,0.251976,0.223447,0.320467,0.311111,0.397233,0.324649,0.7177,0.63576,21.0,24.0,16.0,9.0,20.0,23.0,0.154723,0.144038,0.452424,0.400889,0.0,0.0,0.5,0.0,,7.0,0.0,62.666667,0.0,78.0,0.0,271.0,0.0,8.0,0.0,39.0,0.0,39.0,0.0,11.0,0.0,2.0,0.0,44.0,0.0,4.0,0.0,3.0,0.0,0.0,0.0,2.0,0.0,2.0,0.0,20.0,0.0,5.0,0.0,231.0,0.0,220.0,0.0,929.0,0.0,22.0,0.0,97.0,0.0,94.0,0.0,29.0,0.0,5.0,0.0,159.0,0.0,11.0,0.0,4.0,0.0,0.0,0.0,5.0,0.0,5.0,0.0,42.0,0.0,8.0,0.0,89.0,0.0,46.0,0.0,124.0,0.0,62.666667,0.0,271.0,0.0,39.0,0.0,89.0,0.0,0.328413,0.0,44.0,0.0,135.0,0.0,5.601064,0.0,1.420213,0.0,0.162362,0.0,0.498155,0.0,249.0,0.0,102.0,0.0,322.0,0.0,231.0,0.0,929.0,0.0,94.0,0.0,249.0,0.0,0.26803,0.0,159.0,0.0,351.0,0.0,3.662338,0.0,1.077922,0.0,0.171152,0.0,0.377826,0.0
22229,19900916,0,Sun,CLE,AL,147,KCA,AL,146,6,9,51,D,,,,KAN06,23806.0,179,4000200,31200030x,39,12,2,0,0,5,0,1,0,3,0,10,4,0,0,0,10,3,8,8,2,0,24,12,1,0,1,0,35,13,1,0,4,8,1,0,0,5,0,4,0,1,1,0,8,4,5,5,1,0,27,9,1,0,0,0,barnl901,Larry Barnett,koscg901,Greg Kosc,morrd901,Dan Morrison,phild901,Dave Phillips,,(none),,(none),mcnaj801,John McNamara,wathj001,John Wathan,montj002,Jeff Montgomery,valde001,Efrain Valdez,,(none),jackb001,Bo Jackson,candt001,Tom Candiotti,wagnh001,Hector Wagner,colea001,Alex Cole,8,fermf001,Felix Fermin,6,browj001,Jerry Browne,4,aloms001,Sandy Alomar,2,jamec001,Chris James,10,baerc001,Carlos Baerga,5,wardt001,Turner Ward,9,mantj001,Jeff Manto,3,jeffs001,Stan Jefferson,7,mcrab001,Brian McRae,8,seitk001,Kevin Seitzer,5,bretg001,George Brett,10,jackb001,Bo Jackson,7,perrg001,Gerald Perry,3,eisej001,Jim Eisenreich,9,stilk001,Kurt Stillwell,6,pecob001,Bill Pecota,4,boonb001,Bob Boone,2,,Y,1990,3,1,15,199009160,0.265605,0.2584,0.326866,0.315408,0.389542,0.378561,0.716408,0.693969,116.0,90.0,58.0,53.0,116.0,119.0,0.147761,0.145314,0.440464,0.426332,0.248975,0.278054,0.314953,0.333028,0.376025,0.408143,0.690978,0.741171,19.0,16.0,9.0,16.0,25.0,22.0,0.147761,0.145314,0.430841,0.453211,0.0,0.0,0.5,0.0,,2.333333,0.0,6.333333,0.0,10.0,0.0,31.0,0.0,0.0,0.0,6.0,0.0,5.0,0.0,3.0,0.0,1.0,0.0,2.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,6.333333,0.0,10.0,0.0,31.0,0.0,0.0,0.0,6.0,0.0,5.0,0.0,3.0,0.0,1.0,0.0,2.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,13.0,0.0,2.0,0.0,12.0,0.0,30.0,0.0,120.0,0.0,18.148148,0.0,48.5,0.0,0.38275,0.0,19.8,0.0,55.05,0.0,5.444444,0.0,1.616667,0.0,0.165,0.0,0.45875,0.0,13.0,0.0,2.0,0.0,12.0,0.0,105.0,0.0,420.0,0.0,59.814815,0.0,161.0,0.0,0.373643,0.0,79.8,0.0,190.05,0.0,5.126984,0.0,1.533333,0.0,0.19,0.0,0.4525,0.0
26172,19920825,0,Tue,CHN,NL,125,SDN,NL,125,4,7,51,N,,,,SAN01,14984.0,153,400,20010031x,36,10,1,0,0,4,0,0,0,2,0,8,0,0,0,0,7,4,7,7,0,0,24,14,0,0,0,0,29,9,3,0,3,7,1,0,0,5,2,1,0,2,0,0,4,3,4,4,0,0,27,3,0,0,1,0,wintm901,Mike Winters,froeb901,Bruce Froemming,monte901,Ed Montague,bellw901,Wally Bell,,(none),,(none),lefej101,Jim Lefebvre,riddg801,Greg Riddoch,maddm002,Mike Maddux,pattk001,Ken Patterson,myerr001,Randy Myers,santb001,Benito Santiago,harkm001,Mike Harkey,deshj001,Jim Deshaies,dascd001,Doug Dascenzo,8,sandr001,Ryne Sandberg,4,gracm001,Mark Grace,3,dawsa001,Andre Dawson,9,buecs001,Steve Buechele,5,salal001,Luis Salazar,7,giraj001,Joe Girardi,2,sancr001,Rey Sanchez,6,harkm001,Mike Harkey,1,fernt001,Tony Fernandez,6,azoco001,Oscar Azocar,7,shefg001,Gary Sheffield,5,mcgrf001,Fred McGriff,3,jackd002,Darrin Jackson,8,santb001,Benito Santiago,2,clarj002,Jerald Clark,9,stilk001,Kurt Stillwell,4,deshj001,Jim Deshaies,1,,Y,1992,3,1,11,199208250,0.254234,0.246429,0.312341,0.300436,0.386046,0.360875,0.698387,0.661311,83.0,92.0,55.0,53.0,118.0,122.0,0.14955,0.14149,0.433882,0.40668,0.24368,0.272052,0.287619,0.315284,0.380182,0.386258,0.667801,0.701542,10.0,16.0,5.0,12.0,21.0,21.0,0.14955,0.14149,0.41619,0.422707,0.0,0.0,0.5,0.0,,6.333333,0.0,64.666667,0.0,54.0,0.0,258.0,0.0,5.0,0.0,21.0,0.0,20.0,0.0,27.0,0.0,0.0,0.0,45.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,1.0,0.0,12.0,0.0,0.0,0.0,209.333333,0.0,192.0,0.0,875.0,0.0,21.0,0.0,103.0,0.0,101.0,0.0,93.0,0.0,5.0,0.0,125.0,0.0,5.0,0.0,7.0,0.0,0.0,0.0,2.0,0.0,6.0,0.0,45.0,0.0,5.0,0.0,81.0,0.0,22.0,0.0,76.0,0.0,64.666667,0.0,258.0,0.0,20.0,0.0,81.0,0.0,0.313953,0.0,45.0,0.0,103.0,0.0,2.783505,0.0,1.252577,0.0,0.174419,0.0,0.399225,0.0,285.0,0.0,97.0,0.0,289.0,0.0,209.333333,0.0,875.0,0.0,101.0,0.0,285.0,0.0,0.325714,0.0,125.0,0.0,382.0,0.0,4.342357,0.0,1.361465,0.0,0.142857,0.0,0.436571,0.0
26769,19930415,0,Thu,SLN,NL,9,LAN,NL,10,4,2,54,N,,,,LOS03,42171.0,171,200000020,110000000,28,7,0,0,0,3,0,1,0,7,2,5,0,3,1,0,5,2,2,2,0,0,27,12,0,0,0,0,34,7,1,0,1,2,0,0,0,0,0,2,1,0,0,0,5,2,4,4,1,1,27,12,0,0,1,0,tatat901,Terry Tata,grege901,Eric Gregg,davig901,Gerry Davis,bonig901,Greg Bonin,,(none),,(none),torrj101,Joe Torre,lasot101,Tom Lasorda,arocr001,Rene Arocha,grosk001,Kevin Gross,smitl001,Lee Smith,zeilt001,Todd Zeile,tewkb001,Bob Tewksbury,astap001,Pedro Astacio,penag001,Geronimo Pena,4,smito001,Ozzie Smith,6,jeffg001,Gregg Jefferies,3,lankr001,Ray Lankford,8,whitm001,Mark Whiten,9,zeilt001,Todd Zeile,5,jordb001,Brian Jordan,7,villh001,Hector Villanueva,2,tewkb001,Bob Tewksbury,1,butlb001,Brett Butler,8,reedj003,Jody Reed,4,piazm001,Mike Piazza,2,karre001,Eric Karros,3,wallt001,Tim Wallach,5,snydc001,Cory Snyder,9,websm001,Mitch Webster,7,offej001,Jose Offerman,6,astap001,Pedro Astacio,1,,Y,1993,-2,0,6,199304150,0.245813,0.261956,0.310597,0.322633,0.331969,0.375981,0.642566,0.698615,145.0,201.0,78.0,120.0,173.0,98.0,0.151556,0.162954,0.389352,0.427285,0.232512,0.26361,0.300718,0.333045,0.300493,0.378223,0.601211,0.711268,19.0,29.0,13.0,28.0,23.0,26.0,0.151556,0.162954,0.362657,0.436851,0.0,0.0,0.5,0.0,,7.0,0.0,73.0,0.0,72.0,0.0,303.0,0.0,1.0,0.0,21.0,0.0,17.0,0.0,17.0,0.0,2.0,0.0,37.0,0.0,3.0,0.0,2.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,7.0,0.0,2.0,0.0,89.0,0.0,84.0,0.0,369.0,0.0,2.0,0.0,25.0,0.0,20.0,0.0,23.0,0.0,4.0,0.0,49.0,0.0,3.0,0.0,3.0,0.0,1.0,0.0,2.0,0.0,0.0,0.0,9.0,0.0,2.0,0.0,89.0,0.0,13.0,0.0,85.0,0.0,73.0,0.0,303.0,0.0,17.0,0.0,89.0,0.0,0.293729,0.0,37.0,0.0,102.0,0.0,2.09589,0.0,1.219178,0.0,0.122112,0.0,0.336634,0.0,107.0,0.0,17.0,0.0,101.0,0.0,105.0,0.0,420.0,0.0,28.888889,0.0,131.0,0.0,0.29969,0.0,59.2,0.0,146.95,0.0,2.47619,0.0,1.247619,0.0,0.140952,0.0,0.349881,0.0
29476,19940520,0,Fri,SLN,NL,40,FLO,NL,41,3,2,54,N,,,,MIA01,31512.0,193,102000,000002000,31,6,2,0,0,3,0,0,0,10,2,4,1,1,0,0,11,5,2,2,0,0,27,13,0,0,2,0,33,9,2,0,0,2,1,0,1,2,0,4,0,0,2,0,8,4,3,3,0,0,27,13,1,0,0,0,marsr901,Randy Marsh,hirsm901,Mark Hirschbeck,vanol901,Larry Vanover,relic901,Charlie Reliford,,(none),,(none),torrj101,Joe Torre,lachr101,Rene Lachemann,everb001,Bryan Eversgerd,gardm001,Mark Gardner,perem002,Mike Perez,jordb001,Brian Jordan,cormr001,Rheal Cormier,gardm001,Mark Gardner,lankr001,Ray Lankford,8,smito001,Ozzie Smith,6,jeffg001,Gregg Jefferies,3,zeilt001,Todd Zeile,5,whitm001,Mark Whiten,9,jordb001,Brian Jordan,7,pagnt001,Tom Pagnozzi,2,alicl001,Luis Alicea,4,cormr001,Rheal Cormier,1,carrc001,Chuck Carr,8,abbok002,Kurt Abbott,6,santb001,Benito Santiago,2,conij001,Jeff Conine,7,desto001,Orestes Destrade,3,magad001,Dave Magadan,5,everc001,Carl Everett,9,barbb001,Bret Barberie,4,gardm001,Mark Gardner,1,,Y,1994,-1,0,5,199405200,0.251415,0.272448,0.312311,0.34616,0.363885,0.408491,0.676197,0.754652,109.0,147.0,47.0,73.0,127.0,153.0,0.182489,0.149375,0.415632,0.46842,0.270138,0.250499,0.345374,0.333037,0.398821,0.40519,0.744196,0.738227,24.0,24.0,5.0,15.0,23.0,17.0,0.182489,0.149375,0.460793,0.470693,0.0,0.0,0.5,0.0,,5.666667,0.0,29.0,0.0,32.0,0.0,124.0,0.0,7.0,0.0,25.0,0.0,23.0,0.0,9.0,0.0,0.0,0.0,15.0,0.0,2.0,0.0,4.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,8.0,0.0,2.0,0.0,155.0,0.0,156.0,0.0,661.0,0.0,24.0,0.0,109.0,0.0,103.0,0.0,53.0,0.0,0.0,0.0,93.0,0.0,5.0,0.0,11.0,0.0,4.0,0.0,9.0,0.0,0.0,0.0,41.0,0.0,4.0,0.0,41.0,0.0,26.0,0.0,58.0,0.0,30.0,0.0,124.0,0.0,23.555556,0.0,42.5,0.0,0.330645,0.0,15.0,0.0,67.0,0.0,7.066667,0.0,1.416667,0.0,0.120968,0.0,0.540323,0.0,209.0,0.0,97.0,0.0,253.0,0.0,155.0,0.0,661.0,0.0,103.0,0.0,209.0,0.0,0.316188,0.0,93.0,0.0,306.0,0.0,5.980645,0.0,1.348387,0.0,0.140696,0.0,0.462935,0.0
30179,19940716,0,Sat,LAN,NL,91,PHI,NL,91,6,10,51,N,,,,PHI12,46679.0,170,110030100,01503001x,35,12,1,0,1,6,0,1,0,3,0,2,0,0,3,0,6,4,6,6,1,0,24,12,3,0,2,0,35,11,2,1,2,9,0,1,0,5,1,3,1,0,2,0,7,3,6,6,0,0,27,12,0,0,3,0,wendh901,Harry Wendelstedt,relic901,Charlie Reliford,hirsm901,Mark Hirschbeck,riekr901,Rich Rieker,,(none),,(none),lasot101,Tom Lasorda,fregj101,Jim Fregosi,munob001,Bobby Munoz,martr002,Ramon Martinez,borlt001,Toby Borland,eisej001,Jim Eisenreich,herso001,Orel Hershiser,munob001,Bobby Munoz,butlb001,Brett Butler,8,deshd001,Delino DeShields,4,piazm001,Mike Piazza,2,wallt001,Tim Wallach,5,rodrh001,Henry Rodriguez,7,mondr002,Raul Mondesi,9,karre001,Eric Karros,3,bourr001,Rafael Bournigal,6,herso001,Orel Hershiser,1,hatcb001,Billy Hatcher,8,duncm001,Mariano Duncan,5,thomm001,Milt Thompson,7,krukj001,John Kruk,3,eisej001,Jim Eisenreich,9,moram001,Mickey Morandini,4,liebm001,Mike Lieberthal,2,stock001,Kevin Stocker,6,munob001,Bobby Munoz,1,,Y,1994,4,1,16,199407160,0.27,0.266019,0.342342,0.327839,0.408214,0.404428,0.750557,0.732267,90.0,99.0,35.0,52.0,136.0,130.0,0.164897,0.154607,0.46686,0.45459,0.251734,0.249246,0.321653,0.310886,0.360753,0.374874,0.682406,0.68576,20.0,10.0,9.0,8.0,22.0,21.0,0.164897,0.154607,0.420485,0.426199,0.0,0.0,0.5,0.0,,5.0,0.0,60.0,0.0,52.0,0.0,257.0,0.0,5.0,0.0,18.0,0.0,11.0,0.0,25.0,0.0,0.0,0.0,43.0,0.0,3.0,0.0,2.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0,90.333333,0.0,91.0,0.0,402.0,0.0,6.0,0.0,41.0,0.0,32.0,0.0,42.0,0.0,1.0,0.0,57.0,0.0,4.0,0.0,5.0,0.0,5.0,0.0,1.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,77.0,0.0,17.0,0.0,69.0,0.0,60.0,0.0,257.0,0.0,11.0,0.0,77.0,0.0,0.299611,0.0,43.0,0.0,94.0,0.0,1.65,0.0,1.283333,0.0,0.167315,0.0,0.365759,0.0,133.0,0.0,31.0,0.0,122.0,0.0,105.0,0.0,420.0,0.0,40.148148,0.0,155.0,0.0,0.332524,0.0,60.6,0.0,172.1,0.0,3.44127,0.0,1.47619,0.0,0.144286,0.0,0.409762,0.0
39400,19980920,0,Sun,SLN,NL,157,MIL,NL,156,11,6,54,D,,,,MIL05,52831.0,208,213030002,000105000,36,10,1,0,5,10,0,1,0,5,0,5,2,0,0,0,4,6,6,6,0,0,27,6,0,0,0,0,39,13,4,0,0,6,0,1,0,6,0,11,0,0,0,0,13,6,10,10,0,0,27,8,1,0,0,0,crawj901,Jerry Crawford,gormb901,Brian Gorman,davib902,Bob Davidson,wintm901,Mike Winters,,(none),,(none),larut101,Tony LaRussa,garnp001,Phil Garner,aybam001,Manny Aybar,karls001,Scott Karl,,(none),mcgwm001,Mark McGwire,merck001,Kent Mercker,karls001,Scott Karl,kellp001,Pat Kelly,4,tatif001,Fernando Tatis,5,mcgwm001,Mark McGwire,3,jordb001,Brian Jordan,8,gantr001,Ron Gant,7,marre001,Eli Marrero,2,ordal001,Luis Ordaz,6,merck001,Kent Mercker,1,littm001,Mark Little,9,vinaf001,Fernando Vina,4,lorem001,Mark Loretta,3,cirij001,Jeff Cirillo,5,burnj001,Jeromy Burnitz,9,grism001,Marquis Grissom,8,jackd002,Darrin Jackson,7,mathm001,Mike Matheny,2,valej003,Jose Valentin,6,karls001,Scott Karl,1,,Y,1998,-5,0,17,199809200,0.259567,0.256861,0.325329,0.336908,0.397834,0.434081,0.723163,0.770989,86.0,139.0,60.0,40.0,109.0,139.0,0.169901,0.18806,0.451316,0.495038,0.276852,0.251266,0.324978,0.343111,0.448148,0.445795,0.773127,0.788906,9.0,29.0,5.0,5.0,21.0,31.0,0.169901,0.18806,0.484875,0.513778,0.0,0.0,0.5,0.0,,3.0,0.0,60.0,0.0,73.0,0.0,262.0,0.0,6.0,0.0,35.0,0.0,35.0,0.0,18.0,0.0,0.0,0.0,29.0,0.0,5.0,0.0,2.0,0.0,4.0,0.0,2.0,0.0,0.0,0.0,14.0,0.0,1.0,0.0,204.666667,0.0,237.0,0.0,902.0,0.0,21.0,0.0,112.0,0.0,101.0,0.0,69.0,0.0,4.0,0.0,108.0,0.0,14.0,0.0,4.0,0.0,7.0,0.0,5.0,0.0,0.0,0.0,57.0,0.0,3.0,0.0,91.0,0.0,28.0,0.0,101.0,0.0,60.0,0.0,262.0,0.0,35.0,0.0,91.0,0.0,0.347328,0.0,29.0,0.0,119.0,0.0,5.25,0.0,1.516667,0.0,0.110687,0.0,0.454198,0.0,306.0,0.0,105.0,0.0,342.0,0.0,204.666667,0.0,902.0,0.0,101.0,0.0,306.0,0.0,0.339246,0.0,108.0,0.0,411.0,0.0,4.441368,0.0,1.495114,0.0,0.119734,0.0,0.455654,0.0
48452,20020806,0,Tue,MIN,AL,114,BAL,AL,110,2,9,51,N,,,,BAL12,33858.0,167,2000,00010260x,34,7,0,0,1,2,0,0,0,1,0,5,0,0,1,0,6,3,9,9,2,0,24,6,0,0,0,0,31,7,0,0,2,8,0,0,0,7,0,10,0,0,0,0,5,4,2,2,0,0,27,12,2,0,1,0,kulpr901,Ron Kulpa,scotd901,Dale Scott,joycj901,Jim Joyce,nelsj901,Jeff Nelson,,(none),,(none),gardr001,Ron Gardenhire,hargm001,Mike Hargrove,ponss001,Sidney Ponson,santj003,Johan Santana,,(none),cordm001,Marty Cordova,milte001,Eric Milton,ponss001,Sidney Ponson,jonej003,Jacque Jones,7,guzmc001,Cristian Guzman,6,mohrd001,Dustan Mohr,9,ortid001,David Ortiz,10,huntt001,Torii Hunter,8,miend001,Doug Mientkiewicz,3,cuddm001,Michael Cuddyer,5,piera001,A.J. Pierzynski,2,rival001,Luis Rivas,4,moram002,Melvin Mora,8,lopel002,Luis Lopez,6,mattg002,Gary Matthews,9,batit001,Tony Batista,5,cordm001,Marty Cordova,7,leonj002,Jose Leon,3,richc001,Chris Richard,10,gil-g001,Geronimo Gil,2,hairj002,Jerry Hairston,4,,Y,2002,7,1,11,200208060,0.252224,0.274297,0.312406,0.335236,0.402579,0.43681,0.714985,0.772046,143.0,109.0,50.0,71.0,100.0,90.0,0.172984,0.181477,0.45066,0.484102,0.267308,0.285578,0.324468,0.346154,0.426923,0.468004,0.751391,0.814158,27.0,15.0,10.0,14.0,18.0,11.0,0.172984,0.181477,0.471631,0.513112,0.0,0.0,0.5,0.0,,6.666667,0.0,57.666667,0.0,56.0,0.0,239.0,0.0,7.0,0.0,25.0,0.0,23.0,0.0,23.0,0.0,0.0,0.0,38.0,0.0,0.0,0.0,3.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,8.0,0.0,1.0,0.0,212.0,0.0,230.0,0.0,911.0,0.0,30.0,0.0,116.0,0.0,109.0,0.0,72.0,0.0,0.0,0.0,129.0,0.0,4.0,0.0,4.0,0.0,2.0,0.0,7.0,0.0,0.0,0.0,47.0,0.0,4.0,0.0,79.0,0.0,24.0,0.0,80.0,0.0,57.666667,0.0,239.0,0.0,23.0,0.0,79.0,0.0,0.330544,0.0,38.0,0.0,103.0,0.0,3.589595,0.0,1.369942,0.0,0.158996,0.0,0.430962,0.0,302.0,0.0,115.0,0.0,345.0,0.0,212.0,0.0,911.0,0.0,109.0,0.0,302.0,0.0,0.331504,0.0,129.0,0.0,417.0,0.0,4.627358,0.0,1.424528,0.0,0.141603,0.0,0.457739,0.0


In [22]:
df.loc[df.IP_mod_10_h==0]

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,SObat_perc_162_h,SObat_perc_162_v,SLGmod_162_h,SLGmod_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,SObat_perc_30_h,SObat_perc_30_v,SLGmod_30_h,SLGmod_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,IP_real_h,IP_real_v,rollsum_IP_real_10_h,rollsum_IP_real_10_v,rollsum_H_10_h,rollsum_H_10_v,rollsum_BFP_10_h,rollsum_BFP_10_v,rollsum_HR_10_h,rollsum_HR_10_v,rollsum_R_10_h,rollsum_R_10_v,rollsum_ER_10_h,rollsum_ER_10_v,rollsum_BB_10_h,rollsum_BB_10_v,rollsum_IB_10_h,rollsum_IB_10_v,rollsum_SO_10_h,rollsum_SO_10_v,rollsum_SH_10_h,rollsum_SH_10_v,rollsum_SF_10_h,rollsum_SF_10_v,rollsum_WP_10_h,rollsum_WP_10_v,rollsum_HBP_10_h,rollsum_HBP_10_v,rollsum_BK_10_h,rollsum_BK_10_v,rollsum_2B_10_h,rollsum_2B_10_v,rollsum_3B_10_h,rollsum_3B_10_v,rollsum_IP_real_35_h,rollsum_IP_real_35_v,rollsum_H_35_h,rollsum_H_35_v,rollsum_BFP_35_h,rollsum_BFP_35_v,rollsum_HR_35_h,rollsum_HR_35_v,rollsum_R_35_h,rollsum_R_35_v,rollsum_ER_35_h,rollsum_ER_35_v,rollsum_BB_35_h,rollsum_BB_35_v,rollsum_IB_35_h,rollsum_IB_35_v,rollsum_SO_35_h,rollsum_SO_35_v,rollsum_SH_35_h,rollsum_SH_35_v,rollsum_SF_35_h,rollsum_SF_35_v,rollsum_WP_35_h,rollsum_WP_35_v,rollsum_HBP_35_h,rollsum_HBP_35_v,rollsum_BK_35_h,rollsum_BK_35_v,rollsum_2B_35_h,rollsum_2B_35_v,rollsum_3B_35_h,rollsum_3B_35_v,H_BB_roll_10_h,H_BB_roll_10_v,XB_roll_10_h,XB_roll_10_v,TB_roll_10_h,TB_roll_10_v,IP_mod_10_h,IP_mod_10_v,BF_mod_10_h,BF_mod_10_v,ER_mod_10_h,ER_mod_10_v,H_BB_mod_10_h,H_BB_mod_10_v,H_BB_perc_10_h,H_BB_perc_10_v,SO_mod_10_h,SO_mod_10_v,TB_BB_mod_10_h,TB_BB_mod_10_v,ERA_10_h,ERA_10_v,WHIP_10_h,WHIP_10_v,SO_perc_10_h,SO_perc_10_v,TB_BB_perc_10_h,TB_BB_perc_10_v,H_BB_roll_35_h,H_BB_roll_35_v,XB_roll_35_h,XB_roll_35_v,TB_roll_35_h,TB_roll_35_v,IP_mod_35_h,IP_mod_35_v,BF_mod_35_h,BF_mod_35_v,ER_mod_35_h,ER_mod_35_v,H_BB_mod_35_h,H_BB_mod_35_v,H_BB_perc_35_h,H_BB_perc_35_v,SO_mod_35_h,SO_mod_35_v,TB_BB_mod_35_h,TB_BB_mod_35_v,ERA_35_h,ERA_35_v,WHIP_35_h,WHIP_35_v,SO_perc_35_h,SO_perc_35_v,TB_BB_perc_35_h,TB_BB_perc_35_v
15386,19870803,0,Mon,PHI,NL,104,NYN,NL,105,2,3,65,N,,,,NYC17,50297.0,209,200000000,20000000001,38,7,1,0,1,2,2,0,0,6,1,4,0,0,1,0,11,3,3,3,0,0,32,6,0,0,0,0,36,5,1,0,2,3,0,0,0,3,1,6,0,1,0,0,4,4,2,2,0,0,33,20,1,0,1,0,westj901,Joe West,darlg901,Gary Darling,marsr901,Randy Marsh,rungp901,Paul Runge,,(none),,(none),elial101,Lee Elia,johnd105,Davey Johnson,mcdor001,Roger McDowell,tekuk001,Kent Tekulve,,(none),hernk001,Keith Hernandez,carmd001,Don Carman,ferns001,Sid Fernandez,samuj001,Juan Samuel,4,schur001,Rick Schu,3,hayev001,Von Hayes,8,schmm001,Mike Schmidt,5,parrl001,Lance Parrish,2,jamec001,Chris James,7,wilsg001,Glenn Wilson,9,jelts001,Steve Jeltz,6,carmd001,Don Carman,1,wilsm001,Mookie Wilson,8,teuft001,Tim Teufel,4,hernk001,Keith Hernandez,3,strad001,Darryl Strawberry,9,mcrek001,Kevin McReynolds,7,cartg001,Gary Carter,2,johnh001,Howard Johnson,6,magad001,Dave Magadan,5,ferns001,Sid Fernandez,1,,Y,1987,1,1,5,198708030,0.268468,0.256811,0.339945,0.326043,0.421081,0.418446,0.761026,0.74449,133.0,129.0,46.0,56.0,143.0,128.0,0.1629,0.189649,0.477646,0.472621,0.276329,0.273892,0.35039,0.354641,0.426087,0.463054,0.776477,0.817695,36.0,23.0,8.0,10.0,29.0,20.0,0.1629,0.189649,0.484822,0.522767,0.0,0.0,0.5,0.0,,0.0,8.0,0.0,53.0,0.0,63.0,0.0,241.0,0.0,13.0,0.0,38.0,0.0,34.0,0.0,20.0,0.0,3.0,0.0,25.0,0.0,5.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,18.0,0.0,1.0,0.0,212.666667,0.0,189.0,0.0,884.0,0.0,31.0,0.0,98.0,0.0,91.0,0.0,76.0,0.0,11.0,0.0,129.0,0.0,8.0,0.0,6.0,0.0,3.0,0.0,5.0,0.0,3.0,0.0,44.0,0.0,4.0,0.0,83.0,0.0,46.0,0.0,109.0,0.0,53.0,0.0,241.0,0.0,34.0,0.0,83.0,0.0,0.344398,0.0,25.0,0.0,129.0,0.0,5.773585,0.0,1.566038,0.0,0.103734,0.0,0.53527,0.0,265.0,0.0,114.0,0.0,303.0,0.0,212.666667,0.0,884.0,0.0,91.0,0.0,265.0,0.0,0.299774,0.0,129.0,0.0,379.0,0.0,3.851097,0.0,1.246082,0.0,0.145928,0.0,0.428733
21820,19900813,0,Mon,SFN,NL,114,CIN,NL,113,5,6,51,N,,,,CIN08,34868.0,165,400000100,01050000x,32,7,1,0,1,5,1,0,1,4,0,10,0,0,1,0,6,4,6,6,1,0,24,11,0,0,1,0,29,7,2,0,0,6,1,0,0,2,0,4,1,0,1,0,2,4,5,5,0,0,27,6,0,0,1,0,marsr901,Randy Marsh,wendh901,Harry Wendelstedt,westj901,Joe West,barnr901,Ron Barnes,,(none),,(none),crair101,Roger Craig,pinil001,Lou Piniella,layat001,Tim Layana,wilst002,Trevor Wilson,myerr001,Randy Myers,olivj001,Joe Oliver,wilst002,Trevor Wilson,jackd001,Danny Jackson,butlb001,Brett Butler,8,littg001,Greg Litton,9,clarw001,Will Clark,3,mitck001,Kevin Mitchell,7,willm003,Matt Williams,5,cartg001,Gary Carter,2,thomr003,Robby Thompson,4,uribj001,Jose Uribe,6,wilst002,Trevor Wilson,1,davie001,Eric Davis,8,benzt001,Todd Benzinger,3,larkb001,Barry Larkin,6,saboc001,Chris Sabo,5,bragg001,Glenn Braggs,7,oneip001,Paul O'Neill,9,duncm001,Mariano Duncan,4,olivj001,Joe Oliver,2,jackd001,Danny Jackson,1,,Y,1990,1,1,11,199008130,0.256512,0.257348,0.314849,0.315494,0.38818,0.391398,0.703029,0.706892,167.0,104.0,56.0,50.0,108.0,100.0,0.167853,0.170631,0.436186,0.439049,0.24572,0.247535,0.302607,0.300642,0.389728,0.36785,0.692335,0.668492,22.0,18.0,15.0,12.0,23.0,25.0,0.167853,0.170631,0.435754,0.412466,0.0,0.0,0.5,0.0,,0.0,3.333333,0.0,62.333333,0.0,50.0,0.0,262.0,0.0,6.0,0.0,29.0,0.0,26.0,0.0,26.0,0.0,0.0,0.0,34.0,0.0,4.0,0.0,2.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,150.666667,0.0,116.0,0.0,627.0,0.0,11.0,0.0,69.0,0.0,61.0,0.0,69.0,0.0,0.0,0.0,89.0,0.0,12.0,0.0,4.0,0.0,3.0,0.0,5.0,0.0,3.0,0.0,16.0,0.0,2.0,0.0,76.0,0.0,18.0,0.0,68.0,0.0,62.333333,0.0,262.0,0.0,26.0,0.0,76.0,0.0,0.290076,0.0,34.0,0.0,94.0,0.0,3.754011,0.0,1.219251,0.0,0.129771,0.0,0.358779,0.0,185.0,0.0,42.0,0.0,158.0,0.0,150.666667,0.0,627.0,0.0,61.0,0.0,185.0,0.0,0.295056,0.0,89.0,0.0,227.0,0.0,3.643805,0.0,1.227876,0.0,0.141946,0.0,0.362041
96165,20220928,0,Wed,KCA,AL,155,DET,AL,154,1,2,51,N,,,,DET05,12610.0,170,100000000,20000000x,35,10,0,0,1,1,0,0,0,6,0,7,0,2,0,0,13,3,2,2,0,0,24,7,1,0,1,0,30,6,1,0,1,2,0,0,0,2,0,8,0,0,1,0,6,7,1,1,0,0,27,10,0,1,0,0,drecb901,Bruce Dreckman,vondc901,Clint Vondrak,conrc901,Chris Conroy,rehaj901,Jeremie Rehak,,(none),,(none),mathm001,Mike Matheny,hinca001,A.J. Hinch,norrd002,Daniel Norris,lyncd001,Daniel Lynch,sotog003,Gregory Soto,cabrm001,Miguel Cabrera,lyncd001,Daniel Lynch,mannm001,Matt Manning,melem001,MJ Melendez,2,massm001,Michael Massey,4,peres002,Salvador Perez,10,pasqv001,Vinnie Pasquantino,3,olive001,Edward Olivares,7,dozih001,Hunter Dozier,5,wated001,Drew Waters,8,isbek001,Kyle Isbel,9,lopen001,Nicky Lopez,6,greer003,Riley Greene,8,baezj001,Javier Baez,6,haase001,Eric Haase,2,cabrm001,Miguel Cabrera,10,torks001,Spencer Torkelson,3,castw003,Willi Castro,9,kreir001,Ryan Kreidler,4,candj002,Jeimer Candelario,5,reyev001,Victor Reyes,7,,Y,2022,1,1,3,202209280,0.231784,0.245714,0.28346,0.304791,0.345725,0.382488,0.629185,0.68728,54.0,107.0,22.0,33.0,92.0,84.0,0.245319,0.216955,0.389736,0.430853,0.246349,0.25496,0.294439,0.311009,0.389484,0.409722,0.683923,0.720731,6.0,25.0,3.0,6.0,18.0,10.0,0.245319,0.216955,0.428441,0.454128,0.570815,0.44843,0.561192,7.5,U,0.0,6.0,0.0,49.666667,0.0,62.0,0.0,224.0,0.0,10.0,0.0,30.0,0.0,28.0,0.0,16.0,0.0,0.0,0.0,43.0,0.0,1.0,0.0,1.0,0.0,2.0,0.0,1.0,0.0,1.0,0.0,8.0,0.0,0.0,0.0,167.0,0.0,192.0,0.0,763.0,0.0,26.0,0.0,100.0,0.0,94.0,0.0,73.0,0.0,2.0,0.0,158.0,0.0,2.0,0.0,8.0,0.0,9.0,0.0,8.0,0.0,2.0,0.0,28.0,0.0,2.0,0.0,78.0,0.0,28.0,0.0,90.0,0.0,49.666667,0.0,224.0,0.0,28.0,0.0,78.0,0.0,0.348214,0.0,43.0,0.0,106.0,0.0,5.073826,0.0,1.57047,0.0,0.191964,0.0,0.473214,0.0,265.0,0.0,84.0,0.0,276.0,0.0,167.0,0.0,763.0,0.0,94.0,0.0,265.0,0.0,0.347313,0.0,158.0,0.0,349.0,0.0,5.065868,0.0,1.586826,0.0,0.207077,0.0,0.457405


In [23]:
df.drop(df.index[df.IP_mod_10_v==0],inplace=True)
df.drop(df.index[df.IP_mod_10_h==0],inplace=True)
df.shape

(96248, 329)

In [24]:
df.reset_index(drop=True, inplace=True)

In [25]:
df.to_csv('df_bp5.csv', index=False)