In [40]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline

pd.set_option('display.max_columns',1000)
pd.set_option('display.max_rows',1000)



In [2]:
df_youna = pd.read_csv('PitchersData/pitching_data_youna002.csv')

In [3]:
df_youna.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 97 entries, 0 to 96
Data columns (total 31 columns):
 #   Column       Non-Null Count  Dtype  
---  ------       --------------  -----  
 0   at_vs        97 non-null     object 
 1   Opponent     97 non-null     object 
 2   League       97 non-null     object 
 3   GS           97 non-null     int64  
 4   CG           97 non-null     int64  
 5   SHO          97 non-null     int64  
 6   GF           97 non-null     int64  
 7   SV           97 non-null     int64  
 8   IP           97 non-null     float64
 9   H            97 non-null     int64  
 10  BFP          97 non-null     int64  
 11  HR           97 non-null     int64  
 12  R            97 non-null     int64  
 13  ER           97 non-null     int64  
 14  BB           97 non-null     int64  
 15  IB           97 non-null     int64  
 16  SO           97 non-null     int64  
 17  SH           97 non-null     int64  
 18  SF           97 non-null     int64  
 19  WP        

In [4]:
df_youna['IP_real'] = df_youna['IP_real'] = (df_youna.IP - (df_youna.IP % 1)) + (df_youna.IP % 1) *(10/3)
df_youna

Unnamed: 0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,Date,dblhead_num,IP_real
0,AT,SF,N,1,0,0,0,0,5.0,3,20,1,1,1,1,0,5,0,0,0,1,0,1,0,0,0,1,0,1.8,6-27-2019,,5.0
1,AT,LA,N,0,0,0,0,0,2.1,0,7,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1.23,7- 2-2019,,2.333333
2,VS,COL,N,1,0,0,0,0,6.0,0,19,0,0,0,1,0,3,1,0,0,0,0,0,0,0,0,1,0,0.68,7- 7-2019,,6.0
3,AT,TEX,A,1,0,0,0,0,5.1,3,19,1,1,1,1,0,4,0,0,0,0,0,0,0,0,0,1,0,0.96,7-16-2019,,5.333333
4,VS,MIL,N,1,0,0,0,0,4.0,3,18,1,4,4,3,0,5,0,0,0,0,0,1,0,0,0,0,0,2.38,7-21-2019,,4.0
5,AT,MIA,N,1,0,0,0,0,6.0,8,25,1,2,2,1,0,2,0,0,0,0,0,2,0,1,0,1,0,2.51,7-27-2019,,6.0
6,VS,WAS,N,1,0,0,0,0,6.0,3,25,0,2,2,3,1,9,0,0,0,1,0,2,0,0,0,0,1,2.6,8- 2-2019,,6.0
7,AT,LA,N,1,0,0,0,0,3.1,5,19,1,4,4,3,1,2,1,0,1,0,0,1,0,0,1,0,1,3.32,8-10-2019,,3.333333
8,VS,SF,N,1,0,0,0,0,5.0,8,24,1,5,5,2,1,2,0,0,0,0,0,2,0,0,0,0,1,3.98,8-15-2019,,5.0
9,VS,COL,N,1,0,0,0,0,6.0,7,25,1,3,3,1,0,4,0,0,0,0,0,2,0,1,0,1,0,4.04,8-20-2019,,6.0


In [5]:
df_youna.columns

Index(['at_vs', 'Opponent', 'League', 'GS', 'CG', 'SHO', 'GF', 'SV', 'IP', 'H',
       'BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP', 'HBP', 'BK',
       '2B', '3B', 'GDP', 'ROE', 'W', 'L', 'ERA', 'Date', 'dblhead_num',
       'IP_real'],
      dtype='object')

### Generating Features for a Starting Pitcher
- Want to creature features based on a lookback across $n$ games for each pitcher
- Need to aggregate statistics like innings pitched (IP), runs or earned runs given up, hits and walks given up, strikeouts, and so on
- We will also need to decide how to handle pitchers early in their career when they have relatively few games on which to base their performance.

In [6]:
def roll_column(df, col, winsize):
    # do the standard Pandas rolling calc
    t_col = df[col].rolling(winsize, closed='left').sum().to_numpy()
    
    # for the early columns, just do a rolling sum from the beginning
    t_col[:winsize] = np.concatenate(([0],df[col].iloc[:(winsize)].cumsum().to_numpy()[:-1]))

    return(t_col)

In [11]:
def load_and_process_pitch_df(p_id, filepath=''):
    fname = filepath+'pitching_data_'+p_id+'.csv'
    pitch_df = pd.read_csv(fname)
    
    # Convert date, fix dblhead_num to be 0,1,2
    pitch_df['Date'] = (pd.to_datetime(pitch_df.Date).astype(str).str.replace('-','')).astype(int)
    pitch_df.dblhead_num.fillna(0, inplace=True)
    pitch_df['dblhead_num'] = pitch_df['dblhead_num'].astype(int)
    
    # Convert IP to proper mathematical format
    pitch_df['IP_real'] = (pitch_df.IP - (pitch_df.IP % 1)) + (pitch_df.IP % 1) * (10/3)
    
    cols_to_agg = ['IP_real', 'H','BFP', 'HR', 'R', 'ER', 'BB', 'IB', 'SO', 'SH', 'SF', 'WP', 'HBP', 'BK',
       '2B', '3B']
    winsizes = [10,35]
    for winsize in winsizes:
        for raw_col in cols_to_agg:
            new_colname = 'rollsum_'+raw_col+'_'+str(winsize)        
            pitch_df[new_colname] = roll_column(pitch_df, raw_col, winsize)

    
    er_per_ip_def = (5/9)
    h_bb_per_ip_def = 1.5
    h_bb_per_bf_def = .37
    so_per_bf_def = .2
    ip_per_game_def = 3
    bf_per_game_def = 12
    tb_bb_perc_def = .45
    for winsize in winsizes:
        hit_col = 'rollsum_H_'+str(winsize)
        bb_col = 'rollsum_BB_'+str(winsize)
        h_bb_col = 'H_BB_roll_'+str(winsize)
        double_col = 'rollsum_2B_'+str(winsize)
        triple_col = 'rollsum_3B_'+str(winsize)
        hr_col = 'rollsum_HR_'+str(winsize)
        xb_col = 'XB_roll_'+str(winsize)
        tb_col = 'TB_roll_'+str(winsize)
        so_col = 'rollsum_SO_'+str(winsize)
        so_mod_col = 'SO_mod_'+str(winsize)
        ip_col = 'rollsum_IP_real_'+str(winsize)
        ip_mod_col = 'IP_mod_'+str(winsize)
        er_col = 'rollsum_ER_'+str(winsize)
        er_mod_col = 'ER_mod_'+str(winsize)
        bf_col = 'rollsum_BFP_'+str(winsize)
        bf_mod_col = 'BF_mod_'+str(winsize)
        era_col = 'ERA_'+str(winsize)
        whip_col = 'WHIP_'+str(winsize)
        so_perc_col = 'SO_perc_'+str(winsize)
        h_bb_perc_col = 'H_BB_perc_'+str(winsize)
        h_bb_mod_col = 'H_BB_mod_'+str(winsize)
        h_bb_mod2_col = 'H_BB_mod2_'+str(winsize)
        tb_bb_mod_col = 'TB_BB_mod_'+str(winsize)
        tb_bb_perc_col = 'TB_BB_perc_'+str(winsize)
        pitch_df[h_bb_col] = pitch_df[hit_col]+pitch_df[bb_col]
        pitch_df[xb_col] = pitch_df[double_col]+2*pitch_df[triple_col]+2*pitch_df[hr_col]
        pitch_df[tb_col] = pitch_df[hit_col]+pitch_df[xb_col]
        pitch_df[ip_mod_col] = np.maximum(pitch_df[ip_col], winsize*ip_per_game_def)
        pitch_df[bf_mod_col] = np.maximum(pitch_df[bf_col], winsize*bf_per_game_def)
        pitch_df[er_mod_col] = pitch_df[er_col] + er_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[h_bb_mod_col] = pitch_df[h_bb_col] + h_bb_per_ip_def*(pitch_df[ip_mod_col]-pitch_df[ip_col])
        pitch_df[h_bb_mod2_col] = pitch_df[h_bb_col] + h_bb_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[so_mod_col] = pitch_df[so_col] + so_per_bf_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[tb_bb_mod_col] = (pitch_df[tb_col] + pitch_df[bb_col])+ tb_bb_perc_def*(pitch_df[bf_mod_col]-pitch_df[bf_col])
        pitch_df[era_col] = (pitch_df[er_mod_col]/pitch_df[ip_mod_col])*9
        pitch_df[whip_col] = pitch_df[h_bb_mod_col]/pitch_df[ip_mod_col]
        pitch_df[so_perc_col] = pitch_df[so_mod_col]/pitch_df[bf_mod_col]
        pitch_df[tb_bb_perc_col] = pitch_df[tb_bb_mod_col]/pitch_df[bf_mod_col]
        pitch_df[h_bb_perc_col] = pitch_df[h_bb_mod2_col]/pitch_df[bf_mod_col]
    pitch_df['date_dblhead'] = (pitch_df['Date'].astype(str) + pitch_df['dblhead_num'].astype(str)).astype(int)
    pitch_df.set_index('date_dblhead', inplace=True)
    return(pitch_df)

In [17]:
df_youna = load_and_process_pitch_df('youna002','PitchersData/')

In [18]:
df_youna.head(25)

Unnamed: 0_level_0,at_vs,Opponent,League,GS,CG,SHO,GF,SV,IP,H,BFP,HR,R,ER,BB,IB,SO,SH,SF,WP,HBP,BK,2B,3B,GDP,ROE,W,L,ERA,Date,dblhead_num,IP_real,rollsum_IP_real_10,rollsum_H_10,rollsum_BFP_10,rollsum_HR_10,rollsum_R_10,rollsum_ER_10,rollsum_BB_10,rollsum_IB_10,rollsum_SO_10,rollsum_SH_10,rollsum_SF_10,rollsum_WP_10,rollsum_HBP_10,rollsum_BK_10,rollsum_2B_10,rollsum_3B_10,rollsum_IP_real_35,rollsum_H_35,rollsum_BFP_35,rollsum_HR_35,rollsum_R_35,rollsum_ER_35,rollsum_BB_35,rollsum_IB_35,rollsum_SO_35,rollsum_SH_35,rollsum_SF_35,rollsum_WP_35,rollsum_HBP_35,rollsum_BK_35,rollsum_2B_35,rollsum_3B_35,H_BB_roll_10,XB_roll_10,TB_roll_10,IP_mod_10,BF_mod_10,ER_mod_10,H_BB_mod_10,H_BB_mod2_10,SO_mod_10,TB_BB_mod_10,ERA_10,WHIP_10,SO_perc_10,TB_BB_perc_10,H_BB_perc_10,H_BB_roll_35,XB_roll_35,TB_roll_35,IP_mod_35,BF_mod_35,ER_mod_35,H_BB_mod_35,H_BB_mod2_35,SO_mod_35,TB_BB_mod_35,ERA_35,WHIP_35,SO_perc_35,TB_BB_perc_35,H_BB_perc_35
date_dblhead,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1
201906270,AT,SF,N,1,0,0,0,0,5.0,3,20,1,1,1,1,0,5,0,0,0,1,0,1,0,0,0,1,0,1.8,20190627,0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30.0,120.0,16.666667,45.0,44.4,24.0,54.0,5.0,1.5,0.2,0.45,0.37,0.0,0.0,0.0,105.0,420.0,58.333333,157.5,155.4,84.0,189.0,5.0,1.5,0.2,0.45,0.37
201907020,AT,LA,N,0,0,0,0,0,2.1,0,7,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1.23,20190702,0,2.333333,5.0,3.0,20.0,1.0,1.0,1.0,1.0,0.0,5.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,5.0,3.0,20.0,1.0,1.0,1.0,1.0,0.0,5.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,4.0,3.0,6.0,30.0,120.0,14.888889,41.5,41.0,25.0,52.0,4.466667,1.383333,0.208333,0.433333,0.341667,4.0,3.0,6.0,105.0,420.0,56.555556,154.0,152.0,85.0,187.0,4.847619,1.466667,0.202381,0.445238,0.361905
201907070,VS,COL,N,1,0,0,0,0,6.0,0,19,0,0,0,1,0,3,1,0,0,0,0,0,0,0,0,1,0,0.68,20190707,0,6.0,7.333333,3.0,27.0,1.0,1.0,1.0,1.0,0.0,6.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,7.333333,3.0,27.0,1.0,1.0,1.0,1.0,0.0,6.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,4.0,3.0,6.0,30.0,120.0,13.592593,38.0,38.41,24.6,48.85,4.077778,1.266667,0.205,0.407083,0.320083,4.0,3.0,6.0,105.0,420.0,55.259259,150.5,149.41,84.6,183.85,4.736508,1.433333,0.201429,0.437738,0.355738
201907160,AT,TEX,A,1,0,0,0,0,5.1,3,19,1,1,1,1,0,4,0,0,0,0,0,0,0,0,0,1,0,0.96,20190716,0,5.333333,13.333333,3.0,46.0,1.0,1.0,1.0,2.0,0.0,9.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,13.333333,3.0,46.0,1.0,1.0,1.0,2.0,0.0,9.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,5.0,3.0,6.0,30.0,120.0,10.259259,30.0,32.38,23.8,41.3,3.077778,1.0,0.198333,0.344167,0.269833,5.0,3.0,6.0,105.0,420.0,51.925926,142.5,143.38,83.8,176.3,4.450794,1.357143,0.199524,0.419762,0.341381
201907210,VS,MIL,N,1,0,0,0,0,4.0,3,18,1,4,4,3,0,5,0,0,0,0,0,1,0,0,0,0,0,2.38,20190721,0,4.0,18.666667,6.0,65.0,2.0,2.0,2.0,3.0,0.0,13.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,18.666667,6.0,65.0,2.0,2.0,2.0,3.0,0.0,13.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,9.0,5.0,11.0,30.0,120.0,8.296296,26.0,29.35,24.0,38.75,2.488889,0.866667,0.2,0.322917,0.244583,9.0,5.0,11.0,105.0,420.0,49.962963,138.5,140.35,84.0,173.75,4.28254,1.319048,0.2,0.41369,0.334167
201907270,AT,MIA,N,1,0,0,0,0,6.0,8,25,1,2,2,1,0,2,0,0,0,0,0,2,0,1,0,1,0,2.51,20190727,0,6.0,22.666667,9.0,83.0,3.0,6.0,6.0,6.0,0.0,18.0,1.0,0.0,0.0,1.0,0.0,2.0,0.0,22.666667,9.0,83.0,3.0,6.0,6.0,6.0,0.0,18.0,1.0,0.0,0.0,1.0,0.0,2.0,0.0,15.0,8.0,17.0,30.0,120.0,10.074074,26.0,28.69,25.4,39.65,3.022222,0.866667,0.211667,0.330417,0.239083,15.0,8.0,17.0,105.0,420.0,51.740741,138.5,139.69,85.4,174.65,4.434921,1.319048,0.203333,0.415833,0.332595
201908020,VS,WAS,N,1,0,0,0,0,6.0,3,25,0,2,2,3,1,9,0,0,0,1,0,2,0,0,0,0,1,2.6,20190802,0,6.0,28.666667,17.0,108.0,4.0,8.0,8.0,7.0,0.0,20.0,1.0,0.0,0.0,1.0,0.0,4.0,0.0,28.666667,17.0,108.0,4.0,8.0,8.0,7.0,0.0,20.0,1.0,0.0,0.0,1.0,0.0,4.0,0.0,24.0,12.0,29.0,30.0,120.0,8.740741,26.0,28.44,22.4,41.4,2.622222,0.866667,0.186667,0.345,0.237,24.0,12.0,29.0,105.0,420.0,50.407407,138.5,139.44,82.4,176.4,4.320635,1.319048,0.19619,0.42,0.332
201908100,AT,LA,N,1,0,0,0,0,3.1,5,19,1,4,4,3,1,2,1,0,1,0,0,1,0,0,1,0,1,3.32,20190810,0,3.333333,34.666667,20.0,133.0,4.0,10.0,10.0,10.0,1.0,29.0,1.0,0.0,0.0,2.0,0.0,6.0,0.0,34.666667,20.0,133.0,4.0,10.0,10.0,10.0,1.0,29.0,1.0,0.0,0.0,2.0,0.0,6.0,0.0,30.0,14.0,34.0,34.666667,133.0,10.0,30.0,30.0,29.0,44.0,2.596154,0.865385,0.218045,0.330827,0.225564,30.0,14.0,34.0,105.0,420.0,49.074074,135.5,136.19,86.4,173.15,4.206349,1.290476,0.205714,0.412262,0.324262
201908150,VS,SF,N,1,0,0,0,0,5.0,8,24,1,5,5,2,1,2,0,0,0,0,0,2,0,0,0,0,1,3.98,20190815,0,5.0,38.0,25.0,152.0,5.0,14.0,14.0,13.0,2.0,31.0,2.0,0.0,1.0,2.0,0.0,7.0,0.0,38.0,25.0,152.0,5.0,14.0,14.0,13.0,2.0,31.0,2.0,0.0,1.0,2.0,0.0,7.0,0.0,38.0,17.0,42.0,38.0,152.0,14.0,38.0,38.0,31.0,55.0,3.315789,1.0,0.203947,0.361842,0.25,38.0,17.0,42.0,105.0,420.0,51.222222,138.5,137.16,84.6,175.6,4.390476,1.319048,0.201429,0.418095,0.326571
201908200,VS,COL,N,1,0,0,0,0,6.0,7,25,1,3,3,1,0,4,0,0,0,0,0,2,0,1,0,1,0,4.04,20190820,0,6.0,43.0,33.0,176.0,6.0,19.0,19.0,15.0,3.0,33.0,2.0,0.0,1.0,2.0,0.0,9.0,0.0,43.0,33.0,176.0,6.0,19.0,19.0,15.0,3.0,33.0,2.0,0.0,1.0,2.0,0.0,9.0,0.0,48.0,21.0,54.0,43.0,176.0,19.0,48.0,48.0,33.0,69.0,3.976744,1.116279,0.1875,0.392045,0.272727,48.0,21.0,54.0,105.0,420.0,53.444444,141.0,138.28,81.8,178.8,4.580952,1.342857,0.194762,0.425714,0.329238


### Load Data

In [20]:
df=pd.read_csv('df_bp3.csv')

  df=pd.read_csv('df_bp3.csv')


In [22]:
start_pitchers_h = df['pitcher_start_id_h'].unique()
start_pitchers_v = df['pitcher_start_id_v'].unique()
start_pitchers_all = np.union1d(start_pitchers_h, start_pitchers_v)
start_pitchers_all

array(['abadf001', 'abboc001', 'abboj001', ..., 'zinkc001', 'zitob001',
       'zycht001'], dtype=object)

In [23]:
pitcher_data = {}
for i, p_id in enumerate(start_pitchers_all):
    if i%100==0:
        print(i)
    pitcher_data[p_id] = load_and_process_pitch_df(p_id, 'PitchersData/')

0
100
200
300
400
500
600
700
800
900
1000
1100
1200
1300
1400
1500
1600
1700
1800
1900
2000
2100
2200


In [24]:
raw_cols_to_add = ['IP_real', 'rollsum_IP_real_10', 'rollsum_H_10',
       'rollsum_BFP_10', 'rollsum_HR_10', 'rollsum_R_10', 'rollsum_ER_10',
       'rollsum_BB_10', 'rollsum_IB_10', 'rollsum_SO_10', 'rollsum_SH_10',
       'rollsum_SF_10', 'rollsum_WP_10', 'rollsum_HBP_10',
       'rollsum_BK_10', 'rollsum_2B_10', 'rollsum_3B_10',
       'rollsum_IP_real_35', 'rollsum_H_35', 'rollsum_BFP_35',
       'rollsum_HR_35', 'rollsum_R_35', 'rollsum_ER_35', 'rollsum_BB_35',
       'rollsum_IB_35', 'rollsum_SO_35', 'rollsum_SH_35', 'rollsum_SF_35',
       'rollsum_WP_35', 'rollsum_HBP_35', 'rollsum_BK_35',
       'rollsum_2B_35', 'rollsum_3B_35', 'H_BB_roll_10', 'XB_roll_10',
       'TB_roll_10', 'IP_mod_10', 'BF_mod_10', 'ER_mod_10', 'H_BB_mod_10', 'H_BB_perc_10',
       'SO_mod_10', 'TB_BB_mod_10', 'ERA_10', 'WHIP_10', 'SO_perc_10',
       'TB_BB_perc_10', 'H_BB_roll_35', 'XB_roll_35', 'TB_roll_35',
       'IP_mod_35', 'BF_mod_35', 'ER_mod_35', 'H_BB_mod_35','H_BB_perc_35', 'SO_mod_35',
       'TB_BB_mod_35', 'ERA_35', 'WHIP_35', 'SO_perc_35', 'TB_BB_perc_35']
cols_to_add = [col+suff for col in raw_cols_to_add for suff in ['_h','_v']]

col_add_dict = {col:np.zeros(df.shape[0]) for col in cols_to_add}

In [27]:
for i in range(df.shape[0]):
    row = df.iloc[i,:]
    if i%1000==0:
        print(i)
    sp_id_v = row['pitcher_start_id_v']
    sp_id_h = row['pitcher_start_id_h']
    date_dblhead = row['date_dblhead']
    if sp_id_v in pitcher_data.keys():
        curr_df = pitcher_data[sp_id_v]
        if date_dblhead in curr_df.index:
            for col in raw_cols_to_add:
                col_add_dict[col+'_v'][i] = curr_df.loc[date_dblhead,col]
        else:
            print(f'no match for {sp_id_v} date {date_dblhead}')
    if sp_id_h in pitcher_data.keys():
        curr_df = pitcher_data[sp_id_h]
        if date_dblhead in curr_df.index:
            for col in raw_cols_to_add:
                col_add_dict[col+'_h'][i] = curr_df.loc[date_dblhead,col]
        else:
            print(f'no match for {sp_id_h} date {date_dblhead}')

0
no match for cormr001 date 199405200
1000
no match for herso001 date 199407160
2000
3000
4000
5000
6000
7000
8000
9000
10000
no match for merck001 date 199809200
11000
12000
13000
14000
15000
16000
17000
18000
19000
no match for milte001 date 200208060
20000
21000
22000
23000
24000
no match for armat002 date 200408030
25000
26000
27000
28000
no match for mitrs001 date 200605120
29000
30000
31000
32000
33000
34000
35000
36000
37000
38000
39000
40000
no match for volqe001 date 201104220
41000
no match for oswar001 date 201108190
42000
43000
44000
45000
46000
47000
48000
49000
50000
51000
52000
no match for sampa001 date 201606230
53000
54000
55000
56000
57000
no match for hillr001 date 201805192
no match for lylej001 date 201806230
58000
no match for buchc001 date 201809130
59000
no match for cobba001 date 201809230
60000
61000
62000
no match for curtj003 date 202104110
63000
64000
no match for snelb001 date 202204100
65000
66000
no match for mccls003 date 202208300
67000
no match for 

In [28]:
for col in cols_to_add:
    df[col] = col_add_dict[col]

  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]
  df[col] = col_add_dict[col]


In [30]:
df.sample(3)

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,IP_real_h,IP_real_v,rollsum_IP_real_10_h,rollsum_IP_real_10_v,rollsum_H_10_h,rollsum_H_10_v,rollsum_BFP_10_h,rollsum_BFP_10_v,rollsum_HR_10_h,rollsum_HR_10_v,rollsum_R_10_h,rollsum_R_10_v,rollsum_ER_10_h,rollsum_ER_10_v,rollsum_BB_10_h,rollsum_BB_10_v,rollsum_IB_10_h,rollsum_IB_10_v,rollsum_SO_10_h,rollsum_SO_10_v,rollsum_SH_10_h,rollsum_SH_10_v,rollsum_SF_10_h,rollsum_SF_10_v,rollsum_WP_10_h,rollsum_WP_10_v,rollsum_HBP_10_h,rollsum_HBP_10_v,rollsum_BK_10_h,rollsum_BK_10_v,rollsum_2B_10_h,rollsum_2B_10_v,rollsum_3B_10_h,rollsum_3B_10_v,rollsum_IP_real_35_h,rollsum_IP_real_35_v,rollsum_H_35_h,rollsum_H_35_v,rollsum_BFP_35_h,rollsum_BFP_35_v,rollsum_HR_35_h,rollsum_HR_35_v,rollsum_R_35_h,rollsum_R_35_v,rollsum_ER_35_h,rollsum_ER_35_v,rollsum_BB_35_h,rollsum_BB_35_v,rollsum_IB_35_h,rollsum_IB_35_v,rollsum_SO_35_h,rollsum_SO_35_v,rollsum_SH_35_h,rollsum_SH_35_v,rollsum_SF_35_h,rollsum_SF_35_v,rollsum_WP_35_h,rollsum_WP_35_v,rollsum_HBP_35_h,rollsum_HBP_35_v,rollsum_BK_35_h,rollsum_BK_35_v,rollsum_2B_35_h,rollsum_2B_35_v,rollsum_3B_35_h,rollsum_3B_35_v,H_BB_roll_10_h,H_BB_roll_10_v,XB_roll_10_h,XB_roll_10_v,TB_roll_10_h,TB_roll_10_v,IP_mod_10_h,IP_mod_10_v,BF_mod_10_h,BF_mod_10_v,ER_mod_10_h,ER_mod_10_v,H_BB_mod_10_h,H_BB_mod_10_v,H_BB_perc_10_h,H_BB_perc_10_v,SO_mod_10_h,SO_mod_10_v,TB_BB_mod_10_h,TB_BB_mod_10_v,ERA_10_h,ERA_10_v,WHIP_10_h,WHIP_10_v,SO_perc_10_h,SO_perc_10_v,TB_BB_perc_10_h,TB_BB_perc_10_v,H_BB_roll_35_h,H_BB_roll_35_v,XB_roll_35_h,XB_roll_35_v,TB_roll_35_h,TB_roll_35_v,IP_mod_35_h,IP_mod_35_v,BF_mod_35_h,BF_mod_35_v,ER_mod_35_h,ER_mod_35_v,H_BB_mod_35_h,H_BB_mod_35_v,H_BB_perc_35_h,H_BB_perc_35_v,SO_mod_35_h,SO_mod_35_v,TB_BB_mod_35_h,TB_BB_mod_35_v,ERA_35_h,ERA_35_v,WHIP_35_h,WHIP_35_v,SO_perc_35_h,SO_perc_35_v,TB_BB_perc_35_h,TB_BB_perc_35_v
35345,20090512,0,Tue,SDN,NL,33,CHN,NL,32,2,6,51,N,,,,CHI11,39963.0,159,200000000,00001212x,31,5,1,0,1,2,0,0,0,2,0,7,1,0,1,0,4,3,6,6,2,0,24,9,0,0,0,0,34,11,4,0,2,5,1,0,0,4,0,11,1,0,0,0,9,4,2,2,0,0,27,5,0,0,1,0,herna901,Angel Hernandez,welkb901,Bill Welke,welkt901,Tim Welke,barrs901,Scott Barry,,(none),,(none),blacb001,Buddy Black,pinil001,Lou Piniella,hardr001,Rich Harden,peavj001,Jake Peavy,,(none),bradm001,Milton Bradley,peavj001,Jake Peavy,hardr001,Rich Harden,gileb002,Brian Giles,9,ecksd001,David Eckstein,4,gonza003,Adrian Gonzalez,3,headc001,Chase Headley,7,geruj001,Jody Gerut,8,kouzk001,Kevin Kouzmanoff,5,blanh001,Henry Blanco,2,rodrl002,Luis Rodriguez,6,peavj001,Jake Peavy,1,soria001,Alfonso Soriano,7,therr001,Ryan Theriot,6,fukuk001,Kosuke Fukudome,8,lee-d002,Derrek Lee,3,bradm001,Milton Bradley,9,fontm001,Mike Fontenot,5,sotog001,Geovany Soto,2,milea001,Aaron Miles,4,hardr001,Rich Harden,1,,Y,2009,4,1,8,200905120,0.270878,0.251633,0.343436,0.316261,0.434845,0.400036,0.778281,0.716297,83.0,44.0,34.0,19.0,97.0,87.0,0.25,0.242574,0.328947,0.315742,0.407843,0.39703,0.736791,0.712772,19.0,15.0,11.0,4.0,19.0,14.0,0.0,0.0,0.5,0.0,,6.0,6.0,53.666667,66.333333,40.0,59.0,237.0,276.0,6.0,7.0,26.0,32.0,23.0,31.0,33.0,27.0,2.0,1.0,60.0,63.0,4.0,2.0,1.0,1.0,1.0,2.0,3.0,0.0,0.0,1.0,8.0,8.0,0.0,1.0,186.333333,226.333333,130.0,195.0,766.0,931.0,18.0,24.0,60.0,86.0,55.0,83.0,83.0,80.0,4.0,3.0,229.0,224.0,5.0,8.0,3.0,4.0,4.0,7.0,5.0,5.0,0.0,1.0,24.0,28.0,2.0,5.0,73.0,86.0,20.0,24.0,60.0,83.0,53.666667,66.333333,237.0,276.0,23.0,31.0,73.0,86.0,0.308017,0.311594,60.0,63.0,93.0,110.0,3.857143,4.20603,1.360248,1.296482,0.253165,0.228261,0.392405,0.398551,213.0,275.0,64.0,86.0,194.0,281.0,186.333333,226.333333,766.0,931.0,55.0,83.0,213.0,275.0,0.278068,0.295381,229.0,224.0,277.0,361.0,2.65653,3.300442,1.143113,1.215022,0.298956,0.240602,0.361619,0.387755
6925,19970625,0,Wed,KCA,AL,72,CHA,AL,74,7,8,59,D,,,,CHI12,22176.0,203,2000011300,0000011501,43,14,4,1,0,7,2,0,0,3,1,4,1,0,0,0,11,4,8,8,0,0,29,8,0,0,0,0,40,13,2,1,2,8,1,0,0,3,1,8,0,1,0,0,7,4,7,7,0,0,30,10,1,0,0,0,hendt901,Ted Hendry,barrt901,Ted Barrett,onorb901,Brian O'Nora,clara901,Al Clark,,(none),,(none),boonb001,Bob Boone,bevit801,Terry Bevington,karcm001,Matt Karchner,montj002,Jeff Montgomery,,(none),valdm002,Mario Valdez,belct001,Tim Belcher,castc002,Carlos Castillo,offej001,Jose Offerman,4,goodt001,Tom Goodwin,8,bellj001,Jay Bell,6,kingj001,Jeff King,3,davic001,Chili Davis,10,damoj001,Johnny Damon,7,dye-j001,Jermaine Dye,9,coops001,Scott Cooper,5,macfm001,Mike Macfarlane,2,martd002,Dave Martinez,9,durhr001,Ray Durham,4,thomf001,Frank Thomas,3,bellj002,Albert Belle,7,fabrj001,Jorge Fabregas,2,bainh001,Harold Baines,10,camem001,Mike Cameron,8,snopc001,Chris Snopek,5,guilo001,Ozzie Guillen,6,,Y,1997,1,1,15,199706250,0.277788,0.265969,0.351504,0.328713,0.429832,0.403825,0.781337,0.732538,115.0,182.0,51.0,85.0,122.0,108.0,0.266995,0.263311,0.32852,0.324756,0.419704,0.404647,0.748224,0.729403,18.0,28.0,6.0,18.0,20.0,15.0,0.0,0.0,0.5,0.0,,5.333333,7.0,14.0,72.333333,20.0,80.0,68.0,309.0,1.0,5.0,9.0,34.0,8.0,34.0,10.0,24.0,1.0,1.0,10.0,39.0,0.0,2.0,1.0,0.0,2.0,2.0,0.0,2.0,0.0,0.0,6.0,19.0,1.0,0.0,35.333333,259.333333,39.0,272.0,163.0,1088.0,4.0,22.0,20.0,111.0,18.0,104.0,24.0,69.0,3.0,5.0,25.0,124.0,0.0,5.0,2.0,9.0,3.0,5.0,0.0,5.0,0.0,0.0,10.0,57.0,1.0,3.0,30.0,104.0,10.0,29.0,30.0,109.0,30.0,72.333333,120.0,309.0,16.888889,34.0,54.0,104.0,0.410333,0.33657,20.4,39.0,63.4,133.0,5.066667,4.230415,1.8,1.437788,0.17,0.126214,0.528333,0.430421,63.0,341.0,20.0,107.0,59.0,379.0,105.0,259.333333,420.0,1088.0,56.703704,104.0,167.5,341.0,0.376405,0.313419,76.4,124.0,198.65,448.0,4.860317,3.609254,1.595238,1.31491,0.181905,0.113971,0.472976,0.411765
482,19940514,0,Sat,SDN,NL,35,LAN,NL,36,1,2,52,N,,,,LOS03,46137.0,147,1000000,000000101,33,8,1,0,0,1,0,0,0,3,1,3,0,0,2,0,8,2,2,2,0,0,25,10,1,0,0,0,33,9,0,0,0,2,1,0,0,1,1,7,0,0,0,0,8,2,1,1,0,0,27,12,0,0,2,0,willc901,Charlie Williams,barnr901,Ron Barnes,monte901,Ed Montague,darlg901,Gary Darling,,(none),,(none),riggj801,Jim Riggleman,lasot101,Tom Lasorda,gottj001,Jim Gott,hofft001,Trevor Hoffman,,(none),offej001,Jose Offerman,ashba002,Andy Ashby,herso001,Orel Hershiser,belld001,Derek Bell,8,hyert001,Tim Hyers,3,gwynt001,Tony Gwynn,9,planp001,Phil Plantier,7,livis001,Scott Livingstone,5,ausmb001,Brad Ausmus,2,lopel002,Luis Lopez,4,gutir001,Ricky Gutierrez,6,ashba002,Andy Ashby,1,butlb001,Brett Butler,8,deshd001,Delino DeShields,4,piazm001,Mike Piazza,2,wallt001,Tim Wallach,5,rodrh001,Henry Rodriguez,7,karre001,Eric Karros,3,mondr002,Raul Mondesi,9,offej001,Jose Offerman,6,herso001,Orel Hershiser,1,,Y,1994,1,1,3,199405140,,,,,,,,,,,,,,,0.295347,0.244379,0.36309,0.293419,0.475783,0.397849,0.838874,0.691268,28.0,14.0,11.0,6.0,26.0,28.0,0.0,0.0,0.5,0.0,,8.0,8.0,65.666667,65.0,68.0,62.0,274.0,278.0,6.0,8.0,28.0,31.0,23.0,27.0,19.0,22.0,3.0,6.0,47.0,44.0,1.0,4.0,1.0,2.0,1.0,4.0,0.0,1.0,0.0,0.0,15.0,14.0,0.0,4.0,224.333333,146.333333,219.0,183.0,948.0,673.0,20.0,23.0,111.0,113.0,90.0,102.0,71.0,63.0,11.0,10.0,153.0,98.0,11.0,7.0,4.0,8.0,7.0,8.0,7.0,3.0,0.0,1.0,44.0,37.0,5.0,5.0,87.0,84.0,27.0,38.0,95.0,100.0,65.666667,65.0,274.0,278.0,23.0,27.0,87.0,84.0,0.317518,0.302158,47.0,44.0,114.0,122.0,3.152284,3.738462,1.324873,1.292308,0.171533,0.158273,0.416058,0.438849,290.0,246.0,94.0,93.0,313.0,276.0,224.333333,146.333333,948.0,673.0,90.0,102.0,290.0,246.0,0.305907,0.365527,153.0,98.0,384.0,339.0,3.610698,6.273349,1.292719,1.681093,0.161392,0.145617,0.405063,0.503715


In [31]:
df.shape

(67352, 321)

In [33]:
(df['IP_mod_10_h']==0).sum()

1

In [34]:
(df['IP_mod_10_v']==0).sum()

16

In [35]:
df.loc[df['IP_mod_10_v']==0]

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,IP_real_h,IP_real_v,rollsum_IP_real_10_h,rollsum_IP_real_10_v,rollsum_H_10_h,rollsum_H_10_v,rollsum_BFP_10_h,rollsum_BFP_10_v,rollsum_HR_10_h,rollsum_HR_10_v,rollsum_R_10_h,rollsum_R_10_v,rollsum_ER_10_h,rollsum_ER_10_v,rollsum_BB_10_h,rollsum_BB_10_v,rollsum_IB_10_h,rollsum_IB_10_v,rollsum_SO_10_h,rollsum_SO_10_v,rollsum_SH_10_h,rollsum_SH_10_v,rollsum_SF_10_h,rollsum_SF_10_v,rollsum_WP_10_h,rollsum_WP_10_v,rollsum_HBP_10_h,rollsum_HBP_10_v,rollsum_BK_10_h,rollsum_BK_10_v,rollsum_2B_10_h,rollsum_2B_10_v,rollsum_3B_10_h,rollsum_3B_10_v,rollsum_IP_real_35_h,rollsum_IP_real_35_v,rollsum_H_35_h,rollsum_H_35_v,rollsum_BFP_35_h,rollsum_BFP_35_v,rollsum_HR_35_h,rollsum_HR_35_v,rollsum_R_35_h,rollsum_R_35_v,rollsum_ER_35_h,rollsum_ER_35_v,rollsum_BB_35_h,rollsum_BB_35_v,rollsum_IB_35_h,rollsum_IB_35_v,rollsum_SO_35_h,rollsum_SO_35_v,rollsum_SH_35_h,rollsum_SH_35_v,rollsum_SF_35_h,rollsum_SF_35_v,rollsum_WP_35_h,rollsum_WP_35_v,rollsum_HBP_35_h,rollsum_HBP_35_v,rollsum_BK_35_h,rollsum_BK_35_v,rollsum_2B_35_h,rollsum_2B_35_v,rollsum_3B_35_h,rollsum_3B_35_v,H_BB_roll_10_h,H_BB_roll_10_v,XB_roll_10_h,XB_roll_10_v,TB_roll_10_h,TB_roll_10_v,IP_mod_10_h,IP_mod_10_v,BF_mod_10_h,BF_mod_10_v,ER_mod_10_h,ER_mod_10_v,H_BB_mod_10_h,H_BB_mod_10_v,H_BB_perc_10_h,H_BB_perc_10_v,SO_mod_10_h,SO_mod_10_v,TB_BB_mod_10_h,TB_BB_mod_10_v,ERA_10_h,ERA_10_v,WHIP_10_h,WHIP_10_v,SO_perc_10_h,SO_perc_10_v,TB_BB_perc_10_h,TB_BB_perc_10_v,H_BB_roll_35_h,H_BB_roll_35_v,XB_roll_35_h,XB_roll_35_v,TB_roll_35_h,TB_roll_35_v,IP_mod_35_h,IP_mod_35_v,BF_mod_35_h,BF_mod_35_v,ER_mod_35_h,ER_mod_35_v,H_BB_mod_35_h,H_BB_mod_35_v,H_BB_perc_35_h,H_BB_perc_35_v,SO_mod_35_h,SO_mod_35_v,TB_BB_mod_35_h,TB_BB_mod_35_v,ERA_35_h,ERA_35_v,WHIP_35_h,WHIP_35_v,SO_perc_35_h,SO_perc_35_v,TB_BB_perc_35_h,TB_BB_perc_35_v
555,19940520,0,Fri,SLN,NL,40,FLO,NL,41,3,2,54,N,,,,MIA01,31512.0,193,102000,000002000,31,6,2,0,0,3,0,0,0,10,2,4,1,1,0,0,11,5,2,2,0,0,27,13,0,0,2,0,33,9,2,0,0,2,1,0,1,2,0,4,0,0,2,0,8,4,3,3,0,0,27,13,1,0,0,0,marsr901,Randy Marsh,hirsm901,Mark Hirschbeck,vanol901,Larry Vanover,relic901,Charlie Reliford,,(none),,(none),torrj101,Joe Torre,lachr101,Rene Lachemann,everb001,Bryan Eversgerd,gardm001,Mark Gardner,perem002,Mike Perez,jordb001,Brian Jordan,cormr001,Rheal Cormier,gardm001,Mark Gardner,lankr001,Ray Lankford,8,smito001,Ozzie Smith,6,jeffg001,Gregg Jefferies,3,zeilt001,Todd Zeile,5,whitm001,Mark Whiten,9,jordb001,Brian Jordan,7,pagnt001,Tom Pagnozzi,2,alicl001,Luis Alicea,4,cormr001,Rheal Cormier,1,carrc001,Chuck Carr,8,abbok002,Kurt Abbott,6,santb001,Benito Santiago,2,conij001,Jeff Conine,7,desto001,Orestes Destrade,3,magad001,Dave Magadan,5,everc001,Carl Everett,9,barbb001,Bret Barberie,4,gardm001,Mark Gardner,1,,Y,1994,-1,0,5,199405200,,,,,,,,,,,,,,,0.270138,0.250499,0.345374,0.333037,0.398821,0.40519,0.744196,0.738227,24.0,24.0,5.0,15.0,23.0,17.0,0.0,0.0,0.5,0.0,,5.666667,0.0,29.0,0.0,32.0,0.0,124.0,0.0,7.0,0.0,25.0,0.0,23.0,0.0,9.0,0.0,0.0,0.0,15.0,0.0,2.0,0.0,4.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,8.0,0.0,2.0,0.0,155.0,0.0,156.0,0.0,661.0,0.0,24.0,0.0,109.0,0.0,103.0,0.0,53.0,0.0,0.0,0.0,93.0,0.0,5.0,0.0,11.0,0.0,4.0,0.0,9.0,0.0,0.0,0.0,41.0,0.0,4.0,0.0,41.0,0.0,26.0,0.0,58.0,0.0,30.0,0.0,124.0,0.0,23.555556,0.0,42.5,0.0,0.330645,0.0,15.0,0.0,67.0,0.0,7.066667,0.0,1.416667,0.0,0.120968,0.0,0.540323,0.0,209.0,0.0,97.0,0.0,253.0,0.0,155.0,0.0,661.0,0.0,103.0,0.0,209.0,0.0,0.316188,0.0,93.0,0.0,306.0,0.0,5.980645,0.0,1.348387,0.0,0.140696,0.0,0.462935,0.0
1258,19940716,0,Sat,LAN,NL,91,PHI,NL,91,6,10,51,N,,,,PHI12,46679.0,170,110030100,01503001x,35,12,1,0,1,6,0,1,0,3,0,2,0,0,3,0,6,4,6,6,1,0,24,12,3,0,2,0,35,11,2,1,2,9,0,1,0,5,1,3,1,0,2,0,7,3,6,6,0,0,27,12,0,0,3,0,wendh901,Harry Wendelstedt,relic901,Charlie Reliford,hirsm901,Mark Hirschbeck,riekr901,Rich Rieker,,(none),,(none),lasot101,Tom Lasorda,fregj101,Jim Fregosi,munob001,Bobby Munoz,martr002,Ramon Martinez,borlt001,Toby Borland,eisej001,Jim Eisenreich,herso001,Orel Hershiser,munob001,Bobby Munoz,butlb001,Brett Butler,8,deshd001,Delino DeShields,4,piazm001,Mike Piazza,2,wallt001,Tim Wallach,5,rodrh001,Henry Rodriguez,7,mondr002,Raul Mondesi,9,karre001,Eric Karros,3,bourr001,Rafael Bournigal,6,herso001,Orel Hershiser,1,hatcb001,Billy Hatcher,8,duncm001,Mariano Duncan,5,thomm001,Milt Thompson,7,krukj001,John Kruk,3,eisej001,Jim Eisenreich,9,moram001,Mickey Morandini,4,liebm001,Mike Lieberthal,2,stock001,Kevin Stocker,6,munob001,Bobby Munoz,1,,Y,1994,4,1,16,199407160,,,,,,,,,,,,,,,0.251734,0.249246,0.321653,0.310886,0.360753,0.374874,0.682406,0.68576,20.0,10.0,9.0,8.0,22.0,21.0,0.0,0.0,0.5,0.0,,5.0,0.0,60.0,0.0,52.0,0.0,257.0,0.0,5.0,0.0,18.0,0.0,11.0,0.0,25.0,0.0,0.0,0.0,43.0,0.0,3.0,0.0,2.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0,90.333333,0.0,91.0,0.0,402.0,0.0,6.0,0.0,41.0,0.0,32.0,0.0,42.0,0.0,1.0,0.0,57.0,0.0,4.0,0.0,5.0,0.0,5.0,0.0,1.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,77.0,0.0,17.0,0.0,69.0,0.0,60.0,0.0,257.0,0.0,11.0,0.0,77.0,0.0,0.299611,0.0,43.0,0.0,94.0,0.0,1.65,0.0,1.283333,0.0,0.167315,0.0,0.365759,0.0,133.0,0.0,31.0,0.0,122.0,0.0,105.0,0.0,420.0,0.0,40.148148,0.0,155.0,0.0,0.332524,0.0,60.6,0.0,172.1,0.0,3.44127,0.0,1.47619,0.0,0.144286,0.0,0.409762,0.0
10479,19980920,0,Sun,SLN,NL,157,MIL,NL,156,11,6,54,D,,,,MIL05,52831.0,208,213030002,000105000,36,10,1,0,5,10,0,1,0,5,0,5,2,0,0,0,4,6,6,6,0,0,27,6,0,0,0,0,39,13,4,0,0,6,0,1,0,6,0,11,0,0,0,0,13,6,10,10,0,0,27,8,1,0,0,0,crawj901,Jerry Crawford,gormb901,Brian Gorman,davib902,Bob Davidson,wintm901,Mike Winters,,(none),,(none),larut101,Tony LaRussa,garnp001,Phil Garner,aybam001,Manny Aybar,karls001,Scott Karl,,(none),mcgwm001,Mark McGwire,merck001,Kent Mercker,karls001,Scott Karl,kellp001,Pat Kelly,4,tatif001,Fernando Tatis,5,mcgwm001,Mark McGwire,3,jordb001,Brian Jordan,8,gantr001,Ron Gant,7,marre001,Eli Marrero,2,ordal001,Luis Ordaz,6,merck001,Kent Mercker,1,littm001,Mark Little,9,vinaf001,Fernando Vina,4,lorem001,Mark Loretta,3,cirij001,Jeff Cirillo,5,burnj001,Jeromy Burnitz,9,grism001,Marquis Grissom,8,jackd002,Darrin Jackson,7,mathm001,Mike Matheny,2,valej003,Jose Valentin,6,karls001,Scott Karl,1,,Y,1998,-5,0,17,199809200,0.259567,0.256861,0.325329,0.336908,0.397834,0.434081,0.723163,0.770989,86.0,139.0,60.0,40.0,109.0,139.0,0.276852,0.251266,0.324978,0.343111,0.448148,0.445795,0.773127,0.788906,9.0,29.0,5.0,5.0,21.0,31.0,0.0,0.0,0.5,0.0,,3.0,0.0,60.0,0.0,73.0,0.0,262.0,0.0,6.0,0.0,35.0,0.0,35.0,0.0,18.0,0.0,0.0,0.0,29.0,0.0,5.0,0.0,2.0,0.0,4.0,0.0,2.0,0.0,0.0,0.0,14.0,0.0,1.0,0.0,204.666667,0.0,237.0,0.0,902.0,0.0,21.0,0.0,112.0,0.0,101.0,0.0,69.0,0.0,4.0,0.0,108.0,0.0,14.0,0.0,4.0,0.0,7.0,0.0,5.0,0.0,0.0,0.0,57.0,0.0,3.0,0.0,91.0,0.0,28.0,0.0,101.0,0.0,60.0,0.0,262.0,0.0,35.0,0.0,91.0,0.0,0.347328,0.0,29.0,0.0,119.0,0.0,5.25,0.0,1.516667,0.0,0.110687,0.0,0.454198,0.0,306.0,0.0,105.0,0.0,342.0,0.0,204.666667,0.0,902.0,0.0,101.0,0.0,306.0,0.0,0.339246,0.0,108.0,0.0,411.0,0.0,4.441368,0.0,1.495114,0.0,0.119734,0.0,0.455654,0.0
19531,20020806,0,Tue,MIN,AL,114,BAL,AL,110,2,9,51,N,,,,BAL12,33858.0,167,2000,00010260x,34,7,0,0,1,2,0,0,0,1,0,5,0,0,1,0,6,3,9,9,2,0,24,6,0,0,0,0,31,7,0,0,2,8,0,0,0,7,0,10,0,0,0,0,5,4,2,2,0,0,27,12,2,0,1,0,kulpr901,Ron Kulpa,scotd901,Dale Scott,joycj901,Jim Joyce,nelsj901,Jeff Nelson,,(none),,(none),gardr001,Ron Gardenhire,hargm001,Mike Hargrove,ponss001,Sidney Ponson,santj003,Johan Santana,,(none),cordm001,Marty Cordova,milte001,Eric Milton,ponss001,Sidney Ponson,jonej003,Jacque Jones,7,guzmc001,Cristian Guzman,6,mohrd001,Dustan Mohr,9,ortid001,David Ortiz,10,huntt001,Torii Hunter,8,miend001,Doug Mientkiewicz,3,cuddm001,Michael Cuddyer,5,piera001,A.J. Pierzynski,2,rival001,Luis Rivas,4,moram002,Melvin Mora,8,lopel002,Luis Lopez,6,mattg002,Gary Matthews,9,batit001,Tony Batista,5,cordm001,Marty Cordova,7,leonj002,Jose Leon,3,richc001,Chris Richard,10,gil-g001,Geronimo Gil,2,hairj002,Jerry Hairston,4,,Y,2002,7,1,11,200208060,0.252224,0.274297,0.312406,0.335236,0.402579,0.43681,0.714985,0.772046,143.0,109.0,50.0,71.0,100.0,90.0,0.267308,0.285578,0.324468,0.346154,0.426923,0.468004,0.751391,0.814158,27.0,15.0,10.0,14.0,18.0,11.0,0.0,0.0,0.5,0.0,,6.666667,0.0,57.666667,0.0,56.0,0.0,239.0,0.0,7.0,0.0,25.0,0.0,23.0,0.0,23.0,0.0,0.0,0.0,38.0,0.0,0.0,0.0,3.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,8.0,0.0,1.0,0.0,212.0,0.0,230.0,0.0,911.0,0.0,30.0,0.0,116.0,0.0,109.0,0.0,72.0,0.0,0.0,0.0,129.0,0.0,4.0,0.0,4.0,0.0,2.0,0.0,7.0,0.0,0.0,0.0,47.0,0.0,4.0,0.0,79.0,0.0,24.0,0.0,80.0,0.0,57.666667,0.0,239.0,0.0,23.0,0.0,79.0,0.0,0.330544,0.0,38.0,0.0,103.0,0.0,3.589595,0.0,1.369942,0.0,0.158996,0.0,0.430962,0.0,302.0,0.0,115.0,0.0,345.0,0.0,212.0,0.0,911.0,0.0,109.0,0.0,302.0,0.0,0.331504,0.0,129.0,0.0,417.0,0.0,4.627358,0.0,1.424528,0.0,0.141603,0.0,0.457739,0.0
24297,20040803,0,Tue,MON,NL,105,SLN,NL,105,10,6,72,N,,,,STL09,33696.0,255,1012002004,210210000000,52,16,4,0,3,10,1,0,0,6,1,4,0,0,0,0,13,7,6,6,1,0,36,16,1,0,2,0,45,12,2,0,2,6,1,0,0,6,2,8,0,1,1,0,10,7,9,9,0,0,36,17,1,0,0,0,carlm901,Mark Carlson,rungb901,Brian Runge,hohnb901,Bill Hohn,darlg901,Gary Darling,,(none),,(none),robif103,Frank Robinson,larut101,Tony LaRussa,cordc001,Chad Cordero,hared001,Dan Haren,,(none),batit001,Tony Batista,armat002,Tony Armas,marqj001,Jason Marquis,wilkb002,Brad Wilkerson,8,sledt001,Terrmel Sledge,7,vidrj001,Jose Vidro,4,batit001,Tony Batista,5,johnn001,Nick Johnson,3,gonza001,Alex Gonzalez,6,callr001,Ron Calloway,9,schnb001,Brian Schneider,2,armat002,Tony Armas,1,womat001,Tony Womack,4,rente001,Edgar Renteria,6,pujoa001,Albert Pujols,3,roles001,Scott Rolen,5,edmoj001,Jim Edmonds,8,ceder001,Roger Cedeno,9,andem003,Marlon Anderson,7,moliy001,Yadier Molina,2,marqj001,Jason Marquis,1,,Y,2004,-4,0,16,200408030,0.272989,0.248512,0.339318,0.311285,0.449713,0.387091,0.78903,0.698376,99.0,93.0,34.0,34.0,81.0,89.0,0.294508,0.262097,0.355536,0.330896,0.492424,0.399194,0.847961,0.730089,16.0,14.0,7.0,6.0,14.0,19.0,0.0,0.0,0.5,0.0,,5.666667,0.0,65.333333,0.0,72.0,0.0,276.0,0.0,9.0,0.0,22.0,0.0,21.0,0.0,15.0,0.0,0.0,0.0,49.0,0.0,1.0,0.0,1.0,0.0,2.0,0.0,3.0,0.0,0.0,0.0,9.0,0.0,1.0,0.0,150.0,0.0,166.0,0.0,648.0,0.0,16.0,0.0,67.0,0.0,64.0,0.0,47.0,0.0,3.0,0.0,95.0,0.0,3.0,0.0,5.0,0.0,6.0,0.0,7.0,0.0,0.0,0.0,29.0,0.0,4.0,0.0,87.0,0.0,29.0,0.0,101.0,0.0,65.333333,0.0,276.0,0.0,21.0,0.0,87.0,0.0,0.315217,0.0,49.0,0.0,116.0,0.0,2.892857,0.0,1.331633,0.0,0.177536,0.0,0.42029,0.0,213.0,0.0,69.0,0.0,235.0,0.0,150.0,0.0,648.0,0.0,64.0,0.0,213.0,0.0,0.328704,0.0,95.0,0.0,282.0,0.0,3.84,0.0,1.42,0.0,0.146605,0.0,0.435185,0.0
28110,20060512,0,Fri,FLO,NL,33,PIT,NL,36,9,12,51,N,,,,PIT08,24990.0,209,500000040,00440103x,43,18,5,0,0,8,0,0,0,2,0,5,0,0,1,0,9,4,11,11,0,0,24,14,2,0,2,0,34,15,0,1,0,12,1,2,3,5,0,3,1,0,1,0,9,4,8,8,0,0,27,10,1,0,1,0,nauep901,Paul Nauert,relic901,Charlie Reliford,vanol901,Larry Vanover,gibsg901,Greg Gibson,,(none),,(none),giraj001,Joe Girardi,tracj101,Jim Tracy,cappm001,Matt Capps,wellt002,Todd Wellemeyer,gonzm001,Mike Gonzalez,bay-j001,Jason Bay,mitrs001,Sergio Mitre,santv001,Victor Santos,ramih003,Hanley Ramirez,6,uggld001,Dan Uggla,4,cabrm001,Miguel Cabrera,5,willj004,Josh Willingham,7,borcj001,Joe Borchard,9,jacom001,Mike Jacobs,3,olivm001,Miguel Olivo,2,aberr001,Reggie Abercrombie,8,mitrs001,Sergio Mitre,1,bautj002,Jose Bautista,5,mclon001,Nate McLouth,8,sancf001,Freddy Sanchez,6,wilsc003,Craig Wilson,3,burnj001,Jeromy Burnitz,9,bay-j001,Jason Bay,7,paulr001,Ronny Paulino,2,castj005,Jose Castillo,4,santv001,Victor Santos,1,,Y,2006,3,1,21,200605120,0.257477,0.269126,0.314195,0.332176,0.396396,0.410924,0.710592,0.743101,70.0,106.0,25.0,42.0,120.0,113.0,0.236181,0.24902,0.291705,0.322723,0.376884,0.405882,0.66859,0.728606,13.0,27.0,3.0,12.0,21.0,26.0,0.0,0.0,0.5,0.0,,6.0,0.0,42.666667,0.0,48.0,0.0,185.0,0.0,4.0,0.0,24.0,0.0,22.0,0.0,16.0,0.0,1.0,0.0,31.0,0.0,3.0,0.0,3.0,0.0,5.0,0.0,1.0,0.0,0.0,0.0,5.0,0.0,3.0,0.0,174.666667,0.0,192.0,0.0,780.0,0.0,24.0,0.0,108.0,0.0,91.0,0.0,69.0,0.0,9.0,0.0,111.0,0.0,7.0,0.0,3.0,0.0,10.0,0.0,5.0,0.0,0.0,0.0,39.0,0.0,6.0,0.0,64.0,0.0,19.0,0.0,67.0,0.0,42.666667,0.0,185.0,0.0,22.0,0.0,64.0,0.0,0.345946,0.0,31.0,0.0,83.0,0.0,4.640625,0.0,1.5,0.0,0.167568,0.0,0.448649,0.0,261.0,0.0,99.0,0.0,291.0,0.0,174.666667,0.0,780.0,0.0,91.0,0.0,261.0,0.0,0.334615,0.0,111.0,0.0,360.0,0.0,4.688931,0.0,1.494275,0.0,0.142308,0.0,0.461538,0.0
40015,20110422,0,Fri,CIN,NL,20,SLN,NL,20,2,4,51,N,,,,STL10,40327.0,190,10100,11101000x,34,10,0,0,1,2,0,1,0,5,0,3,2,1,1,0,11,4,4,4,1,0,24,10,1,0,2,0,31,12,2,0,0,3,0,1,1,1,0,2,0,1,2,0,6,5,2,2,2,0,27,14,0,0,1,0,diazl901,Laz Diaz,barrs901,Scott Barry,hirsj901,John Hirschbeck,bellw901,Wally Bell,,(none),,(none),baked002,Dusty Baker,larut101,Tony LaRussa,mcclk001,Kyle McClellan,malom001,Matt Maloney,boggm001,Mitchell Boggs,pujoa001,Albert Pujols,volqe001,Edinson Volquez,batim001,Miguel Batista,stubd001,Drew Stubbs,8,philb001,Brandon Phillips,4,vottj001,Joey Votto,3,gomej001,Jonny Gomes,7,brucj001,Jay Bruce,9,rente001,Edgar Renteria,6,cairm001,Miguel Cairo,5,hernr002,Ramon Hernandez,2,volqe001,Edinson Volquez,1,therr001,Ryan Theriot,6,rasmc001,Colby Rasmus,8,pujoa001,Albert Pujols,3,hollm001,Matt Holliday,7,berkl001,Lance Berkman,9,freed001,David Freese,5,moliy001,Yadier Molina,2,descd001,Daniel Descalso,4,batim001,Miguel Batista,1,,Y,2011,2,1,6,201104220,0.267963,0.275259,0.332731,0.337467,0.405907,0.441271,0.738638,0.778738,80.0,95.0,37.0,38.0,103.0,69.0,0.283539,0.274927,0.353648,0.344133,0.420552,0.439497,0.7742,0.78363,17.0,27.0,7.0,6.0,23.0,13.0,0.0,0.0,0.5,0.0,,0.0,0.0,14.333333,0.0,8.0,0.0,55.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,6.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,49.333333,0.0,45.0,0.0,210.0,0.0,4.0,0.0,19.0,0.0,17.0,0.0,20.0,0.0,3.0,0.0,39.0,0.0,1.0,0.0,1.0,0.0,2.0,0.0,2.0,0.0,0.0,0.0,8.0,0.0,2.0,0.0,14.0,0.0,3.0,0.0,11.0,0.0,30.0,0.0,120.0,0.0,9.703704,0.0,37.5,0.0,0.317083,0.0,20.0,0.0,46.25,0.0,2.911111,0.0,1.25,0.0,0.166667,0.0,0.385417,0.0,65.0,0.0,20.0,0.0,65.0,0.0,105.0,0.0,420.0,0.0,47.925926,0.0,148.5,0.0,0.339762,0.0,81.0,0.0,179.5,0.0,4.107937,0.0,1.414286,0.0,0.192857,0.0,0.427381,0.0
41590,20110819,0,Fri,PHI,NL,123,WAS,NL,123,4,8,53,N,,,,WAS11,37841.0,177,4000000,001010006,33,8,3,1,0,4,0,0,0,3,0,4,0,0,0,0,5,4,8,8,0,0,26,9,1,0,0,0,35,10,2,0,2,8,2,0,0,2,1,7,0,0,0,0,5,4,4,4,0,0,27,15,0,0,1,0,iassd901,Dan Iassogna,scotd901,Dale Scott,mealj901,Jerry Meals,buckc901,CB Bucknor,,(none),,(none),manuc101,Charlie Manuel,johnd105,Davey Johnson,cofft001,Todd Coffey,madsr001,Ryan Madson,,(none),zimmr001,Ryan Zimmerman,oswar001,Roy Oswalt,hernl003,Livan Hernandez,rollj001,Jimmy Rollins,6,maybj001,John Mayberry,8,utlec001,Chase Utley,4,howar001,Ryan Howard,3,pench001,Hunter Pence,9,ibanr001,Raul Ibanez,7,ruizc001,Carlos Ruiz,2,valdw001,Wilson Valdez,5,oswar001,Roy Oswalt,1,desmi001,Ian Desmond,6,ankir001,Rick Ankiel,8,zimmr001,Ryan Zimmerman,5,nix-l001,Laynce Nix,3,wertj001,Jayson Werth,9,espid001,Danny Espinosa,4,gomej001,Jonny Gomes,7,ramow001,Wilson Ramos,2,hernl003,Livan Hernandez,1,,Y,2011,4,1,12,201108190,0.238666,0.255488,0.303842,0.324077,0.374309,0.402123,0.678151,0.7262,109.0,119.0,39.0,27.0,112.0,68.0,0.254652,0.262439,0.315647,0.325602,0.403526,0.440976,0.719173,0.766578,10.0,21.0,8.0,10.0,28.0,8.0,0.0,0.0,0.5,0.0,,4.0,0.0,53.666667,0.0,73.0,0.0,242.0,0.0,6.0,0.0,37.0,0.0,30.0,0.0,11.0,0.0,0.0,0.0,35.0,0.0,3.0,0.0,2.0,0.0,2.0,0.0,3.0,0.0,0.0,0.0,10.0,0.0,2.0,0.0,212.0,0.0,246.0,0.0,915.0,0.0,22.0,0.0,121.0,0.0,106.0,0.0,59.0,0.0,7.0,0.0,126.0,0.0,13.0,0.0,7.0,0.0,3.0,0.0,8.0,0.0,0.0,0.0,49.0,0.0,8.0,0.0,84.0,0.0,26.0,0.0,99.0,0.0,53.666667,0.0,242.0,0.0,30.0,0.0,84.0,0.0,0.347107,0.0,35.0,0.0,110.0,0.0,5.031056,0.0,1.565217,0.0,0.144628,0.0,0.454545,0.0,305.0,0.0,109.0,0.0,355.0,0.0,212.0,0.0,915.0,0.0,106.0,0.0,305.0,0.0,0.333333,0.0,126.0,0.0,414.0,0.0,4.5,0.0,1.438679,0.0,0.137705,0.0,0.452459,0.0
52960,20160623,0,Thu,SEA,AL,73,DET,AL,73,4,5,59,D,,,,DET05,35767.0,204,1210000,0202000001,37,8,2,0,4,4,0,0,0,2,0,8,0,0,1,0,5,6,5,5,1,1,29,6,1,0,1,0,36,8,2,0,1,4,0,0,1,8,1,11,2,0,0,0,11,5,4,4,0,0,30,10,1,0,1,0,fleta901,Andy Fletcher,westj901,Joe West,rippm901,Mark Ripperger,danlk901,Kerwin Danley,,(none),,(none),servs002,Scott Servais,ausmb001,Brad Ausmus,ryank002,Kyle Ryan,cishs001,Steve Cishek,,(none),,(none),sampa001,Adrian Sampson,norrd002,Daniel Norris,martk001,Ketel Marte,6,gutif001,Franklin Gutierrez,7,canor001,Robinson Cano,10,cruzn002,Nelson Cruz,9,lee-d004,Dae-Ho Lee,3,seagk001,Kyle Seager,5,iannc001,Chris Iannetta,2,martl004,Leonys Martin,8,omals001,Shawn O'Malley,4,kinsi001,Ian Kinsler,4,iglej001,Jose Iglesias,6,cabrm001,Miguel Cabrera,10,castn001,Nick Castellanos,5,uptoj001,Justin Upton,7,moyas001,Steven Moya,9,mccaj001,James McCann,2,saltj001,Jarrod Saltalamacchia,3,romia001,Andrew Romine,8,,Y,2016,1,1,9,201606230,0.269665,0.261782,0.323145,0.321399,0.433333,0.437845,0.756478,0.759244,59.0,64.0,35.0,40.0,88.0,98.0,0.283835,0.27955,0.341969,0.328084,0.464286,0.45591,0.806255,0.783994,14.0,9.0,7.0,5.0,14.0,19.0,0.0,0.0,0.5,0.0,,5.0,0.0,40.666667,0.0,34.0,0.0,167.0,0.0,6.0,0.0,20.0,0.0,15.0,0.0,10.0,0.0,0.0,0.0,28.0,0.0,0.0,0.0,2.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,0.0,67.666667,0.0,58.0,0.0,285.0,0.0,10.0,0.0,35.0,0.0,29.0,0.0,25.0,0.0,0.0,0.0,49.0,0.0,1.0,0.0,5.0,0.0,3.0,0.0,2.0,0.0,0.0,0.0,12.0,0.0,3.0,0.0,44.0,0.0,24.0,0.0,58.0,0.0,40.666667,0.0,167.0,0.0,15.0,0.0,44.0,0.0,0.263473,0.0,28.0,0.0,68.0,0.0,3.319672,0.0,1.081967,0.0,0.167665,0.0,0.407186,0.0,83.0,0.0,38.0,0.0,96.0,0.0,105.0,0.0,420.0,0.0,49.740741,0.0,139.0,0.0,0.316548,0.0,76.0,0.0,181.75,0.0,4.263492,0.0,1.32381,0.0,0.180952,0.0,0.432738,0.0
57401,20180519,2,Sat,LAN,NL,45,WAS,NL,45,5,4,54,N,,,,WAS11,32378.0,207,100010012,000004000,36,10,3,1,2,5,0,0,0,4,1,15,1,0,2,0,8,7,4,4,0,0,27,8,1,0,1,0,31,4,2,0,0,4,0,0,2,4,1,8,0,0,1,0,6,4,5,5,0,0,27,7,0,1,2,0,danlk901,Kerwin Danley,fairc901,Chad Fairchild,drecb901,Bruce Dreckman,viscj901,Jansen Visconti,,(none),,(none),robed001,Dave Roberts,martd002,Dave Martinez,goede001,Erik Goeddel,dools001,Sean Doolittle,jansk001,Kenley Jansen,kempm001,Matt Kemp,hillr001,Rich Hill,schem001,Max Scherzer,pedej001,Joc Pederson,7,muncm001,Max Muncy,5,grany001,Yasmani Grandal,3,bellc002,Cody Bellinger,8,taylc001,Chris Taylor,6,utlec001,Chase Utley,4,puigy001,Yasiel Puig,9,barna001,Austin Barnes,2,hillr001,Rich Hill,1,turnt001,Trea Turner,6,difow001,Wilmer Difo,4,harpb003,Bryce Harper,9,renda001,Anthony Rendon,5,reynm001,Mark Reynolds,3,taylm002,Michael Taylor,8,sevep001,Pedro Severino,2,schem001,Max Scherzer,1,steva001,Andrew Stevenson,7,,Y,2018,-1,0,9,201805192,0.255478,0.242485,0.324105,0.322014,0.42878,0.424853,0.752885,0.746868,121.0,73.0,33.0,27.0,84.0,84.0,0.245473,0.238981,0.321881,0.317223,0.418511,0.402547,0.740392,0.71977,21.0,9.0,8.0,4.0,16.0,19.0,0.0,0.0,0.5,0.0,,7.0,0.0,62.0,0.0,36.0,0.0,237.0,0.0,4.0,0.0,14.0,0.0,11.0,0.0,14.0,0.0,1.0,0.0,96.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,3.0,0.0,0.0,0.0,12.0,0.0,3.0,0.0,225.666667,0.0,137.0,0.0,873.0,0.0,22.0,0.0,63.0,0.0,56.0,0.0,59.0,0.0,3.0,0.0,319.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,13.0,0.0,0.0,0.0,37.0,0.0,5.0,0.0,50.0,0.0,26.0,0.0,62.0,0.0,62.0,0.0,237.0,0.0,11.0,0.0,50.0,0.0,0.21097,0.0,96.0,0.0,76.0,0.0,1.596774,0.0,0.806452,0.0,0.405063,0.0,0.320675,0.0,196.0,0.0,91.0,0.0,228.0,0.0,225.666667,0.0,873.0,0.0,56.0,0.0,196.0,0.0,0.224513,0.0,319.0,0.0,287.0,0.0,2.233383,0.0,0.868538,0.0,0.365407,0.0,0.328751,0.0


In [36]:
df.drop(df.index[df['IP_mod_10_v']==0], inplace=True)
df.drop(df.index[df['IP_mod_10_h']==0], inplace=True)

In [37]:
df.loc[df['IP_mod_10_v']==0]

Unnamed: 0,date,dblheader_code,day_of_week,team_v,league_v,game_no_v,team_h,league_h,game_no_h,runs_v,runs_h,outs_total,day_night,completion_info,forfeit_info,protest_info,ballpark_id,attendance,game_minutes,linescore_v,linescore_h,AB_v,H_v,2B_v,3B_v,HR_v,RBI_v,SH_v,SF_v,HBP_v,BB_v,IBB_v,SO_v,SB_v,CS_v,GIDP_v,CI_v,LOB_v,P_num_v,ERind_v,ERteam_v,WP_v,balk_v,PO_v,ASST_v,ERR_v,PB_v,DP_v,TP_v,AB_h,H_h,2B_h,3B_h,HR_h,RBI_h,SH_h,SF_h,HBP_h,BB_h,IBB_h,SO_h,SB_h,CS_h,GIDP_h,CI_h,LOB_h,P_num_h,ERind_h,ERteam_h,WP_h,balk_h,PO_h,ASST_h,ERR_h,PB_h,DP_h,TP_h,ump_HB_id,ump_HB_name,ump_1B_id,ump_1B_name,ump_2B_id,ump_2B_name,ump_3B_id,ump_3B_name,ump_LF_id,ump_LF_name,ump_RF_id,ump_RF_name,mgr_id_v,mgr_name_v,mgr_id_h,mgr_name_h,pitcher_id_w,pitcher_name_w,pitcher_id_l,pitcher_name_l,pitcher_id_s,pitcher_name_s,GWRBI_id,GWRBI_name,pitcher_start_id_v,pitcher_start_name_v,pitcher_start_id_h,pitcher_start_name_h,batter1_name_v,batter1_id_v,batter1_pos_v,batter2_name_v,batter2_id_v,batter2_pos_v,batter3_name_v,batter3_id_v,batter3_pos_v,batter4_name_v,batter4_id_v,batter4_pos_v,batter5_name_v,batter5_id_v,batter5_pos_v,batter6_name_v,batter6_id_v,batter6_pos_v,batter7_name_v,batter7_id_v,batter7_pos_v,batter8_name_v,batter8_id_v,batter8_pos_v,batter9_name_v,batter9_id_v,batter9_pos_v,batter1_name_h,batter1_id_h,batter1_pos_h,batter2_name_h,batter2_id_h,batter2_pos_h,batter3_name_h,batter3_id_h,batter3_pos_h,batter4_name_h,batter4_id_h,batter4_pos_h,batter5_name_h,batter5_id_h,batter5_pos_h,batter6_name_h,batter6_id_h,batter6_pos_h,batter7_name_h,batter7_id_h,batter7_pos_h,batter8_name_h,batter8_id_h,batter8_pos_h,batter9_name_h,batter9_id_h,batter9_pos_h,misc_info,acqui_info,season,run_diff,home_victory,run_total,date_dblhead,BATAVG_162_h,BATAVG_162_v,OBP_162_h,OBP_162_v,SLG_162_h,SLG_162_v,OBS_162_h,OBS_162_v,SB_162_h,SB_162_v,CS_162_h,CS_162_v,ERR_162_h,ERR_162_v,BATAVG_30_h,BATAVG_30_v,OBP_30_h,OBP_30_v,SLG_30_h,SLG_30_v,OBS_30_h,OBS_30_v,SB_30_h,SB_30_v,CS_30_h,CS_30_v,ERR_30_h,ERR_30_v,implied_prob_h,implied_prob_v,implied_prob_h_mid,over_under_line,over_under_result,IP_real_h,IP_real_v,rollsum_IP_real_10_h,rollsum_IP_real_10_v,rollsum_H_10_h,rollsum_H_10_v,rollsum_BFP_10_h,rollsum_BFP_10_v,rollsum_HR_10_h,rollsum_HR_10_v,rollsum_R_10_h,rollsum_R_10_v,rollsum_ER_10_h,rollsum_ER_10_v,rollsum_BB_10_h,rollsum_BB_10_v,rollsum_IB_10_h,rollsum_IB_10_v,rollsum_SO_10_h,rollsum_SO_10_v,rollsum_SH_10_h,rollsum_SH_10_v,rollsum_SF_10_h,rollsum_SF_10_v,rollsum_WP_10_h,rollsum_WP_10_v,rollsum_HBP_10_h,rollsum_HBP_10_v,rollsum_BK_10_h,rollsum_BK_10_v,rollsum_2B_10_h,rollsum_2B_10_v,rollsum_3B_10_h,rollsum_3B_10_v,rollsum_IP_real_35_h,rollsum_IP_real_35_v,rollsum_H_35_h,rollsum_H_35_v,rollsum_BFP_35_h,rollsum_BFP_35_v,rollsum_HR_35_h,rollsum_HR_35_v,rollsum_R_35_h,rollsum_R_35_v,rollsum_ER_35_h,rollsum_ER_35_v,rollsum_BB_35_h,rollsum_BB_35_v,rollsum_IB_35_h,rollsum_IB_35_v,rollsum_SO_35_h,rollsum_SO_35_v,rollsum_SH_35_h,rollsum_SH_35_v,rollsum_SF_35_h,rollsum_SF_35_v,rollsum_WP_35_h,rollsum_WP_35_v,rollsum_HBP_35_h,rollsum_HBP_35_v,rollsum_BK_35_h,rollsum_BK_35_v,rollsum_2B_35_h,rollsum_2B_35_v,rollsum_3B_35_h,rollsum_3B_35_v,H_BB_roll_10_h,H_BB_roll_10_v,XB_roll_10_h,XB_roll_10_v,TB_roll_10_h,TB_roll_10_v,IP_mod_10_h,IP_mod_10_v,BF_mod_10_h,BF_mod_10_v,ER_mod_10_h,ER_mod_10_v,H_BB_mod_10_h,H_BB_mod_10_v,H_BB_perc_10_h,H_BB_perc_10_v,SO_mod_10_h,SO_mod_10_v,TB_BB_mod_10_h,TB_BB_mod_10_v,ERA_10_h,ERA_10_v,WHIP_10_h,WHIP_10_v,SO_perc_10_h,SO_perc_10_v,TB_BB_perc_10_h,TB_BB_perc_10_v,H_BB_roll_35_h,H_BB_roll_35_v,XB_roll_35_h,XB_roll_35_v,TB_roll_35_h,TB_roll_35_v,IP_mod_35_h,IP_mod_35_v,BF_mod_35_h,BF_mod_35_v,ER_mod_35_h,ER_mod_35_v,H_BB_mod_35_h,H_BB_mod_35_v,H_BB_perc_35_h,H_BB_perc_35_v,SO_mod_35_h,SO_mod_35_v,TB_BB_mod_35_h,TB_BB_mod_35_v,ERA_35_h,ERA_35_v,WHIP_35_h,WHIP_35_v,SO_perc_35_h,SO_perc_35_v,TB_BB_perc_35_h,TB_BB_perc_35_v


In [38]:
df.reset_index(drop=True, inplace=True)

In [39]:
df.to_csv('df_bp5.csv', index=False)