In [1]:
# Seed for reproducible randomness; handed to `random_state` where rows are sampled
SEED = 42
import os
import glob
from joblib import Parallel, delayed
import pandas as pd
import numpy as np
import scipy as sc
from sklearn.model_selection import KFold, GroupKFold
import lightgbm as lgb
import warnings
from utils import get_feature_groups
import itertools
# Suppress every warning so library chatter does not clutter the cell output
warnings.filterwarnings('ignore')
# Use the fully-qualified option names. The abbreviated patterns 'max_columns' /
# 'max_rows' are matched as regexes against all registered options and, in newer
# pandas releases, also hit 'styler.render.max_columns' / 'styler.render.max_rows',
# which makes set_option raise OptionError ("Pattern matched multiple keys").
pd.set_option('display.max_columns', 300)
pd.set_option('display.max_rows', 300)

# Function to read our base train and test set
def read_train_test(data_dir='../input/optiver-realized-volatility-prediction'):
    """Load the base train and test tables and add a ``row_id`` merge key.

    Parameters
    ----------
    data_dir : str, optional
        Directory that contains ``train.csv`` and ``test.csv``. The default is
        the location the notebook originally hard-coded, so calling the
        function without arguments reads exactly the same files as before.

    Returns
    -------
    tuple of (pandas.DataFrame, pandas.DataFrame)
        ``(train, test)``, each with an extra string column ``row_id`` built as
        ``"<stock_id>-<time_id>"``.

    Notes
    -----
    Prints the number of rows in the training table as a side effect.
    """
    train = pd.read_csv(f'{data_dir}/train.csv')
    test = pd.read_csv(f'{data_dir}/test.csv')
    # Create a key to merge with book and trade data
    for frame in (train, test):
        frame['row_id'] = frame['stock_id'].astype(str) + '-' + frame['time_id'].astype(str)
    print(f'Our training set has {train.shape[0]} rows')
    return train, test

# Function to get group stats for the stock_id and time_id
def get_time_stock(df):
    """Append per-stock and per-time summary statistics of the volatility columns.

    For each realized-volatility column listed below, the mean, std, max, min
    and median are computed once per ``stock_id`` and once per ``time_id``.
    The resulting columns are named ``<column>_<stat>_stock`` and
    ``<column>_<stat>_time`` and are left-joined back onto the rows of ``df``.

    Parameters
    ----------
    df : pandas.DataFrame
        Must contain ``stock_id``, ``time_id`` and every column in ``vol_cols``.

    Returns
    -------
    pandas.DataFrame
        A new frame with the original columns followed by the stock-level and
        then the time-level statistics. ``df`` itself is not modified.
    """
    # Realized-volatility columns to summarise
    vol_cols = [
        'log_return1_realized_volatility',
        'log_return2_realized_volatility',
        'log_return1_realized_volatility_450',
        'log_return2_realized_volatility_450',
        'log_return1_realized_volatility_300',
        'log_return2_realized_volatility_300',
        'log_return1_realized_volatility_150',
        'log_return2_realized_volatility_150',
        'trade_log_return_realized_volatility',
        'trade_log_return_realized_volatility_450',
        'trade_log_return_realized_volatility_300',
        'trade_log_return_realized_volatility_150',
    ]

    def _summarise(key, tag):
        # Aggregate per `key`, flatten the two-level column index with '_' and tag every column
        stats = df.groupby([key])[vol_cols].agg(['mean', 'std', 'max', 'min', 'median']).reset_index()
        stats.columns = ['_'.join(parts) for parts in stats.columns]
        # The key column flattens to '<key>_' and therefore ends up as '<key>__<tag>'
        return stats.add_suffix('_' + tag)

    per_stock = _summarise('stock_id', 'stock')
    per_time = _summarise('time_id', 'time')

    # Attach stock-level statistics first, then time-level ones
    enriched = df.merge(per_stock, how = 'left', left_on = ['stock_id'], right_on = ['stock_id__stock'])
    enriched = enriched.merge(per_time, how = 'left', left_on = ['time_id'], right_on = ['time_id__time'])

    # The suffixed key columns only served as join keys
    return enriched.drop(['stock_id__stock', 'time_id__time'], axis = 1)

# Function to calculate the root mean squared percentage error
def rmspe(y_true, y_pred):
    """Return the root mean squared percentage error of ``y_pred`` against ``y_true``.

    Computed as ``sqrt(mean(((y_true - y_pred) / y_true) ** 2))``. The inputs
    must support element-wise subtraction and division (e.g. numpy arrays).
    No guard is applied for zeros in ``y_true``.
    """
    relative_error = (y_true - y_pred) / y_true
    mean_squared = np.mean(np.square(relative_error))
    return np.sqrt(mean_squared)

In [2]:
# Base training rows; the test frame returned alongside is not used in this cell
train, _ = read_train_test()

# Pre-computed order-book features, keyed by row_id
df_book = pd.read_csv('../input/processed-book-ffill/df_book.csv')
print(df_book.shape)

# Pre-computed trade features, keyed by row_id
df_trade = pd.read_csv('../input/processed-book-ffill/df_trade.csv')
print(df_trade.shape)

# Left joins keep every book row / every training row even when the right side has no match
train_ = pd.merge(df_book, df_trade, on = ['row_id'], how = 'left')
train = pd.merge(train, train_, on = ['row_id'], how = 'left')

# Get group stats of time_id and stock_id
train = get_time_stock(train)

# Natural log of the target, stored as an extra column
train['logtarget'] = train['target'].apply(np.log)

# Shuffle all rows reproducibly and renumber the index from zero
train = train.sample(frac=1, random_state=SEED).reset_index(drop=True)
train

Our training set has 428932 rows
(428932, 249)
(428913, 57)


Unnamed: 0,stock_id,time_id,target,row_id,wap1_sum,wap1_mean,wap1_std,wap1_median,wap1_kurtosis,wap1_skew,wap2_sum,wap2_mean,wap2_std,wap2_median,wap2_kurtosis,wap2_skew,log_return1_sum,log_return1_realized_volatility,log_return1_mean,log_return1_std,log_return1_median,log_return1_kurtosis,log_return1_skew,log_return2_sum,log_return2_realized_volatility,log_return2_mean,log_return2_std,log_return2_median,log_return2_kurtosis,log_return2_skew,wap_balance_sum,wap_balance_mean,wap_balance_std,wap_balance_median,wap_balance_kurtosis,wap_balance_skew,price_spread_sum,price_spread_mean,price_spread_std,price_spread_median,price_spread_kurtosis,price_spread_skew,bid_spread_sum,bid_spread_mean,bid_spread_std,bid_spread_median,bid_spread_kurtosis,bid_spread_skew,ask_spread_sum,ask_spread_mean,ask_spread_std,ask_spread_median,ask_spread_kurtosis,ask_spread_skew,total_volume_sum,total_volume_mean,total_volume_std,total_volume_median,total_volume_kurtosis,total_volume_skew,volume_imbalance_sum,volume_imbalance_mean,volume_imbalance_std,volume_imbalance_median,volume_imbalance_kurtosis,volume_imbalance_skew,wap1_sum_450,wap1_mean_450,wap1_std_450,wap1_median_450,wap1_kurtosis_450,wap1_skew_450,wap2_sum_450,wap2_mean_450,wap2_std_450,wap2_median_450,wap2_kurtosis_450,wap2_skew_450,log_return1_sum_450,log_return1_realized_volatility_450,log_return1_mean_450,log_return1_std_450,log_return1_median_450,log_return1_kurtosis_450,log_return1_skew_450,log_return2_sum_450,log_return2_realized_volatility_450,log_return2_mean_450,log_return2_std_450,log_return2_median_450,log_return2_kurtosis_450,log_return2_skew_450,wap_balance_sum_450,wap_balance_mean_450,wap_balance_std_450,wap_balance_median_450,wap_balance_kurtosis_450,wap_balance_skew_450,price_spread_sum_450,price_spread_mean_450,price_spread_std_450,price_spread_median_450,price_spread_kurtosis_450,price_spread_skew_450,bid_spread_sum_450,bid_spread_mean_450,bid_spread_std_450,bid_spread_median_450,bid_spread_kurtosis_450,bid_spread
_skew_450,ask_spread_sum_450,ask_spread_mean_450,ask_spread_std_450,ask_spread_median_450,ask_spread_kurtosis_450,ask_spread_skew_450,total_volume_sum_450,total_volume_mean_450,total_volume_std_450,total_volume_median_450,total_volume_kurtosis_450,total_volume_skew_450,volume_imbalance_sum_450,volume_imbalance_mean_450,volume_imbalance_std_450,volume_imbalance_median_450,volume_imbalance_kurtosis_450,volume_imbalance_skew_450,wap1_sum_300,wap1_mean_300,wap1_std_300,wap1_median_300,wap1_kurtosis_300,wap1_skew_300,wap2_sum_300,wap2_mean_300,wap2_std_300,wap2_median_300,wap2_kurtosis_300,wap2_skew_300,log_return1_sum_300,log_return1_realized_volatility_300,log_return1_mean_300,log_return1_std_300,log_return1_median_300,log_return1_kurtosis_300,log_return1_skew_300,log_return2_sum_300,log_return2_realized_volatility_300,log_return2_mean_300,...,trade_order_count_skew_450,trade_log_return_realized_volatility_300,trade_seconds_in_bucket_count_unique_300,trade_size_mean_300,trade_size_median_300,trade_size_std_300,trade_size_sum_300,trade_size_kurtosis_300,trade_size_skew_300,trade_order_count_mean_300,trade_order_count_median_300,trade_order_count_std_300,trade_order_count_sum_300,trade_order_count_kurtosis_300,trade_order_count_skew_300,trade_log_return_realized_volatility_150,trade_seconds_in_bucket_count_unique_150,trade_size_mean_150,trade_size_median_150,trade_size_std_150,trade_size_sum_150,trade_size_kurtosis_150,trade_size_skew_150,trade_order_count_mean_150,trade_order_count_median_150,trade_order_count_std_150,trade_order_count_sum_150,trade_order_count_kurtosis_150,trade_order_count_skew_150,log_return1_realized_volatility_mean_stock,log_return1_realized_volatility_std_stock,log_return1_realized_volatility_max_stock,log_return1_realized_volatility_min_stock,log_return1_realized_volatility_median_stock,log_return2_realized_volatility_mean_stock,log_return2_realized_volatility_std_stock,log_return2_realized_volatility_max_stock,log_return2_realized_volatility_min
_stock,log_return2_realized_volatility_median_stock,log_return1_realized_volatility_450_mean_stock,log_return1_realized_volatility_450_std_stock,log_return1_realized_volatility_450_max_stock,log_return1_realized_volatility_450_min_stock,log_return1_realized_volatility_450_median_stock,log_return2_realized_volatility_450_mean_stock,log_return2_realized_volatility_450_std_stock,log_return2_realized_volatility_450_max_stock,log_return2_realized_volatility_450_min_stock,log_return2_realized_volatility_450_median_stock,log_return1_realized_volatility_300_mean_stock,log_return1_realized_volatility_300_std_stock,log_return1_realized_volatility_300_max_stock,log_return1_realized_volatility_300_min_stock,log_return1_realized_volatility_300_median_stock,log_return2_realized_volatility_300_mean_stock,log_return2_realized_volatility_300_std_stock,log_return2_realized_volatility_300_max_stock,log_return2_realized_volatility_300_min_stock,log_return2_realized_volatility_300_median_stock,log_return1_realized_volatility_150_mean_stock,log_return1_realized_volatility_150_std_stock,log_return1_realized_volatility_150_max_stock,log_return1_realized_volatility_150_min_stock,log_return1_realized_volatility_150_median_stock,log_return2_realized_volatility_150_mean_stock,log_return2_realized_volatility_150_std_stock,log_return2_realized_volatility_150_max_stock,log_return2_realized_volatility_150_min_stock,log_return2_realized_volatility_150_median_stock,trade_log_return_realized_volatility_mean_stock,trade_log_return_realized_volatility_std_stock,trade_log_return_realized_volatility_max_stock,trade_log_return_realized_volatility_min_stock,trade_log_return_realized_volatility_median_stock,trade_log_return_realized_volatility_450_mean_stock,trade_log_return_realized_volatility_450_std_stock,trade_log_return_realized_volatility_450_max_stock,trade_log_return_realized_volatility_450_min_stock,trade_log_return_realized_volatility_450_median_stock,trade_log_return_realized_volatility_300_mean_
stock,trade_log_return_realized_volatility_300_std_stock,trade_log_return_realized_volatility_300_max_stock,trade_log_return_realized_volatility_300_min_stock,trade_log_return_realized_volatility_300_median_stock,trade_log_return_realized_volatility_150_mean_stock,trade_log_return_realized_volatility_150_std_stock,trade_log_return_realized_volatility_150_max_stock,trade_log_return_realized_volatility_150_min_stock,trade_log_return_realized_volatility_150_median_stock,log_return1_realized_volatility_mean_time,log_return1_realized_volatility_std_time,log_return1_realized_volatility_max_time,log_return1_realized_volatility_min_time,log_return1_realized_volatility_median_time,log_return2_realized_volatility_mean_time,log_return2_realized_volatility_std_time,log_return2_realized_volatility_max_time,log_return2_realized_volatility_min_time,log_return2_realized_volatility_median_time,log_return1_realized_volatility_450_mean_time,log_return1_realized_volatility_450_std_time,log_return1_realized_volatility_450_max_time,log_return1_realized_volatility_450_min_time,log_return1_realized_volatility_450_median_time,log_return2_realized_volatility_450_mean_time,log_return2_realized_volatility_450_std_time,log_return2_realized_volatility_450_max_time,log_return2_realized_volatility_450_min_time,log_return2_realized_volatility_450_median_time,log_return1_realized_volatility_300_mean_time,log_return1_realized_volatility_300_std_time,log_return1_realized_volatility_300_max_time,log_return1_realized_volatility_300_min_time,log_return1_realized_volatility_300_median_time,log_return2_realized_volatility_300_mean_time,log_return2_realized_volatility_300_std_time,log_return2_realized_volatility_300_max_time,log_return2_realized_volatility_300_min_time,log_return2_realized_volatility_300_median_time,log_return1_realized_volatility_150_mean_time,log_return1_realized_volatility_150_std_time,log_return1_realized_volatility_150_max_time,log_return1_realized_volatility_150_min_time,log_return1_r
ealized_volatility_150_median_time,log_return2_realized_volatility_150_mean_time,log_return2_realized_volatility_150_std_time,log_return2_realized_volatility_150_max_time,log_return2_realized_volatility_150_min_time,log_return2_realized_volatility_150_median_time,trade_log_return_realized_volatility_mean_time,trade_log_return_realized_volatility_std_time,trade_log_return_realized_volatility_max_time,trade_log_return_realized_volatility_min_time,trade_log_return_realized_volatility_median_time,trade_log_return_realized_volatility_450_mean_time,trade_log_return_realized_volatility_450_std_time,trade_log_return_realized_volatility_450_max_time,trade_log_return_realized_volatility_450_min_time,trade_log_return_realized_volatility_450_median_time,trade_log_return_realized_volatility_300_mean_time,trade_log_return_realized_volatility_300_std_time,trade_log_return_realized_volatility_300_max_time,trade_log_return_realized_volatility_300_min_time,trade_log_return_realized_volatility_300_median_time,trade_log_return_realized_volatility_150_mean_time,trade_log_return_realized_volatility_150_std_time,trade_log_return_realized_volatility_150_max_time,trade_log_return_realized_volatility_150_min_time,trade_log_return_realized_volatility_150_median_time,logtarget
0,16,9787,0.005983,16-9787,600.47920,1.000799,0.001474,1.001224,-0.717402,-0.603572,600.47980,1.000800,0.001451,1.000853,-0.882724,-0.349390,3.412304e-03,0.007143,5.696667e-06,0.000292,0.0,,,0.002679,0.009541,4.473089e-06,0.000390,0.0,,,0.301854,0.000503,0.000389,0.000380,2.062880,1.293203,0.766263,0.001277,3.961763e-04,0.001222,0.925953,0.845613,0.206112,0.000344,3.413202e-04,0.000102,1.441881,1.509628,-0.208047,-0.000347,2.339496e-04,-0.000306,-0.156370,-0.820018,205938,343.230000,125.163414,343.5,0.607534,0.543676,50934,84.890000,80.327489,61.0,3.835718,1.729536,150.23227,1.001548,0.000609,1.001588,-0.847361,-0.444916,150.22621,1.001508,0.000777,1.001582,-0.894796,-0.411312,-0.000668,0.002511,-0.000004,0.000206,0.000000,6.436289,-0.281597,-0.001603,0.004331,-1.068959e-05,0.000355,0.0,4.667474,-0.290491,0.059297,0.000395,0.000262,0.000321,0.243205,0.865057,0.157611,0.001051,2.933580e-04,0.001019,0.132544,0.568622,0.042936,0.000286,3.438091e-04,0.000102,5.126406,2.409755,-0.061496,-0.000410,2.819893e-04,-0.000408,-0.649802,-0.717176,54328,362.186667,101.039589,376.5,0.302431,0.010579,13944,92.960000,80.218149,68.0,1.277626,1.202210,300.06528,1.000218,0.001532,1.000459,-1.268572,-0.211921,300.09310,1.000310,0.001450,1.000318,-1.165923,-0.071340,0.001536,0.004749,5.118334e-06,0.000275,0.0,11.945170,0.890162,0.001796,0.007158,5.988251e-06,...,0.875830,0.002793,21.0,133.285714,100.0,129.576673,2799.0,2.596872,1.674181,2.476190,2.0,1.965173,52.0,3.727907,1.859149,0.003539,31.0,116.032258,100.0,115.595987,3597.0,3.979935,1.846557,2.290323,2.0,1.773763,71.0,4.537075,1.918866,0.004612,0.003989,0.054206,0.000541,0.003416,0.006776,0.005683,0.094116,0.000949,0.005156,0.002079,0.001809,0.031666,0.000039,0.001561,0.003016,0.002335,0.035454,0.000000,0.002393,0.003059,0.002609,0.044278,0.000356,0.002311,0.004432,0.003394,0.054119,0.000547,0.003515,0.003853,0.003236,0.052743,0.000404,0.002905,0.005609,0.004375,0.066829,0.000796,0.004370,0.002533,0.001900,0.030371,0.000335,0.001972
,0.001180,0.000938,0.020232,0.000000,0.000924,0.001746,0.001333,0.023597,0.000143,0.001370,0.002185,0.001642,0.026871,0.000024,0.001703,0.006039,0.002132,0.013142,0.002440,0.005639,0.008308,0.003377,0.017820,0.002770,0.007545,0.002739,0.001128,0.008007,0.000805,0.002543,0.003962,0.002027,0.013407,0.001198,0.003420,0.004215,0.001588,0.011059,0.001270,0.004037,0.005889,0.002655,0.015861,0.001820,0.005391,0.005294,0.001917,0.012067,0.002230,0.005023,0.007287,0.003069,0.016192,0.002477,0.006576,0.003645,0.000970,0.007297,0.001789,0.003490,0.001548,0.000587,0.004070,0.000294,0.001452,0.002483,0.000756,0.004954,0.001089,0.002451,0.003181,0.000859,0.006486,0.001580,0.003066,-5.118799
1,105,5773,0.002415,105-5773,600.64197,1.001070,0.000766,1.000880,-1.233713,0.323047,600.63720,1.001062,0.000767,1.000869,-1.133407,0.331394,9.610265e-04,0.002404,1.604385e-06,0.000098,0.0,,,0.000862,0.002987,1.439038e-06,0.000122,0.0,,,0.037653,0.000063,0.000045,0.000059,0.576712,0.846452,0.136220,0.000227,2.992114e-05,0.000223,49.560348,7.180402,0.133913,0.000223,4.916321e-08,0.000223,-0.370451,1.242778,-0.133915,-0.000223,5.276032e-08,-0.000223,-0.886907,-1.054903,1345594,2242.656667,355.292645,2261.5,0.475379,0.001115,249858,416.430000,301.443309,397.5,-0.322840,0.590491,150.27628,1.001842,0.000232,1.001783,-0.031354,0.303419,150.26897,1.001793,0.000239,1.001701,0.372317,0.801643,-0.001076,0.000935,-0.000007,0.000076,0.000000,5.587417,-0.690410,-0.001014,0.000984,-6.759636e-06,0.000080,0.0,6.698305,-0.836391,0.009523,0.000063,0.000037,0.000064,0.125605,0.552536,0.034974,0.000233,4.717714e-05,0.000223,16.477516,4.298544,0.033477,0.000223,4.723490e-08,0.000223,0.411674,1.552891,-0.033479,-0.000223,5.370415e-08,-0.000223,-1.039938,-0.979762,365155,2434.366667,331.188817,2402.5,0.790279,0.705171,94345,628.966667,315.955596,658.5,-0.750892,0.054617,300.50732,1.001691,0.000554,1.001777,-0.402539,-0.638434,300.50260,1.001675,0.000565,1.001686,-0.251925,-0.564191,0.000965,0.001549,3.217323e-06,0.000090,0.0,4.172035,0.061218,0.001028,0.002124,3.428133e-06,...,1.111111,0.001400,42.0,178.166667,119.5,163.577224,7483.0,1.406003,1.400625,2.642857,2.0,2.228654,111.0,9.374648,2.732078,0.001684,68.0,184.926471,104.5,165.604124,12575.0,0.464508,1.153667,2.676471,2.0,2.235675,182.0,5.729440,2.106316,0.002903,0.002619,0.046933,0.000416,0.002131,0.003796,0.003375,0.062174,0.000605,0.002765,0.001340,0.001094,0.014084,0.000057,0.001025,0.001747,0.001415,0.018163,0.000045,0.001333,0.001941,0.001567,0.024346,0.000200,0.001462,0.002533,0.002039,0.034762,0.000154,0.001927,0.002428,0.002012,0.035214,0.000367,0.001816,0.003174,0.002619,0.044624,0.000400,0.002363,0.002252,0.001882,0.028099,
0.000292,0.001659,0.001057,0.000856,0.012821,0.000000,0.000814,0.001533,0.001210,0.017172,0.000000,0.001164,0.001915,0.001528,0.022168,0.000206,0.001439,0.003812,0.001515,0.008950,0.001842,0.003445,0.005569,0.002612,0.015949,0.002197,0.004947,0.001800,0.000757,0.004375,0.000912,0.001592,0.002656,0.001331,0.007022,0.000816,0.002192,0.002618,0.001056,0.006323,0.001220,0.002515,0.003834,0.001907,0.013032,0.001509,0.003281,0.003262,0.001305,0.007827,0.001638,0.002965,0.004800,0.002281,0.014448,0.001934,0.004258,0.002515,0.000834,0.006272,0.001413,0.002284,0.001176,0.000500,0.003769,0.000000,0.001091,0.001704,0.000593,0.004029,0.000843,0.001570,0.002196,0.000715,0.005209,0.001141,0.002004,-6.026106
2,58,22076,0.002863,58-22076,598.30756,0.997179,0.000907,0.996946,-0.797297,0.444533,598.41360,0.997356,0.000832,0.997271,-0.877343,0.045016,-2.216200e-03,0.002623,-3.699834e-06,0.000107,0.0,,,-0.002213,0.004488,-3.694307e-06,0.000183,0.0,,,0.214987,0.000358,0.000263,0.000281,0.932617,0.957359,0.429021,0.000715,2.510883e-04,0.000681,0.978536,1.128808,0.078867,0.000131,8.000458e-05,0.000097,4.615472,2.372039,-0.202357,-0.000337,2.384041e-04,-0.000291,-0.752067,-0.602195,276551,460.918333,185.923068,430.0,2.135823,0.947047,81439,135.731667,144.914780,95.0,4.092933,1.846135,149.43927,0.996262,0.000364,0.996238,-0.036891,0.196912,149.47705,0.996514,0.000483,0.996605,0.226860,-0.331357,-0.000479,0.001350,-0.000003,0.000111,0.000000,10.684832,-0.017438,-0.000676,0.003176,-4.509830e-06,0.000260,0.0,12.436074,0.252570,0.052095,0.000347,0.000276,0.000237,3.080923,1.566382,0.094242,0.000628,2.469873e-04,0.000584,3.201331,1.523856,0.018627,0.000124,5.852864e-05,0.000097,5.625292,2.365393,-0.073240,-0.000488,2.536689e-04,-0.000582,-1.024049,-0.196268,73626,490.840000,140.650220,508.0,-0.752033,-0.029702,25184,167.893333,155.208937,96.0,-0.640518,0.707922,298.93270,0.996442,0.000369,0.996369,-0.500712,-0.288098,299.01505,0.996717,0.000500,0.996605,0.224923,-0.131212,-0.001064,0.001750,-3.547048e-06,0.000101,0.0,12.111864,0.213879,-0.001163,0.003562,-3.876705e-06,...,1.011806,0.001050,14.0,168.714286,113.5,168.786815,2362.0,3.079798,1.926442,3.714286,4.0,2.524604,52.0,0.685208,0.988960,0.001286,19.0,167.631579,113.0,167.329087,3185.0,1.856015,1.508271,3.947368,4.0,3.045464,75.0,-0.404448,0.875708,0.004224,0.003572,0.041124,0.000373,0.003158,0.006102,0.005002,0.067929,0.000493,0.004704,0.001929,0.001585,0.020951,0.000125,0.001482,0.002807,0.002198,0.022311,0.000197,0.002169,0.002831,0.002277,0.023949,0.000232,0.002168,0.004104,0.003169,0.029909,0.000403,0.003190,0.003555,0.002924,0.035527,0.000323,0.002710,0.005138,0.004028,0.043294,0.000455,0.003984,0.002628,0.002023,0.021194,0.0
00394,0.002060,0.001233,0.000984,0.014402,0.000000,0.000968,0.001807,0.001396,0.018886,0.000248,0.001425,0.002261,0.001729,0.019871,0.000355,0.001784,0.002035,0.001872,0.018706,0.000503,0.001735,0.002879,0.002309,0.020866,0.000553,0.002457,0.001050,0.001474,0.015257,0.000192,0.000786,0.001375,0.001559,0.015508,0.000198,0.001054,0.001474,0.001654,0.016968,0.000296,0.001188,0.002035,0.001992,0.019575,0.000365,0.001655,0.001774,0.001698,0.017135,0.000401,0.001470,0.002498,0.002108,0.020027,0.000470,0.002108,0.001165,0.000610,0.004684,0.000407,0.000997,0.000591,0.000381,0.002469,0.000138,0.000500,0.000838,0.000478,0.003798,0.000237,0.000727,0.001039,0.000544,0.004101,0.000335,0.000903,-5.855742
3,77,5817,0.005279,77-5817,601.05817,1.001764,0.002921,1.001746,-0.907996,-0.267860,601.09640,1.001827,0.002950,1.001847,-0.921080,-0.240119,3.857260e-03,0.006993,6.439499e-06,0.000286,0.0,,,0.003651,0.009757,6.094700e-06,0.000399,0.0,,,0.126732,0.000211,0.000145,0.000183,-0.508057,0.594553,0.243257,0.000405,9.510022e-05,0.000380,10.070632,3.473891,0.228444,0.000381,3.469868e-08,0.000381,3.432172,-2.187528,-0.228436,-0.000381,4.818484e-08,-0.000381,-0.308955,1.244469,2227382,3712.303333,960.696486,3510.5,3.223581,1.391724,503860,839.766667,738.489271,700.0,4.493070,1.811369,150.06807,1.000454,0.000727,1.000512,0.089949,-0.548133,150.06671,1.000445,0.000898,1.000448,-0.049675,-0.487789,0.000180,0.003105,0.000001,0.000254,0.000006,4.411888,-0.860237,-0.000076,0.005661,-5.054132e-07,0.000464,0.0,1.853950,-0.298721,0.035303,0.000235,0.000157,0.000186,-0.923424,0.510255,0.060510,0.000403,9.066640e-05,0.000381,11.730264,3.705408,0.057111,0.000381,3.302441e-08,0.000381,4.560014,-2.422400,-0.057109,-0.000381,5.061392e-08,-0.000381,-0.710823,1.092016,560983,3739.886667,798.023267,3700.0,-0.422332,0.374290,104961,699.740000,589.194108,500.0,2.990411,1.511708,300.67102,1.002237,0.002305,1.001224,-1.239833,0.507073,300.66970,1.002232,0.002362,1.001224,-1.138022,0.449436,-0.005484,0.005275,-1.827947e-05,0.000305,0.0,6.844016,-1.428839,-0.005791,0.007743,-1.930346e-05,...,5.594599,0.004610,112.0,682.857143,300.0,1172.768495,76480.0,44.339770,5.877816,4.437500,3.0,6.513716,497.0,46.139530,6.011767,0.005418,151.0,624.788079,300.0,1039.558513,94343.0,55.070991,6.415324,4.145695,3.0,5.706601,626.0,59.961417,6.749943,0.003366,0.002558,0.035552,0.000700,0.002649,0.004712,0.003120,0.042911,0.001081,0.003910,0.001614,0.001287,0.026178,0.000064,0.001293,0.002272,0.001577,0.031902,0.000011,0.001919,0.002320,0.001804,0.034769,0.000252,0.001853,0.003260,0.002180,0.041658,0.000414,0.002721,0.002877,0.002206,0.035307,0.000614,0.002284,0.004037,0.002690,0.042607,0.000827,0.003368,0.002755,0.002
188,0.026274,0.000000,0.002100,0.001314,0.001091,0.017820,0.000000,0.001036,0.001898,0.001536,0.025383,0.000000,0.001469,0.002362,0.001880,0.026047,0.000000,0.001823,0.009777,0.004200,0.024979,0.003297,0.008878,0.013158,0.006552,0.038566,0.003549,0.011594,0.005003,0.002328,0.015763,0.001717,0.004437,0.006671,0.004012,0.028888,0.001896,0.005535,0.006854,0.003120,0.018998,0.002273,0.006056,0.009058,0.004685,0.031326,0.002470,0.007990,0.008396,0.003615,0.021787,0.002864,0.007503,0.011277,0.005539,0.033449,0.003090,0.010024,0.006122,0.001858,0.013466,0.003014,0.005873,0.003191,0.001223,0.009058,0.001113,0.003018,0.004393,0.001471,0.009818,0.001796,0.004206,0.005367,0.001700,0.011079,0.002390,0.005120,-5.243951
4,56,14572,0.002328,56-14572,598.78840,0.997981,0.000927,0.997882,-0.857376,0.054103,598.76544,0.997942,0.000961,0.997819,-1.026107,0.042450,-1.671476e-03,0.002564,-2.790444e-06,0.000105,0.0,,,-0.001691,0.003622,-2.823096e-06,0.000148,0.0,,,0.074003,0.000123,0.000095,0.000108,0.736676,0.928654,0.166596,0.000278,8.049258e-05,0.000261,1.190128,0.916931,0.042784,0.000071,6.605039e-05,0.000043,2.095133,1.583203,-0.048897,-0.000081,6.813075e-05,-0.000065,1.772496,-1.348820,201007,335.011667,156.600216,321.0,4.624120,1.524437,72007,120.011667,94.411798,99.0,1.640380,1.094121,149.60847,0.997390,0.000361,0.997394,-0.748833,0.079546,149.59203,0.997280,0.000412,0.997257,-0.802039,0.046661,0.001371,0.001495,0.000009,0.000122,0.000000,4.755705,-0.607413,0.001544,0.002001,1.029398e-05,0.000164,0.0,3.500741,-0.087984,0.022062,0.000147,0.000112,0.000138,0.666570,0.927687,0.043701,0.000291,9.093613e-05,0.000282,0.895255,0.809980,0.018575,0.000124,8.508687e-05,0.000087,-0.565675,0.616885,-0.009558,-0.000064,6.090475e-05,-0.000043,4.533438,-1.915580,48883,325.886667,116.885967,321.0,-0.915541,0.050118,14875,99.166667,81.427731,96.5,2.685287,1.385483,299.17014,0.997234,0.000510,0.997321,-0.380009,-0.402873,299.14703,0.997157,0.000513,0.997187,-0.593481,-0.266779,0.000498,0.002086,1.661003e-06,0.000121,0.0,3.145998,-0.198122,0.000439,0.003080,1.461875e-06,...,1.056036,0.001192,101.0,97.594059,100.0,116.953852,9857.0,21.986562,3.694020,2.950495,2.0,5.534214,298.0,76.091345,8.395677,0.001373,123.0,94.666667,97.0,117.439881,11644.0,19.116359,3.486713,2.991870,2.0,5.193779,368.0,80.399622,8.401031,0.004845,0.002790,0.030041,0.000988,0.004028,0.006085,0.003376,0.037915,0.001576,0.005096,0.002321,0.001305,0.011015,0.000308,0.001975,0.002918,0.001580,0.018216,0.000562,0.002488,0.003318,0.001850,0.019398,0.000627,0.002793,0.004174,0.002240,0.025303,0.000967,0.003548,0.004125,0.002332,0.026912,0.000823,0.003439,0.005185,0.002822,0.034495,0.001291,0.004373,0.003389,0.002171,0.020474,0.000686,0.0
02687,0.001620,0.001017,0.008734,0.000231,0.001312,0.002324,0.001445,0.013968,0.000461,0.001865,0.002892,0.001817,0.019497,0.000608,0.002310,0.001889,0.000964,0.006077,0.000576,0.001648,0.002897,0.001591,0.008706,0.000714,0.002395,0.000907,0.000507,0.002648,0.000203,0.000752,0.001394,0.000904,0.006202,0.000018,0.001085,0.001300,0.000626,0.002994,0.000260,0.001122,0.002006,0.001147,0.006834,0.000067,0.001633,0.001625,0.000805,0.004466,0.000288,0.001443,0.002479,0.001403,0.008010,0.000070,0.002047,0.001267,0.000550,0.003294,0.000000,0.001189,0.000620,0.000313,0.001484,0.000128,0.000568,0.000915,0.000401,0.002313,0.000221,0.000834,0.001135,0.000482,0.002866,0.000348,0.001030,-6.062848
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
428927,76,21439,0.002647,76-21439,600.85600,1.001427,0.000982,1.001238,-0.258683,0.731784,600.83440,1.001391,0.000968,1.001338,-0.213067,0.673776,2.942843e-03,0.003456,4.912926e-06,0.000141,0.0,,,0.003319,0.004683,5.540259e-06,0.000191,0.0,,,0.097441,0.000162,0.000117,0.000146,0.169890,0.773545,0.213385,0.000356,1.394403e-04,0.000345,2.980784,1.457641,0.104993,0.000175,1.198182e-04,0.000148,0.169257,0.922909,-0.122059,-0.000203,1.454425e-04,-0.000198,0.189370,-0.909727,319671,532.785000,188.145076,501.0,0.121759,0.594470,108369,180.615000,120.773592,169.0,0.790040,0.794638,150.42587,1.002839,0.000632,1.002918,-0.722024,-0.636665,150.41370,1.002758,0.000646,1.002840,-0.753161,-0.656653,0.001639,0.001829,0.000011,0.000149,0.000000,5.145311,0.106764,0.001876,0.002308,1.250727e-05,0.000189,0.0,7.812954,0.849945,0.022604,0.000151,0.000116,0.000123,0.427302,0.968552,0.054624,0.000364,1.195822e-04,0.000345,1.063059,0.839058,0.028350,0.000189,1.403048e-04,0.000148,-0.196668,0.828519,-0.024490,-0.000163,1.056552e-04,-0.000198,0.918211,-0.899916,96118,640.786667,204.102277,600.0,-0.581358,0.515835,29646,197.640000,141.300018,171.0,0.224662,0.776403,300.64368,1.002146,0.000847,1.001750,-1.233605,0.413047,300.62393,1.002080,0.000841,1.001654,-1.212862,0.410087,0.002298,0.002261,7.660316e-06,0.000131,0.0,5.582712,0.031058,0.002537,0.002880,8.455152e-06,...,1.202575,0.001431,41.0,143.487805,100.0,141.423499,5883.0,1.546696,1.434326,2.707317,2.0,2.347806,111.0,2.454038,1.718382,0.001656,61.0,123.098361,100.0,128.331953,7509.0,2.506649,1.565703,2.557377,2.0,2.061752,156.0,3.676636,1.861792,0.004540,0.003100,0.038771,0.000880,0.003643,0.005778,0.003884,0.055342,0.001048,0.004723,0.002154,0.001408,0.017263,0.000338,0.001766,0.002754,0.001732,0.022490,0.000381,0.002320,0.003093,0.002034,0.025409,0.000497,0.002536,0.003952,0.002546,0.036109,0.000560,0.003305,0.003847,0.002545,0.030346,0.000648,0.003119,0.004908,0.003188,0.047050,0.000764,0.004065,0.002735,0.001948,0.022090,0.000485,0.0
02136,0.001303,0.000939,0.014751,0.000154,0.001020,0.001871,0.001312,0.019345,0.000287,0.001474,0.002336,0.001648,0.019607,0.000453,0.001842,0.002818,0.001335,0.007531,0.000284,0.002492,0.004039,0.002142,0.011330,0.000068,0.003553,0.001380,0.000721,0.004571,0.000158,0.001195,0.002009,0.001109,0.007004,0.000061,0.001671,0.001969,0.001024,0.006053,0.000174,0.001695,0.002815,0.001572,0.008584,0.000062,0.002383,0.002403,0.001156,0.006412,0.000234,0.002181,0.003446,0.001866,0.010201,0.000063,0.002935,0.001909,0.000811,0.004795,0.000650,0.001692,0.000981,0.000478,0.002818,0.000000,0.000866,0.001346,0.000629,0.003775,0.000000,0.001217,0.001646,0.000698,0.004178,0.000520,0.001442,-5.934183
428928,108,16733,0.001089,108-16733,599.87500,0.999792,0.000372,0.999724,-1.149882,-0.009472,599.80200,0.999670,0.000471,0.999634,-0.811869,0.019223,-1.170027e-03,0.001024,-1.953301e-06,0.000042,0.0,,,-0.001522,0.001667,-2.540422e-06,0.000068,0.0,,,0.098845,0.000165,0.000118,0.000126,-1.116643,0.458715,0.244101,0.000407,1.585902e-07,0.000407,-0.943112,-0.045696,0.244052,0.000407,2.316365e-08,0.000407,0.631420,1.622014,-0.244045,-0.000407,0.000000e+00,-0.000407,-3.000000,0.000000,14477849,24129.748333,2932.225114,23654.0,-0.028096,0.433493,2080539,3467.565000,2420.802655,3165.5,0.448897,0.781153,149.93121,0.999541,0.000154,0.999547,-0.124166,-0.734934,149.92207,0.999481,0.000248,0.999576,0.920982,-1.688973,-0.000289,0.000406,-0.000002,0.000033,0.000000,11.326935,-1.186579,-0.000653,0.000614,-4.350038e-06,0.000050,0.0,141.634582,-11.914139,0.017084,0.000114,0.000105,0.000086,1.017301,1.487177,0.061040,0.000407,6.290679e-08,0.000407,0.977114,1.725171,0.061013,0.000407,2.263804e-08,0.000407,0.978790,1.725900,-0.061011,-0.000407,0.000000e+00,-0.000407,-3.000000,0.000000,3705074,24700.493333,1749.543725,24668.5,-0.885320,-0.045490,593902,3959.346667,1983.670031,3574.0,-0.737909,0.258339,299.85287,0.999510,0.000253,0.999528,0.158565,0.744103,299.81332,0.999378,0.000357,0.999572,-1.226197,0.009576,-0.000916,0.000812,-3.054283e-06,0.000047,0.0,54.435214,-4.249926,-0.001098,0.001236,-3.660867e-06,...,0.079174,0.000910,9.0,1340.444444,233.0,1554.064036,12064.0,-1.398534,0.533336,7.111111,7.0,5.710614,64.0,-1.711915,0.084025,0.000997,12.0,1419.583333,525.0,1573.548766,17035.0,-1.336899,0.602476,7.666667,9.0,5.532274,92.0,-1.711585,-0.072278,0.003337,0.002545,0.035924,0.000368,0.002642,0.004335,0.003075,0.038709,0.000376,0.003548,0.001568,0.001191,0.017611,0.000062,0.001274,0.002023,0.001410,0.018896,0.000031,0.001705,0.002261,0.001660,0.022615,0.000261,0.001824,0.002926,0.001957,0.024179,0.000081,0.002458,0.002820,0.002097,0.029733,0.000319,0.002260,0.003658,0.002491,0.032411,0
.000113,0.003030,0.002683,0.002127,0.027750,0.000208,0.002072,0.001259,0.001024,0.015276,0.000000,0.000998,0.001826,0.001420,0.020301,0.000000,0.001436,0.002284,0.001775,0.024155,0.000000,0.001780,0.001949,0.001015,0.007754,0.000115,0.001798,0.002858,0.001561,0.010666,0.000008,0.002547,0.000901,0.000463,0.002852,0.000075,0.000811,0.001314,0.000737,0.003958,0.000002,0.001102,0.001298,0.000639,0.004554,0.000080,0.001186,0.001904,0.001077,0.007826,0.000003,0.001551,0.001633,0.000869,0.006988,0.000088,0.001503,0.002394,0.001340,0.009858,0.000008,0.002068,0.001322,0.000531,0.003180,0.000000,0.001261,0.000622,0.000273,0.001351,0.000000,0.000579,0.000877,0.000352,0.002123,0.000000,0.000857,0.001113,0.000443,0.002451,0.000000,0.001026,-6.822463
428929,37,14273,0.002531,37-14273,601.11096,1.001852,0.000367,1.001833,0.624756,1.055845,601.35460,1.002258,0.000556,1.002294,-0.976299,-0.146546,-1.316365e-03,0.002124,-2.197604e-06,0.000087,0.0,,,0.000596,0.005234,9.953217e-07,0.000214,0.0,,,0.404903,0.000675,0.000359,0.000584,-0.233344,0.428476,0.765416,0.001276,3.093680e-04,0.001303,-1.447699,-0.091916,0.093891,0.000156,1.623810e-04,0.000030,-1.662358,0.491494,-0.036006,-0.000060,1.071243e-04,-0.000006,2.064486,-1.846837,103454,172.423333,100.354185,125.5,-0.980879,0.182233,47972,79.953333,61.444013,89.0,2.488920,1.288776,150.27243,1.001816,0.000176,1.001920,-0.110227,-0.487537,150.35689,1.002379,0.000251,1.002554,1.989640,-1.451404,-0.000238,0.001060,-0.000002,0.000087,0.000000,30.835999,-2.929819,-0.000248,0.001680,-1.655800e-06,0.000138,0.0,46.323563,-0.219829,0.089504,0.000597,0.000148,0.000634,4.806844,-1.734691,0.140031,0.000934,1.211388e-04,0.000877,0.552668,1.508953,0.044171,0.000294,1.026674e-04,0.000338,2.707623,-2.134799,-0.017555,-0.000117,1.033026e-04,-0.000214,-1.980851,0.134039,9660,64.400000,51.013618,16.0,-1.926529,0.115360,6910,46.066667,42.313573,6.0,-1.950850,0.118561,300.50052,1.001668,0.000206,1.001709,-1.047710,0.447769,300.65912,1.002197,0.000318,1.002294,0.190176,-0.758860,-0.000041,0.001089,-1.364900e-07,0.000063,0.0,58.774581,-3.711293,-0.000411,0.002053,-1.369017e-06,...,0.000000,0.000884,2.0,19.000000,19.0,25.455844,38.0,-2.000000,0.000000,1.500000,1.5,0.707107,3.0,-2.000000,0.000000,0.000884,2.0,19.000000,19.0,25.455844,38.0,-2.000000,0.000000,1.500000,1.5,0.707107,3.0,-2.000000,0.000000,0.007163,0.004996,0.053782,0.000603,0.005614,0.009888,0.007433,0.096552,0.000927,0.007564,0.003281,0.002495,0.034143,0.000000,0.002588,0.004529,0.003564,0.046615,0.000000,0.003491,0.004827,0.003404,0.042128,0.000000,0.003835,0.006654,0.004968,0.064391,0.000248,0.005171,0.006061,0.004196,0.044557,0.000458,0.004740,0.008354,0.006137,0.068750,0.000572,0.006446,0.003000,0.002200,0.041908,0.000000,0.0023
86,0.001409,0.001079,0.011524,0.000000,0.001149,0.002076,0.001536,0.028799,0.000000,0.001673,0.002614,0.001863,0.029389,0.000000,0.002122,0.002076,0.000836,0.004408,0.000767,0.001833,0.003012,0.001376,0.007255,0.000411,0.002610,0.001016,0.000454,0.002424,0.000245,0.000888,0.001463,0.000757,0.004608,0.000005,0.001290,0.001439,0.000609,0.003302,0.000519,0.001245,0.002101,0.001045,0.005407,0.000052,0.001750,0.001787,0.000754,0.003910,0.000629,0.001564,0.002585,0.001225,0.006322,0.000090,0.002270,0.001414,0.000568,0.003279,0.000000,0.001259,0.000712,0.000352,0.001986,0.000000,0.000645,0.000989,0.000426,0.002689,0.000000,0.000896,0.001216,0.000498,0.002931,0.000000,0.001113,-5.979000
428930,41,11351,0.001864,41-11351,600.30000,1.000500,0.000194,1.000479,-0.102242,-0.335757,600.28180,1.000470,0.000254,1.000469,0.128287,-0.210395,-1.884784e-04,0.001252,-3.146550e-07,0.000051,0.0,,,-0.000210,0.002172,-3.510817e-07,0.000089,0.0,,,0.047055,0.000078,0.000048,0.000073,0.584539,0.803946,0.136816,0.000228,9.300933e-06,0.000228,594.889339,24.430163,0.136676,0.000228,3.183415e-08,0.000228,2.706872,-1.908859,-0.136652,-0.000228,5.952166e-08,-0.000228,-1.982151,0.133582,16360223,27267.038333,3021.952883,27049.5,-0.017006,0.194480,3003171,5005.285000,3831.373475,3972.0,-0.047303,0.852849,150.07831,1.000522,0.000111,1.000487,-0.003667,-0.106204,150.07579,1.000505,0.000171,1.000411,-1.029364,0.369141,0.000309,0.000536,0.000002,0.000044,0.000000,10.206429,-0.585830,0.000271,0.000930,1.809912e-06,0.000076,0.0,18.780652,0.150879,0.012084,0.000081,0.000027,0.000074,2.010435,0.924002,0.034148,0.000228,8.138696e-08,0.000228,-1.389327,-0.730384,0.034171,0.000228,9.634912e-09,0.000228,32.535455,-5.877031,-0.034160,-0.000228,5.692277e-08,-0.000228,-1.584843,-0.644299,4212732,28084.880000,2638.984259,28636.5,0.095796,-0.522562,442000,2946.666667,2254.018329,2656.0,1.244195,1.099054,300.14554,1.000485,0.000178,1.000487,0.082977,-0.864219,300.13773,1.000459,0.000241,1.000412,-0.147260,-0.527192,-0.000110,0.000897,-3.665666e-07,0.000052,0.0,12.689356,-1.183722,-0.000189,0.001603,-6.291133e-07,...,0.743180,0.000864,42.0,1592.547619,621.0,2131.626188,66887.0,-0.122161,1.190632,6.404762,5.0,5.468578,269.0,-0.700958,0.750111,0.001093,64.0,1504.265625,621.0,1988.283109,96273.0,0.289861,1.304168,6.828125,5.0,5.722567,437.0,-0.604144,0.732743,0.002252,0.001799,0.020220,0.000304,0.001681,0.002925,0.002118,0.023693,0.000322,0.002292,0.001051,0.000827,0.008286,0.000051,0.000824,0.001364,0.000978,0.008742,0.000012,0.001122,0.001520,0.001175,0.012973,0.000132,0.001173,0.001978,0.001370,0.013610,0.000035,0.001599,0.001895,0.001479,0.015995,0.000190,0.001444,0.002468,0.001731,0.018022,0.
000285,0.001968,0.001919,0.001580,0.017448,0.000223,0.001423,0.000900,0.000737,0.007570,0.000000,0.000698,0.001301,0.001043,0.012015,0.000000,0.000995,0.001623,0.001306,0.013876,0.000000,0.001220,0.002390,0.001159,0.006707,0.000825,0.002102,0.003412,0.001626,0.009134,0.000956,0.002970,0.001214,0.000648,0.003261,0.000400,0.001035,0.001728,0.000844,0.004467,0.000439,0.001528,0.001701,0.000877,0.005591,0.000577,0.001453,0.002417,0.001213,0.006826,0.000653,0.002030,0.002083,0.001053,0.006372,0.000717,0.001765,0.002958,0.001462,0.008596,0.000834,0.002470,0.001623,0.000693,0.004710,0.000694,0.001442,0.000828,0.000416,0.002878,0.000000,0.000747,0.001173,0.000534,0.003743,0.000489,0.001038,0.001426,0.000638,0.004545,0.000618,0.001287,-6.284911


In [6]:
# Read the baseline CSV and join its columns onto the current `train` frame.
# Rows are matched on (time_id, stock_id, target); with how="inner" only rows
# whose key appears in both frames are kept.
# NOTE(review): `target` is displayed as a float, so matching on it relies on
# both CSVs parsing to exactly equal values -- confirm, or consider joining on
# the two id columns only.
# NOTE(review): this cell rebinds `train`; re-running it without re-running the
# cells above merges the same columns a second time (pandas then disambiguates
# the overlapping names with its default _x/_y suffixes).
train_ = pd.read_csv("../baseline/data/baseline_train.csv")
_rows_before_merge = len(train)
# validate="one_to_one" makes pandas raise MergeError when either side holds
# duplicate merge keys, instead of silently multiplying rows.
train = train.merge(
    train_,
    on=["time_id", "stock_id", "target"],
    how="inner",
    validate="one_to_one",
)
# An inner join discards unmatched rows without any message; surface it here.
if len(train) != _rows_before_merge:
    print(f"merge with baseline_train.csv kept {len(train)} of {_rows_before_merge} rows")
train

Unnamed: 0,stock_id,time_id,target,row_id,wap1_sum,wap1_mean,wap1_std,wap1_median,wap1_kurtosis,wap1_skew,wap2_sum,wap2_mean,wap2_std,wap2_median,wap2_kurtosis,wap2_skew,log_return1_sum,log_return1_realized_volatility,log_return1_mean,log_return1_std,log_return1_median,log_return1_kurtosis,log_return1_skew,log_return2_sum,log_return2_realized_volatility,log_return2_mean,log_return2_std,log_return2_median,log_return2_kurtosis,log_return2_skew,wap_balance_sum,wap_balance_mean,wap_balance_std,wap_balance_median,wap_balance_kurtosis,wap_balance_skew,price_spread_sum,price_spread_mean,price_spread_std,price_spread_median,price_spread_kurtosis,price_spread_skew,bid_spread_sum,bid_spread_mean,bid_spread_std,bid_spread_median,bid_spread_kurtosis,bid_spread_skew,ask_spread_sum,ask_spread_mean,ask_spread_std,ask_spread_median,ask_spread_kurtosis,ask_spread_skew,total_volume_sum,total_volume_mean,total_volume_std,total_volume_median,total_volume_kurtosis,total_volume_skew,volume_imbalance_sum,volume_imbalance_mean,volume_imbalance_std,volume_imbalance_median,volume_imbalance_kurtosis,volume_imbalance_skew,wap1_sum_450,wap1_mean_450,wap1_std_450,wap1_median_450,wap1_kurtosis_450,wap1_skew_450,wap2_sum_450,wap2_mean_450,wap2_std_450,wap2_median_450,wap2_kurtosis_450,wap2_skew_450,log_return1_sum_450,log_return1_realized_volatility_450,log_return1_mean_450,log_return1_std_450,log_return1_median_450,log_return1_kurtosis_450,log_return1_skew_450,log_return2_sum_450,log_return2_realized_volatility_450,log_return2_mean_450,log_return2_std_450,log_return2_median_450,log_return2_kurtosis_450,log_return2_skew_450,wap_balance_sum_450,wap_balance_mean_450,wap_balance_std_450,wap_balance_median_450,wap_balance_kurtosis_450,wap_balance_skew_450,price_spread_sum_450,price_spread_mean_450,price_spread_std_450,price_spread_median_450,price_spread_kurtosis_450,price_spread_skew_450,bid_spread_sum_450,bid_spread_mean_450,bid_spread_std_450,bid_spread_median_450,bid_spread_kurtosis_450,bid_spread
_skew_450,ask_spread_sum_450,ask_spread_mean_450,ask_spread_std_450,ask_spread_median_450,ask_spread_kurtosis_450,ask_spread_skew_450,total_volume_sum_450,total_volume_mean_450,total_volume_std_450,total_volume_median_450,total_volume_kurtosis_450,total_volume_skew_450,volume_imbalance_sum_450,volume_imbalance_mean_450,volume_imbalance_std_450,volume_imbalance_median_450,volume_imbalance_kurtosis_450,volume_imbalance_skew_450,wap1_sum_300,wap1_mean_300,wap1_std_300,wap1_median_300,wap1_kurtosis_300,wap1_skew_300,wap2_sum_300,wap2_mean_300,wap2_std_300,wap2_median_300,wap2_kurtosis_300,wap2_skew_300,log_return1_sum_300,log_return1_realized_volatility_300,log_return1_mean_300,log_return1_std_300,log_return1_median_300,log_return1_kurtosis_300,log_return1_skew_300,log_return2_sum_300,log_return2_realized_volatility_300,log_return2_mean_300,...,waproll_std5_down50_skew,waproll_std5_down50_autocorr,waproll_std5_down50_median,waproll_std10_down50_mean,waproll_std10_down50_std,waproll_std10_down50_skew,waproll_std10_down50_autocorr,waproll_std10_down50_median,wapcandlef1_down50,wapcandlef2_down50,wapcandlef3_down50,wapcandlef41_down50,wapcandlef42_down50,up25num,waproll_std5_up25_mean,waproll_std5_up25_std,waproll_std5_up25_skew,waproll_std5_up25_autocorr,waproll_std5_up25_median,waproll_std10_up25_mean,waproll_std10_up25_std,waproll_std10_up25_skew,waproll_std10_up25_autocorr,waproll_std10_up25_median,wapcandlef1_up25,wapcandlef2_up25,wapcandlef3_up25,wapcandlef41_up25,wapcandlef42_up25,down25num,waproll_std5_down25_mean,waproll_std5_down25_std,waproll_std5_down25_skew,waproll_std5_down25_autocorr,waproll_std5_down25_median,waproll_std10_down25_mean,waproll_std10_down25_std,waproll_std10_down25_skew,waproll_std10_down25_autocorr,waproll_std10_down25_median,wapcandlef1_down25,wapcandlef2_down25,wapcandlef3_down25,wapcandlef41_down25,wapcandlef42_down25,up75num,waproll_std5_up75_mean,waproll_std5_up75_std,waproll_std5_up75_skew,waproll_std5_up75_autocorr,waproll_std5_up75_m
edian,waproll_std10_up75_mean,waproll_std10_up75_std,waproll_std10_up75_skew,waproll_std10_up75_autocorr,waproll_std10_up75_median,wapcandlef1_up75,wapcandlef2_up75,wapcandlef3_up75,wapcandlef41_up75,wapcandlef42_up75,down75num,waproll_std5_down75_mean,waproll_std5_down75_std,waproll_std5_down75_skew,waproll_std5_down75_autocorr,waproll_std5_down75_median,waproll_std10_down75_mean,waproll_std10_down75_std,waproll_std10_down75_skew,waproll_std10_down75_autocorr,waproll_std10_down75_median,wapcandlef1_down75,wapcandlef2_down75,wapcandlef3_down75,wapcandlef41_down75,wapcandlef42_down75,book_wap1_lambda_,book_wap2_lambda_,book_wap_mean_lambda_,book_wap_diff_lambda_,book_price_spread_lambda_,book_bid_spread_lambda_,book_ask_spread_lambda_,book_total_volume_lambda_,book_volume_imbalance_lambda_,pricesum,pricemean,pricestd,pricemax,pricemin,pricemedian,sizesum,sizemean,sizestd,sizemax,sizemin,sizemedian,order_countsum,order_countmean,order_countstd,order_countmax,order_countmin,order_countmedian,seconds_in_bucketsum,seconds_in_bucketmean,seconds_in_bucketstd,seconds_in_bucketmax,seconds_in_bucketmin,seconds_in_bucketmedian,__book_wap1_lambda_____mean___time,__book_wap1_lambda_____std___time,__book_wap1_lambda_____max___time,__book_wap1_lambda_____min___time,__book_wap1_lambda_____median___time,__book_wap2_lambda_____mean___time,__book_wap2_lambda_____std___time,__book_wap2_lambda_____max___time,__book_wap2_lambda_____min___time,__book_wap2_lambda_____median___time,__book_wap_mean_lambda_____mean___time,__book_wap_mean_lambda_____std___time,__book_wap_mean_lambda_____max___time,__book_wap_mean_lambda_____min___time,__book_wap_mean_lambda_____median___time,__book_wap_diff_lambda_____mean___time,__book_wap_diff_lambda_____std___time,__book_wap_diff_lambda_____max___time,__book_wap_diff_lambda_____min___time,__book_wap_diff_lambda_____median___time,__book_wap1_lambda_____mean___stock,__book_wap1_lambda_____std___stock,__book_wap1_lambda_____max___stock,__book_wap1_lambda_____m
in___stock,__book_wap1_lambda_____median___stock,__book_wap2_lambda_____mean___stock,__book_wap2_lambda_____std___stock,__book_wap2_lambda_____max___stock,__book_wap2_lambda_____min___stock,__book_wap2_lambda_____median___stock,__book_wap_mean_lambda_____mean___stock,__book_wap_mean_lambda_____std___stock,__book_wap_mean_lambda_____max___stock,__book_wap_mean_lambda_____min___stock,__book_wap_mean_lambda_____median___stock,__book_wap_diff_lambda_____mean___stock,__book_wap_diff_lambda_____std___stock,__book_wap_diff_lambda_____max___stock,__book_wap_diff_lambda_____min___stock,__book_wap_diff_lambda_____median___stock
0,16,9787,0.005983,16-9787,600.47920,1.000799,0.001474,1.001224,-0.717402,-0.603572,600.47980,1.000800,0.001451,1.000853,-0.882724,-0.349390,3.412304e-03,0.007143,5.696667e-06,0.000292,0.0,,,0.002679,0.009541,4.473089e-06,0.000390,0.0,,,0.301854,0.000503,0.000389,0.000380,2.062880,1.293203,0.766263,0.001277,3.961763e-04,0.001222,0.925953,0.845613,0.206112,0.000344,3.413202e-04,0.000102,1.441881,1.509628,-0.208047,-0.000347,2.339496e-04,-0.000306,-0.156370,-0.820018,205938,343.230000,125.163414,343.5,0.607534,0.543676,50934,84.890000,80.327489,61.0,3.835718,1.729536,150.23227,1.001548,0.000609,1.001588,-0.847361,-0.444916,150.22621,1.001508,0.000777,1.001582,-0.894796,-0.411312,-0.000668,0.002511,-0.000004,0.000206,0.000000,6.436289,-0.281597,-0.001603,0.004331,-1.068959e-05,0.000355,0.0,4.667474,-0.290491,0.059297,0.000395,0.000262,0.000321,0.243205,0.865057,0.157611,0.001051,2.933580e-04,0.001019,0.132544,0.568622,0.042936,0.000286,3.438091e-04,0.000102,5.126406,2.409755,-0.061496,-0.000410,2.819893e-04,-0.000408,-0.649802,-0.717176,54328,362.186667,101.039589,376.5,0.302431,0.010579,13944,92.960000,80.218149,68.0,1.277626,1.202210,300.06528,1.000218,0.001532,1.000459,-1.268572,-0.211921,300.09310,1.000310,0.001450,1.000318,-1.165923,-0.071340,0.001536,0.004749,5.118334e-06,0.000275,0.0,11.945170,0.890162,0.001796,0.007158,5.988251e-06,...,1.090891,0.787598,0.000306,0.000527,0.000355,1.107211,0.938689,0.000441,4.795566e-07,0.074111,6.051118e+03,5.691554e-05,0.000262,77,0.000441,0.000235,0.440734,0.700955,0.000457,0.000623,0.000243,0.339423,0.900524,0.000596,3.352422e-07,0.053203,-3552.636102,6.565865e-06,0.000318,232,0.000318,0.000231,0.724409,0.745321,0.000276,0.000441,0.000226,0.822536,0.921730,0.000414,2.473907e-07,0.057226,1.144385e+04,3.390126e-05,0.000238,231,0.000276,0.000212,1.267157,0.776278,0.000214,0.000374,0.000200,0.588718,0.912240,0.000351,1.518477e-07,0.072685,1.751099e+04,1.321468e-05,0.000246,78,0.000525,0.000377,0.676063,0.762281,0.000421,0.000756
,0.000395,0.382616,0.904799,0.000669,1.349312e-06,0.117475,2296.125644,0.000044,0.000367,0.007143,0.009541,0.006242,8.486556,4.444938,15.924421,0.0,5.941818,6.143118,43.040848,1.000950,0.001069,1.002907,0.998725,1.000969,4898.0,113.906977,117.795386,526.0,1.0,100.0,100.0,2.325581,1.873638,9.0,1.0,2.0,13638.0,317.162791,195.783764,589.0,7.0,288.0,0.006039,0.002132,0.013142,0.002440,0.005639,0.008308,0.003377,0.017820,0.002770,0.007545,0.005771,0.001884,0.010974,0.002643,0.005640,,,,5.666140,18.080760,0.004612,0.003989,0.054206,0.000541,0.003416,0.006776,0.005683,0.094116,0.000949,0.005156,0.004312,0.003476,0.052871,0.000639,0.003271,,,,1.764698,9.811453
1,105,5773,0.002415,105-5773,600.64197,1.001070,0.000766,1.000880,-1.233713,0.323047,600.63720,1.001062,0.000767,1.000869,-1.133407,0.331394,9.610265e-04,0.002404,1.604385e-06,0.000098,0.0,,,0.000862,0.002987,1.439038e-06,0.000122,0.0,,,0.037653,0.000063,0.000045,0.000059,0.576712,0.846452,0.136220,0.000227,2.992114e-05,0.000223,49.560348,7.180402,0.133913,0.000223,4.916321e-08,0.000223,-0.370451,1.242778,-0.133915,-0.000223,5.276032e-08,-0.000223,-0.886907,-1.054903,1345594,2242.656667,355.292645,2261.5,0.475379,0.001115,249858,416.430000,301.443309,397.5,-0.322840,0.590491,150.27628,1.001842,0.000232,1.001783,-0.031354,0.303419,150.26897,1.001793,0.000239,1.001701,0.372317,0.801643,-0.001076,0.000935,-0.000007,0.000076,0.000000,5.587417,-0.690410,-0.001014,0.000984,-6.759636e-06,0.000080,0.0,6.698305,-0.836391,0.009523,0.000063,0.000037,0.000064,0.125605,0.552536,0.034974,0.000233,4.717714e-05,0.000223,16.477516,4.298544,0.033477,0.000223,4.723490e-08,0.000223,0.411674,1.552891,-0.033479,-0.000223,5.370415e-08,-0.000223,-1.039938,-0.979762,365155,2434.366667,331.188817,2402.5,0.790279,0.705171,94345,628.966667,315.955596,658.5,-0.750892,0.054617,300.50732,1.001691,0.000554,1.001777,-0.402539,-0.638434,300.50260,1.001675,0.000565,1.001686,-0.251925,-0.564191,0.000965,0.001549,3.217323e-06,0.000090,0.0,4.172035,0.061218,0.001028,0.002124,3.428133e-06,...,0.978272,0.718039,0.000100,0.000149,0.000066,1.192673,0.907496,0.000135,2.366598e-08,0.062335,3.580261e+04,4.035783e-06,0.000085,130,0.000161,0.000105,0.877035,0.743587,0.000140,0.000220,0.000112,1.446555,0.922497,0.000193,3.071080e-08,0.063002,21524.217800,6.684870e-06,0.000120,388,0.000093,0.000059,0.859082,0.749616,0.000092,0.000128,0.000059,0.735473,0.916467,0.000120,1.469930e-08,0.043118,4.113833e+04,5.184425e-07,0.000077,388,0.000095,0.000058,0.441294,0.743236,0.000098,0.000132,0.000057,0.359208,0.899577,0.000127,1.256197e-08,0.033007,4.741062e+04,-6.172710e-07,0.000077,130,0.000152,0.000087,0.770579,0.708650,
0.000133,0.000219,0.000093,1.055737,0.924620,0.000195,5.284416e-08,0.097997,14199.928379,0.000009,0.000107,0.002404,0.002987,0.002579,14.923135,2.298935,0.004032,0.0,3.078708,8.924933,89.096634,1.001086,0.000765,1.002567,0.999888,1.000836,16477.0,185.134831,159.747613,700.0,1.0,101.0,225.0,2.528090,2.062048,13.0,1.0,2.0,26121.0,293.494382,159.711539,586.0,0.0,285.0,0.003812,0.001515,0.008950,0.001842,0.003445,0.005569,0.002612,0.015949,0.002197,0.004947,0.003853,0.001433,0.009198,0.001987,0.003581,,,,2.024708,18.353987,0.002903,0.002619,0.046933,0.000416,0.002131,0.003796,0.003375,0.062174,0.000605,0.002765,0.003004,0.002463,0.037666,0.000510,0.002254,,,,0.000000,13.445859
2,58,22076,0.002863,58-22076,598.30756,0.997179,0.000907,0.996946,-0.797297,0.444533,598.41360,0.997356,0.000832,0.997271,-0.877343,0.045016,-2.216200e-03,0.002623,-3.699834e-06,0.000107,0.0,,,-0.002213,0.004488,-3.694307e-06,0.000183,0.0,,,0.214987,0.000358,0.000263,0.000281,0.932617,0.957359,0.429021,0.000715,2.510883e-04,0.000681,0.978536,1.128808,0.078867,0.000131,8.000458e-05,0.000097,4.615472,2.372039,-0.202357,-0.000337,2.384041e-04,-0.000291,-0.752067,-0.602195,276551,460.918333,185.923068,430.0,2.135823,0.947047,81439,135.731667,144.914780,95.0,4.092933,1.846135,149.43927,0.996262,0.000364,0.996238,-0.036891,0.196912,149.47705,0.996514,0.000483,0.996605,0.226860,-0.331357,-0.000479,0.001350,-0.000003,0.000111,0.000000,10.684832,-0.017438,-0.000676,0.003176,-4.509830e-06,0.000260,0.0,12.436074,0.252570,0.052095,0.000347,0.000276,0.000237,3.080923,1.566382,0.094242,0.000628,2.469873e-04,0.000584,3.201331,1.523856,0.018627,0.000124,5.852864e-05,0.000097,5.625292,2.365393,-0.073240,-0.000488,2.536689e-04,-0.000582,-1.024049,-0.196268,73626,490.840000,140.650220,508.0,-0.752033,-0.029702,25184,167.893333,155.208937,96.0,-0.640518,0.707922,298.93270,0.996442,0.000369,0.996369,-0.500712,-0.288098,299.01505,0.996717,0.000500,0.996605,0.224923,-0.131212,-0.001064,0.001750,-3.547048e-06,0.000101,0.0,12.111864,0.213879,-0.001163,0.003562,-3.876705e-06,...,0.236003,0.768291,0.000193,0.000256,0.000101,-0.504972,0.923206,0.000266,3.122869e-07,-0.210979,-9.315311e+03,-5.735157e-05,0.000178,45,0.000207,0.000156,1.303906,0.652972,0.000151,0.000328,0.000139,0.176244,0.859653,0.000302,1.575617e-07,-0.426395,-20931.000000,-6.052526e-05,0.000158,133,0.000173,0.000107,0.186547,0.757026,0.000173,0.000231,0.000092,-0.230092,0.896278,0.000236,1.804813e-07,-0.121557,-1.930099e+04,-2.954053e-05,0.000132,133,0.000157,0.000094,0.232056,0.795469,0.000156,0.000203,0.000078,-0.043437,0.903233,0.000206,1.065285e-07,-0.125007,-3.306620e+04,-1.110722e-05,0.000119,45,0.000251,0.000182,0.33126
9,0.815529,0.000246,0.000365,0.000182,-0.417606,0.928878,0.000396,9.437716e-07,-0.319008,-2609.535333,-0.000111,0.000215,0.002623,0.004488,0.002635,8.961113,4.256296,5.646941,0.0,4.204509,10.495756,21.933313,0.996969,0.000757,0.998399,0.996168,0.996749,3643.0,165.590909,162.155322,653.0,2.0,113.5,88.0,4.000000,2.927700,10.0,1.0,4.0,8105.0,368.409091,177.985997,565.0,31.0,418.0,0.002035,0.001872,0.018706,0.000503,0.001735,0.002879,0.002309,0.020866,0.000553,0.002457,0.001923,0.001343,0.012610,0.000496,0.001674,,,,3.599783,11.103788,0.004224,0.003572,0.041124,0.000373,0.003158,0.006102,0.005002,0.067929,0.000493,0.004704,0.004020,0.003281,0.040993,0.000358,0.003100,,,,2.099306,12.351617
3,77,5817,0.005279,77-5817,601.05817,1.001764,0.002921,1.001746,-0.907996,-0.267860,601.09640,1.001827,0.002950,1.001847,-0.921080,-0.240119,3.857260e-03,0.006993,6.439499e-06,0.000286,0.0,,,0.003651,0.009757,6.094700e-06,0.000399,0.0,,,0.126732,0.000211,0.000145,0.000183,-0.508057,0.594553,0.243257,0.000405,9.510022e-05,0.000380,10.070632,3.473891,0.228444,0.000381,3.469868e-08,0.000381,3.432172,-2.187528,-0.228436,-0.000381,4.818484e-08,-0.000381,-0.308955,1.244469,2227382,3712.303333,960.696486,3510.5,3.223581,1.391724,503860,839.766667,738.489271,700.0,4.493070,1.811369,150.06807,1.000454,0.000727,1.000512,0.089949,-0.548133,150.06671,1.000445,0.000898,1.000448,-0.049675,-0.487789,0.000180,0.003105,0.000001,0.000254,0.000006,4.411888,-0.860237,-0.000076,0.005661,-5.054132e-07,0.000464,0.0,1.853950,-0.298721,0.035303,0.000235,0.000157,0.000186,-0.923424,0.510255,0.060510,0.000403,9.066640e-05,0.000381,11.730264,3.705408,0.057111,0.000381,3.302441e-08,0.000381,4.560014,-2.422400,-0.057109,-0.000381,5.061392e-08,-0.000381,-0.710823,1.092016,560983,3739.886667,798.023267,3700.0,-0.422332,0.374290,104961,699.740000,589.194108,500.0,2.990411,1.511708,300.67102,1.002237,0.002305,1.001224,-1.239833,0.507073,300.66970,1.002232,0.002362,1.001224,-1.138022,0.449436,-0.005484,0.005275,-1.827947e-05,0.000305,0.0,6.844016,-1.428839,-0.005791,0.007743,-1.930346e-05,...,1.714312,0.814050,0.000243,0.000436,0.000259,1.422666,0.931932,0.000376,4.594015e-08,0.053487,-7.404578e+04,1.962889e-05,0.000255,146,0.000419,0.000313,1.479319,0.839796,0.000365,0.000631,0.000435,1.452453,0.961701,0.000505,4.761360e-08,0.078676,-86535.391565,2.562365e-05,0.000306,436,0.000262,0.000191,2.002234,0.771754,0.000212,0.000365,0.000208,1.485866,0.935352,0.000316,2.692755e-08,0.041859,-1.263069e+05,8.692961e-06,0.000218,436,0.000263,0.000159,0.607767,0.746940,0.000226,0.000375,0.000170,0.511911,0.930447,0.000353,2.072071e-08,0.040333,-1.973740e+05,3.034289e-06,0.000208,146,0.000416,0.000311,1.421296,0.
792886,0.000354,0.000608,0.000315,1.056948,0.909105,0.000583,1.012976e-07,0.077543,-41170.878226,0.000035,0.000343,0.006993,0.009757,0.008035,10.073180,5.545836,0.002083,0.0,5.180952,12.259069,201.324570,1.001615,0.002840,1.006663,0.996002,1.001332,131051.0,651.995025,965.292513,10589.0,50.0,344.0,877.0,4.363184,5.564390,60.0,1.0,3.0,63296.0,314.905473,178.358392,596.0,2.0,325.0,0.009777,0.004200,0.024979,0.003298,0.008878,0.013158,0.006552,0.038566,0.003549,0.011594,0.009269,0.003716,0.021429,0.003390,0.008426,,,,5.592280,15.498549,0.003366,0.002558,0.035552,0.000700,0.002649,0.004712,0.003120,0.042910,0.001081,0.003910,0.003872,0.002671,0.036644,0.000849,0.003146,,,,0.921629,13.606591
4,56,14572,0.002328,56-14572,598.78840,0.997981,0.000927,0.997882,-0.857376,0.054103,598.76544,0.997942,0.000961,0.997819,-1.026107,0.042450,-1.671476e-03,0.002564,-2.790444e-06,0.000105,0.0,,,-0.001691,0.003622,-2.823096e-06,0.000148,0.0,,,0.074003,0.000123,0.000095,0.000108,0.736676,0.928654,0.166596,0.000278,8.049258e-05,0.000261,1.190128,0.916931,0.042784,0.000071,6.605039e-05,0.000043,2.095133,1.583203,-0.048897,-0.000081,6.813075e-05,-0.000065,1.772496,-1.348820,201007,335.011667,156.600216,321.0,4.624120,1.524437,72007,120.011667,94.411798,99.0,1.640380,1.094121,149.60847,0.997390,0.000361,0.997394,-0.748833,0.079546,149.59203,0.997280,0.000412,0.997257,-0.802039,0.046661,0.001371,0.001495,0.000009,0.000122,0.000000,4.755705,-0.607413,0.001544,0.002001,1.029398e-05,0.000164,0.0,3.500741,-0.087984,0.022062,0.000147,0.000112,0.000138,0.666570,0.927687,0.043701,0.000291,9.093613e-05,0.000282,0.895255,0.809980,0.018575,0.000124,8.508687e-05,0.000087,-0.565675,0.616885,-0.009558,-0.000064,6.090475e-05,-0.000043,4.533438,-1.915580,48883,325.886667,116.885967,321.0,-0.915541,0.050118,14875,99.166667,81.427731,96.5,2.685287,1.385483,299.17014,0.997234,0.000510,0.997321,-0.380009,-0.402873,299.14703,0.997157,0.000513,0.997187,-0.593481,-0.266779,0.000498,0.002086,1.661003e-06,0.000121,0.0,3.145998,-0.198122,0.000439,0.003080,1.461875e-06,...,0.576553,0.802864,0.000106,0.000167,0.000089,0.564880,0.936756,0.000156,2.232058e-07,-0.066930,1.645353e+03,-3.147134e-06,0.000099,118,0.000149,0.000112,1.409285,0.703402,0.000120,0.000210,0.000119,1.023467,0.928699,0.000165,1.257623e-07,-0.138563,-3927.279809,-9.281995e-06,0.000098,355,0.000103,0.000057,0.514799,0.756140,0.000096,0.000141,0.000062,0.743057,0.922096,0.000133,1.190931e-07,-0.055600,1.190859e+03,2.452705e-06,0.000084,354,0.000096,0.000063,1.499223,0.789606,0.000083,0.000137,0.000078,1.745198,0.944740,0.000119,7.430125e-08,-0.060964,1.838526e+03,-2.276821e-06,0.000070,119,0.000147,0.000121,1.276071,0.788199,0.000119,
0.000205,0.000125,0.552118,0.943062,0.000188,5.857255e-07,-0.118810,796.023375,-0.000010,0.000122,0.002564,0.003622,0.002514,19.371048,6.650390,17.818066,0.0,9.533835,11.982359,153.646930,0.997707,0.000892,0.999762,0.996034,0.997491,15685.0,101.850649,127.310068,915.0,1.0,99.0,490.0,3.181818,4.884890,55.0,1.0,2.0,51555.0,334.772727,162.386714,595.0,5.0,362.0,0.001889,0.000964,0.006077,0.000576,0.001648,0.002897,0.001591,0.008706,0.000714,0.002395,0.001985,0.000951,0.005242,0.000591,0.001709,,,,0.800570,11.673630,0.004845,0.002790,0.030041,0.000988,0.004028,0.006085,0.003376,0.037915,0.001577,0.005096,0.004412,0.002564,0.026125,0.001012,0.003628,,,,5.596212,23.238896
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
428927,76,21439,0.002647,76-21439,600.85600,1.001427,0.000982,1.001238,-0.258683,0.731784,600.83440,1.001391,0.000968,1.001338,-0.213067,0.673776,2.942843e-03,0.003456,4.912926e-06,0.000141,0.0,,,0.003319,0.004683,5.540259e-06,0.000191,0.0,,,0.097441,0.000162,0.000117,0.000146,0.169890,0.773545,0.213385,0.000356,1.394403e-04,0.000345,2.980784,1.457641,0.104993,0.000175,1.198182e-04,0.000148,0.169257,0.922909,-0.122059,-0.000203,1.454425e-04,-0.000198,0.189370,-0.909727,319671,532.785000,188.145076,501.0,0.121759,0.594470,108369,180.615000,120.773592,169.0,0.790040,0.794638,150.42587,1.002839,0.000632,1.002918,-0.722024,-0.636665,150.41370,1.002758,0.000646,1.002840,-0.753161,-0.656653,0.001639,0.001829,0.000011,0.000149,0.000000,5.145311,0.106764,0.001876,0.002308,1.250727e-05,0.000189,0.0,7.812954,0.849945,0.022604,0.000151,0.000116,0.000123,0.427302,0.968552,0.054624,0.000364,1.195822e-04,0.000345,1.063059,0.839058,0.028350,0.000189,1.403048e-04,0.000148,-0.196668,0.828519,-0.024490,-0.000163,1.056552e-04,-0.000198,0.918211,-0.899916,96118,640.786667,204.102277,600.0,-0.581358,0.515835,29646,197.640000,141.300018,171.0,0.224662,0.776403,300.64368,1.002146,0.000847,1.001750,-1.233605,0.413047,300.62393,1.002080,0.000841,1.001654,-1.212862,0.410087,0.002298,0.002261,7.660316e-06,0.000131,0.0,5.582712,0.031058,0.002537,0.002880,8.455152e-06,...,1.509122,0.780793,0.000116,0.000173,0.000105,2.282476,0.947109,0.000143,1.004936e-07,0.102450,3.347717e+04,1.982147e-05,0.000129,117,0.000167,0.000099,0.808238,0.713716,0.000145,0.000226,0.000091,0.600493,0.904100,0.000221,6.467012e-08,0.209131,50846.878783,3.395267e-05,0.000136,350,0.000127,0.000079,1.572223,0.794416,0.000114,0.000160,0.000078,1.583178,0.939398,0.000136,5.740811e-08,0.075858,5.851070e+04,1.455145e-05,0.000118,350,0.000132,0.000070,0.651836,0.738617,0.000125,0.000167,0.000070,1.004658,0.923165,0.000152,3.746451e-08,0.078408,9.714658e+04,1.613851e-05,0.000115,117,0.000153,0.000132,2.831952,0.728751,0.000114,0.0
00212,0.000164,2.151077,0.940478,0.000151,2.236709e-07,0.223133,14782.543592,0.000040,0.000142,0.003456,0.004683,0.003308,14.947007,9.293586,14.569200,0.0,6.515039,15.301167,68.122440,1.001801,0.001040,1.003610,0.999852,1.001385,7816.0,114.941176,125.278065,540.0,1.0,100.0,171.0,2.514706,2.018516,10.0,1.0,2.0,24562.0,361.205882,173.693121,599.0,14.0,382.5,0.002818,0.001335,0.007531,0.000284,0.002492,0.004039,0.002142,0.011330,0.000068,0.003553,0.002848,0.001302,0.007653,0.000148,0.002571,,,,0.672716,17.016576,0.004540,0.003100,0.038771,0.000880,0.003643,0.005778,0.003884,0.055342,0.001048,0.004723,0.004077,0.002744,0.037967,0.000780,0.003275,,,,5.147635,22.639032
428928,108,16733,0.001089,108-16733,599.87500,0.999792,0.000372,0.999724,-1.149882,-0.009472,599.80200,0.999670,0.000471,0.999634,-0.811869,0.019223,-1.170027e-03,0.001024,-1.953301e-06,0.000042,0.0,,,-0.001522,0.001667,-2.540422e-06,0.000068,0.0,,,0.098845,0.000165,0.000118,0.000126,-1.116643,0.458715,0.244101,0.000407,1.585902e-07,0.000407,-0.943112,-0.045696,0.244052,0.000407,2.316365e-08,0.000407,0.631420,1.622014,-0.244045,-0.000407,0.000000e+00,-0.000407,-3.000000,0.000000,14477849,24129.748333,2932.225114,23654.0,-0.028096,0.433493,2080539,3467.565000,2420.802655,3165.5,0.448897,0.781153,149.93121,0.999541,0.000154,0.999547,-0.124166,-0.734934,149.92207,0.999481,0.000248,0.999576,0.920982,-1.688973,-0.000289,0.000406,-0.000002,0.000033,0.000000,11.326935,-1.186579,-0.000653,0.000614,-4.350038e-06,0.000050,0.0,141.634582,-11.914139,0.017084,0.000114,0.000105,0.000086,1.017301,1.487177,0.061040,0.000407,6.290679e-08,0.000407,0.977114,1.725171,0.061013,0.000407,2.263804e-08,0.000407,0.978790,1.725900,-0.061011,-0.000407,0.000000e+00,-0.000407,-3.000000,0.000000,3705074,24700.493333,1749.543725,24668.5,-0.885320,-0.045490,593902,3959.346667,1983.670031,3574.0,-0.737909,0.258339,299.85287,0.999510,0.000253,0.999528,0.158565,0.744103,299.81332,0.999378,0.000357,0.999572,-1.226197,0.009576,-0.000916,0.000812,-3.054283e-06,0.000047,0.0,54.435214,-4.249926,-0.001098,0.001236,-3.660867e-06,...,2.212761,0.816544,0.000026,0.000060,0.000057,1.962641,0.948402,0.000041,6.837199e-10,-0.192109,-2.018644e+06,-5.900947e-06,0.000029,111,0.000049,0.000080,1.799629,0.791116,0.000009,0.000083,0.000093,0.811167,0.936012,0.000024,1.018778e-09,-0.159516,-6830.699859,-2.763424e-06,0.000028,332,0.000032,0.000034,2.108411,0.782123,0.000020,0.000049,0.000041,1.607976,0.933640,0.000038,4.461562e-10,-0.155669,-3.010693e+06,-3.628469e-06,0.000022,332,0.000031,0.000045,3.118680,0.776416,0.000016,0.000050,0.000057,1.885350,0.930587,0.000027,3.850483e-10,-0.172884,-3.488144e+06,-2.568895e-06,0.
000021,111,0.000052,0.000098,3.730325,0.799215,0.000019,0.000085,0.000124,2.529222,0.932008,0.000036,1.445554e-09,-0.263158,-782938.944806,-0.000009,0.000035,0.001024,0.001667,0.001271,7.444752,0.001077,0.000254,0.0,0.964175,9.533051,13.996746,0.999768,0.000297,1.000203,0.999390,0.999797,17721.0,1265.785714,1499.487665,3921.0,7.0,448.0,109.0,7.785714,5.191392,15.0,1.0,9.0,4755.0,339.642857,171.139443,574.0,8.0,335.0,0.001949,0.001015,0.007754,0.000115,0.001798,0.002858,0.001561,0.010666,0.000008,0.002547,0.002000,0.000985,0.007375,0.000057,0.001835,,,,0.000000,12.609031,0.003337,0.002546,0.035924,0.000369,0.002642,0.004335,0.003075,0.038709,0.000376,0.003548,0.003629,0.002615,0.034763,0.000405,0.002935,,,,0.000000,12.628781
428929,37,14273,0.002531,37-14273,601.11096,1.001852,0.000367,1.001833,0.624756,1.055845,601.35460,1.002258,0.000556,1.002294,-0.976299,-0.146546,-1.316365e-03,0.002124,-2.197604e-06,0.000087,0.0,,,0.000596,0.005234,9.953217e-07,0.000214,0.0,,,0.404903,0.000675,0.000359,0.000584,-0.233344,0.428476,0.765416,0.001276,3.093680e-04,0.001303,-1.447699,-0.091916,0.093891,0.000156,1.623810e-04,0.000030,-1.662358,0.491494,-0.036006,-0.000060,1.071243e-04,-0.000006,2.064486,-1.846837,103454,172.423333,100.354185,125.5,-0.980879,0.182233,47972,79.953333,61.444013,89.0,2.488920,1.288776,150.27243,1.001816,0.000176,1.001920,-0.110227,-0.487537,150.35689,1.002379,0.000251,1.002554,1.989640,-1.451404,-0.000238,0.001060,-0.000002,0.000087,0.000000,30.835999,-2.929819,-0.000248,0.001680,-1.655800e-06,0.000138,0.0,46.323563,-0.219829,0.089504,0.000597,0.000148,0.000634,4.806844,-1.734691,0.140031,0.000934,1.211388e-04,0.000877,0.552668,1.508953,0.044171,0.000294,1.026674e-04,0.000338,2.707623,-2.134799,-0.017555,-0.000117,1.033026e-04,-0.000214,-1.980851,0.134039,9660,64.400000,51.013618,16.0,-1.926529,0.115360,6910,46.066667,42.313573,6.0,-1.950850,0.118561,300.50052,1.001668,0.000206,1.001709,-1.047710,0.447769,300.65912,1.002197,0.000318,1.002294,0.190176,-0.758860,-0.000041,0.001089,-1.364900e-07,0.000063,0.0,58.774581,-3.711293,-0.000411,0.002053,-1.369017e-06,...,3.164773,0.733154,0.000009,0.000079,0.000075,1.790216,0.758723,0.000077,5.864491e-07,-0.259867,-6.967489e+02,-2.929097e-05,0.000046,30,0.000127,0.000139,1.632102,0.943471,0.000079,0.000123,0.000107,1.741227,0.972804,0.000093,2.473260e-07,-0.195165,-333.491527,-2.014435e-05,0.000091,88,0.000087,0.000111,2.039533,0.791564,0.000050,0.000114,0.000103,1.087390,0.870514,0.000084,2.157696e-07,-0.228411,-7.570795e+03,-1.877391e-05,0.000075,81,0.000108,0.000122,1.599728,0.795689,0.000065,0.000138,0.000115,1.302259,0.897712,0.000102,1.156783e-07,-0.214877,-1.137163e+04,-1.733242e-05,0.000079,37,0.000066,0.000115,2.721480,0.6628
02,0.000004,0.000110,0.000090,1.158944,0.764461,0.000119,1.208993e-06,-0.458126,-455.084352,-0.000037,0.000040,0.002124,0.005234,0.002519,5.873809,1.068967,6.146358,0.0,7.140325,2.397895,3.006461,1.002154,0.000578,1.002805,1.001701,1.001956,40.0,13.333333,20.502032,37.0,1.0,2.0,4.0,1.333333,0.577350,2.0,1.0,1.0,1195.0,398.333333,311.206255,581.0,39.0,575.0,0.002076,0.000836,0.004408,0.000767,0.001833,0.003012,0.001376,0.007255,0.000411,0.002610,0.002104,0.000814,0.004375,0.000577,0.001854,,,,2.619852,14.016216,0.007163,0.004996,0.053782,0.000603,0.005614,0.009888,0.007433,0.096552,0.000927,0.007564,0.006088,0.004394,0.055484,0.000688,0.004739,,,,0.655598,9.141956
428930,41,11351,0.001864,41-11351,600.30000,1.000500,0.000194,1.000479,-0.102242,-0.335757,600.28180,1.000470,0.000254,1.000469,0.128287,-0.210395,-1.884784e-04,0.001252,-3.146550e-07,0.000051,0.0,,,-0.000210,0.002172,-3.510817e-07,0.000089,0.0,,,0.047055,0.000078,0.000048,0.000073,0.584539,0.803946,0.136816,0.000228,9.300933e-06,0.000228,594.889339,24.430163,0.136676,0.000228,3.183415e-08,0.000228,2.706872,-1.908859,-0.136652,-0.000228,5.952166e-08,-0.000228,-1.982151,0.133582,16360223,27267.038333,3021.952883,27049.5,-0.017006,0.194480,3003171,5005.285000,3831.373475,3972.0,-0.047303,0.852849,150.07831,1.000522,0.000111,1.000487,-0.003667,-0.106204,150.07579,1.000505,0.000171,1.000411,-1.029364,0.369141,0.000309,0.000536,0.000002,0.000044,0.000000,10.206429,-0.585830,0.000271,0.000930,1.809912e-06,0.000076,0.0,18.780652,0.150879,0.012084,0.000081,0.000027,0.000074,2.010435,0.924002,0.034148,0.000228,8.138696e-08,0.000228,-1.389327,-0.730384,0.034171,0.000228,9.634912e-09,0.000228,32.535455,-5.877031,-0.034160,-0.000228,5.692277e-08,-0.000228,-1.584843,-0.644299,4212732,28084.880000,2638.984259,28636.5,0.095796,-0.522562,442000,2946.666667,2254.018329,2656.0,1.244195,1.099054,300.14554,1.000485,0.000178,1.000487,0.082977,-0.864219,300.13773,1.000459,0.000241,1.000412,-0.147260,-0.527192,-0.000110,0.000897,-3.665666e-07,0.000052,0.0,12.689356,-1.183722,-0.000189,0.001603,-6.291133e-07,...,1.473789,0.801439,0.000031,0.000076,0.000055,0.861355,0.933936,0.000073,5.034433e-10,-0.027177,2.918465e+05,-2.268164e-07,0.000034,149,0.000061,0.000068,1.061131,0.737387,0.000019,0.000099,0.000069,0.312353,0.919451,0.000099,5.894416e-10,-0.041394,-523483.118854,3.018005e-07,0.000037,447,0.000039,0.000040,1.534255,0.776848,0.000024,0.000063,0.000046,0.880489,0.931837,0.000056,3.195294e-10,-0.021550,4.487251e+05,7.707369e-08,0.000027,446,0.000038,0.000047,1.494983,0.788940,0.000014,0.000060,0.000050,0.675034,0.932300,0.000059,2.928702e-10,-0.016679,4.157925e+05,6.948591e-07,0.000025
,150,0.000062,0.000059,1.211235,0.763423,0.000041,0.000098,0.000061,0.423055,0.921784,0.000093,9.586547e-10,-0.064925,-190504.508629,-0.000003,0.000041,0.001252,0.002172,0.001654,8.634210,0.980267,0.001336,0.0,1.756378,10.551867,91.044660,1.000491,0.000179,1.000797,1.000114,1.000569,126563.0,1390.802198,2045.340679,9450.0,1.0,500.0,585.0,6.428571,6.157458,30.0,1.0,4.0,26072.0,286.505495,165.568071,580.0,18.0,265.0,0.002390,0.001159,0.006706,0.000824,0.002102,0.003412,0.001626,0.009134,0.000956,0.002970,0.002328,0.000999,0.006171,0.000847,0.002099,,,,5.623664,12.058868,0.002252,0.001799,0.020220,0.000304,0.001681,0.002925,0.002118,0.023693,0.000322,0.002292,0.002461,0.001852,0.020295,0.000328,0.001882,,,,0.000000,12.104390


In [7]:
# --- Feature selection -------------------------------------------------------
# Disabled experiment, kept for reference: drop whole feature groups returned by
# utils.get_feature_groups before training.
# feature_groups = get_feature_groups(train)
# pruned_groups = ["timeagg_450_log_return1",
#     "trade_seconds_in_bucket_450",
#     "wap1_300",
#     "timeagg_450_trade_log_return",
#     "trade_seconds_in_bucket",
#     "ask_spread_450"]
# feature_cols = list(itertools.chain.from_iterable([c for g, c in feature_groups.items() if g not in pruned_groups]))
# print(f"# features: {len(feature_cols)}")

# Identifier and target columns must never be fed to the model as features.
non_feature_cols = {'row_id', 'target', 'time_id', 'stock_id', 'logtarget'}
feature_cols = [c for c in train.columns if c not in non_feature_cols]
target_col = 'target'

# --- Model parameters --------------------------------------------------------
# Reference hyperparameters (presumably from an earlier tuning run; NOT applied below):
# {'reg_alpha': 9.594283186777315e-06, 'reg_lambda': 0.00030328360027000927, 'n_estimators': 3178, 'learning_rate': 0.019233318286949023, 'num_leaves': 1251, 'feature_fraction': 0.26088472222018966, 'bagging_fraction': 0.20674682558678448, 'bagging_freq': 25, 'min_child_samples': 263}
params = {
    'random_state': SEED,
    'objective': 'rmse',  
    'boosting_type': 'gbdt',
#     'boosting_type': 'dart',
#     'num_leaves': 100,
#     'learning_rate': 0.1,
#     'colsample_bytree': 0.8,
#     'subsample': 0.8,
#     'n_estimators': 10000,
    # Each leaf must hold at least 1% of the rows of the full training frame.
    'min_child_samples': int(0.01*train.shape[0])
}

# --- Grouped cross-validation ------------------------------------------------
# Out-of-fold predictions, stored by row POSITION in `train`.
oof_predictions = np.zeros(train.shape[0])
# Group by time_id so that rows sharing a time_id never straddle train/validation.
kfold = GroupKFold(n_splits=5)
# Column positions of the features, so rows and columns can be taken in a single
# positional .iloc call (one copy per fold, same as before).
feature_pos = train.columns.get_indexer(feature_cols)
for fold, (trn_ind, val_ind) in enumerate(kfold.split(train, groups=train.time_id)):
    print(f'Training fold {fold}')
    # split() yields positional indices, so rows are selected with .iloc rather
    # than .loc: label-based lookup is only equivalent when `train` carries a
    # default RangeIndex and would otherwise pick the wrong rows (or raise),
    # while `oof_predictions[val_ind]` below is always positional.
    x_train, x_val = train.iloc[trn_ind, feature_pos], train.iloc[val_ind, feature_pos]
    y_train, y_val = train[target_col].iloc[trn_ind], train[target_col].iloc[val_ind]

    # Root mean squared percentage error weights: weighting squared errors by
    # 1 / target**2 turns the weighted MSE into a squared *percentage* error.
    if target_col == 'logtarget':
        # The label is on a log scale here; exponentiate to weight by the raw target.
        train_weights = 1 / np.square(np.exp(y_train))
        val_weights = 1 / np.square(np.exp(y_val))
    else:
        train_weights = 1 / np.square(y_train)
        val_weights = 1 / np.square(y_val)

    # Fit with sklearn API
    # NOTE(review): the `early_stopping_rounds` / `verbose` fit kwargs belong to
    # the older LightGBM API; newer releases expect callbacks instead. Confirm
    # the installed version before upgrading.
    model = lgb.LGBMRegressor(**params)
    model.fit(x_train, 
              y_train, 
              sample_weight=train_weights,
              eval_set=[(x_val, y_val)],
              eval_sample_weight=[val_weights],
              eval_metric='rmse',
              early_stopping_rounds=100,
              verbose=False)

    # Add predictions to the out of folds array
    oof_predictions[val_ind] = model.predict(x_val)

# Predictions made on the log scale are mapped back before scoring.
if target_col == 'logtarget':
    oof_predictions = np.exp(oof_predictions)
# The score is always computed against the raw target column.
oof_score = rmspe(train['target'], oof_predictions)

print(f"oof rmspe: {oof_score}") # 0.2260 # dart 0.2465 #

Training fold 0
Training fold 1
Training fold 2
Training fold 3
Training fold 4
oof rmspe: 0.225594981740629


In [5]:
# Rank the features of `model` by importance, most important first.
# NOTE(review): `model` is whatever estimator the training loop fitted last, so
# this table reflects a single fold only, not an average over folds.
df_importance = (
    pd.DataFrame({"feature": model.feature_name_, "importance": model.feature_importances_})
    .sort_values(by=["importance"], ascending=False)
    .reset_index(drop=True)
)
df_importance

Unnamed: 0,feature,importance
0,log_return1_realized_volatility,86
1,trade_log_return_realized_volatility_std_time,74
2,log_return1_realized_volatility_450_median_stock,74
3,log_return1_kurtosis_150,69
4,trade_log_return_realized_volatility_450_media...,61
...,...,...
419,total_volume_kurtosis_450,0
420,total_volume_median_450,0
421,log_return2_realized_volatility_max_stock,0
422,bid_spread_mean_150,0
