In [16]:
SEED=42
# SEEDS = [42, 0, 2000,]
SEEDS = [42]

import os
import glob
from joblib import Parallel, delayed
import pandas as pd
import numpy as np
import scipy as sc
from sklearn.model_selection import KFold, GroupKFold
import lightgbm as lgb
import warnings
warnings.filterwarnings('ignore')
pd.set_option('max_columns', 300)
pd.set_option('max_rows', 300)

# Function to read our base train and test set
def read_train_test():
    train = pd.read_csv('../input/optiver-realized-volatility-prediction/train.csv')
    test = pd.read_csv('../input/optiver-realized-volatility-prediction/test.csv')
    # Create a key to merge with book and trade data
    train['row_id'] = train['stock_id'].astype(str) + '-' + train['time_id'].astype(str)
    test['row_id'] = test['stock_id'].astype(str) + '-' + test['time_id'].astype(str)
    print(f'Our training set has {train.shape[0]} rows')
    return train, test

# Function to get group stats for the stock_id and time_id
def get_time_stock(df):
    # Get realized volatility columns
    vol_cols = ['log_return1_realized_volatility', 'log_return2_realized_volatility', 'log_return1_realized_volatility_450', 'log_return2_realized_volatility_450', 
                'log_return1_realized_volatility_300', 'log_return2_realized_volatility_300', 'log_return1_realized_volatility_150', 'log_return2_realized_volatility_150', 
                'trade_log_return_realized_volatility', 'trade_log_return_realized_volatility_450', 'trade_log_return_realized_volatility_300', 'trade_log_return_realized_volatility_150']

    # Group by the stock id
    df_stock_id = df.groupby(['stock_id'])[vol_cols].agg(['mean', 'std', 'max', 'min', 'median']).reset_index()
    # Rename columns joining suffix
    df_stock_id.columns = ['_'.join(col) for col in df_stock_id.columns]
    df_stock_id = df_stock_id.add_suffix('_' + 'stock')

    # Group by the time id
    df_time_id = df.groupby(['time_id'])[vol_cols].agg(['mean', 'std', 'max', 'min', 'median']).reset_index()
    # Rename columns joining suffix
    df_time_id.columns = ['_'.join(col) for col in df_time_id.columns]
    df_time_id = df_time_id.add_suffix('_' + 'time')
    
    # Merge with original dataframe
    df = df.merge(df_stock_id, how = 'left', left_on = ['stock_id'], right_on = ['stock_id__stock'])
    df = df.merge(df_time_id, how = 'left', left_on = ['time_id'], right_on = ['time_id__time'])
    df.drop(['stock_id__stock', 'time_id__time'], axis = 1, inplace = True)
    return df

# Function to calculate the root mean squared percentage error
def rmspe(y_true, y_pred):
    return np.sqrt(np.mean(np.square((y_true - y_pred) / y_true)))

In [2]:
train, _ = read_train_test()
df_book = pd.read_csv('../input/processed-book-ffill/df_book.csv')
print(df_book.shape)
df_trade = pd.read_csv('../input/processed-book-ffill/df_trade.csv')
print(df_trade.shape)
train_ = df_book.merge(df_trade, on = ['row_id'], how = 'left')
train = train.merge(train_, on = ['row_id'], how = 'left')

# Get group stats of time_id and stock_id
train = get_time_stock(train)
train['logtarget'] = train['target'].apply(np.log)
train

Our training set has 428932 rows
(428932, 169)
(428913, 41)


Unnamed: 0,stock_id,time_id,target,row_id,wap1_sum,wap1_mean,wap1_std,wap1_median,wap2_sum,wap2_mean,wap2_std,wap2_median,log_return1_sum,log_return1_realized_volatility,log_return1_mean,log_return1_std,log_return1_median,log_return2_sum,log_return2_realized_volatility,log_return2_mean,log_return2_std,log_return2_median,wap_balance_sum,wap_balance_mean,wap_balance_std,wap_balance_median,price_spread_sum,price_spread_mean,price_spread_std,price_spread_median,bid_spread_sum,bid_spread_mean,bid_spread_std,bid_spread_median,ask_spread_sum,ask_spread_mean,ask_spread_std,ask_spread_median,total_volume_sum,total_volume_mean,total_volume_std,total_volume_median,volume_imbalance_sum,volume_imbalance_mean,volume_imbalance_std,volume_imbalance_median,wap1_sum_450,wap1_mean_450,wap1_std_450,wap1_median_450,wap2_sum_450,wap2_mean_450,wap2_std_450,wap2_median_450,log_return1_sum_450,log_return1_realized_volatility_450,log_return1_mean_450,log_return1_std_450,log_return1_median_450,log_return2_sum_450,log_return2_realized_volatility_450,log_return2_mean_450,log_return2_std_450,log_return2_median_450,wap_balance_sum_450,wap_balance_mean_450,wap_balance_std_450,wap_balance_median_450,price_spread_sum_450,price_spread_mean_450,price_spread_std_450,price_spread_median_450,bid_spread_sum_450,bid_spread_mean_450,bid_spread_std_450,bid_spread_median_450,ask_spread_sum_450,ask_spread_mean_450,ask_spread_std_450,ask_spread_median_450,total_volume_sum_450,total_volume_mean_450,total_volume_std_450,total_volume_median_450,volume_imbalance_sum_450,volume_imbalance_mean_450,volume_imbalance_std_450,volume_imbalance_median_450,wap1_sum_300,wap1_mean_300,wap1_std_300,wap1_median_300,wap2_sum_300,wap2_mean_300,wap2_std_300,wap2_median_300,log_return1_sum_300,log_return1_realized_volatility_300,log_return1_mean_300,log_return1_std_300,log_return1_median_300,log_return2_sum_300,log_return2_realized_volatility_300,log_return2_mean_300,log_return2_std_300,log_return2_median_300,wap_balance_sum_300,wap_balance_mean_300,wap_balance_std_300,wap_balance_median_300,price_spread_sum_300,price_spread_mean_300,price_spread_std_300,price_spread_median_300,bid_spread_sum_300,bid_spread_mean_300,bid_spread_std_300,bid_spread_median_300,ask_spread_sum_300,ask_spread_mean_300,ask_spread_std_300,ask_spread_median_300,total_volume_sum_300,total_volume_mean_300,total_volume_std_300,total_volume_median_300,volume_imbalance_sum_300,volume_imbalance_mean_300,volume_imbalance_std_300,volume_imbalance_median_300,wap1_sum_150,wap1_mean_150,wap1_std_150,wap1_median_150,wap2_sum_150,wap2_mean_150,wap2_std_150,wap2_median_150,log_return1_sum_150,log_return1_realized_volatility_150,log_return1_mean_150,log_return1_std_150,log_return1_median_150,log_return2_sum_150,log_return2_realized_volatility_150,log_return2_mean_150,log_return2_std_150,log_return2_median_150,wap_balance_sum_150,wap_balance_mean_150,...,trade_seconds_in_bucket_count_unique_450,trade_size_mean_450,trade_size_median_450,trade_size_std_450,trade_size_sum_450,trade_order_count_mean_450,trade_order_count_median_450,trade_order_count_std_450,trade_order_count_sum_450,trade_log_return_realized_volatility_300,trade_seconds_in_bucket_count_unique_300,trade_size_mean_300,trade_size_median_300,trade_size_std_300,trade_size_sum_300,trade_order_count_mean_300,trade_order_count_median_300,trade_order_count_std_300,trade_order_count_sum_300,trade_log_return_realized_volatility_150,trade_seconds_in_bucket_count_unique_150,trade_size_mean_150,trade_size_median_150,trade_size_std_150,trade_size_sum_150,trade_order_count_mean_150,trade_order_count_median_150,trade_order_count_std_150,trade_order_count_sum_150,log_return1_realized_volatility_mean_stock,log_return1_realized_volatility_std_stock,log_return1_realized_volatility_max_stock,log_return1_realized_volatility_min_stock,log_return1_realized_volatility_median_stock,log_return2_realized_volatility_mean_stock,log_return2_realized_volatility_std_stock,log_return2_realized_volatility_max_stock,log_return2_realized_volatility_min_stock,log_return2_realized_volatility_median_stock,log_return1_realized_volatility_450_mean_stock,log_return1_realized_volatility_450_std_stock,log_return1_realized_volatility_450_max_stock,log_return1_realized_volatility_450_min_stock,log_return1_realized_volatility_450_median_stock,log_return2_realized_volatility_450_mean_stock,log_return2_realized_volatility_450_std_stock,log_return2_realized_volatility_450_max_stock,log_return2_realized_volatility_450_min_stock,log_return2_realized_volatility_450_median_stock,log_return1_realized_volatility_300_mean_stock,log_return1_realized_volatility_300_std_stock,log_return1_realized_volatility_300_max_stock,log_return1_realized_volatility_300_min_stock,log_return1_realized_volatility_300_median_stock,log_return2_realized_volatility_300_mean_stock,log_return2_realized_volatility_300_std_stock,log_return2_realized_volatility_300_max_stock,log_return2_realized_volatility_300_min_stock,log_return2_realized_volatility_300_median_stock,log_return1_realized_volatility_150_mean_stock,log_return1_realized_volatility_150_std_stock,log_return1_realized_volatility_150_max_stock,log_return1_realized_volatility_150_min_stock,log_return1_realized_volatility_150_median_stock,log_return2_realized_volatility_150_mean_stock,log_return2_realized_volatility_150_std_stock,log_return2_realized_volatility_150_max_stock,log_return2_realized_volatility_150_min_stock,log_return2_realized_volatility_150_median_stock,trade_log_return_realized_volatility_mean_stock,trade_log_return_realized_volatility_std_stock,trade_log_return_realized_volatility_max_stock,trade_log_return_realized_volatility_min_stock,trade_log_return_realized_volatility_median_stock,trade_log_return_realized_volatility_450_mean_stock,trade_log_return_realized_volatility_450_std_stock,trade_log_return_realized_volatility_450_max_stock,trade_log_return_realized_volatility_450_min_stock,trade_log_return_realized_volatility_450_median_stock,trade_log_return_realized_volatility_300_mean_stock,trade_log_return_realized_volatility_300_std_stock,trade_log_return_realized_volatility_300_max_stock,trade_log_return_realized_volatility_300_min_stock,trade_log_return_realized_volatility_300_median_stock,trade_log_return_realized_volatility_150_mean_stock,trade_log_return_realized_volatility_150_std_stock,trade_log_return_realized_volatility_150_max_stock,trade_log_return_realized_volatility_150_min_stock,trade_log_return_realized_volatility_150_median_stock,log_return1_realized_volatility_mean_time,log_return1_realized_volatility_std_time,log_return1_realized_volatility_max_time,log_return1_realized_volatility_min_time,log_return1_realized_volatility_median_time,log_return2_realized_volatility_mean_time,log_return2_realized_volatility_std_time,log_return2_realized_volatility_max_time,log_return2_realized_volatility_min_time,log_return2_realized_volatility_median_time,log_return1_realized_volatility_450_mean_time,log_return1_realized_volatility_450_std_time,log_return1_realized_volatility_450_max_time,log_return1_realized_volatility_450_min_time,log_return1_realized_volatility_450_median_time,log_return2_realized_volatility_450_mean_time,log_return2_realized_volatility_450_std_time,log_return2_realized_volatility_450_max_time,log_return2_realized_volatility_450_min_time,log_return2_realized_volatility_450_median_time,log_return1_realized_volatility_300_mean_time,log_return1_realized_volatility_300_std_time,log_return1_realized_volatility_300_max_time,log_return1_realized_volatility_300_min_time,log_return1_realized_volatility_300_median_time,log_return2_realized_volatility_300_mean_time,log_return2_realized_volatility_300_std_time,log_return2_realized_volatility_300_max_time,log_return2_realized_volatility_300_min_time,log_return2_realized_volatility_300_median_time,log_return1_realized_volatility_150_mean_time,log_return1_realized_volatility_150_std_time,log_return1_realized_volatility_150_max_time,log_return1_realized_volatility_150_min_time,log_return1_realized_volatility_150_median_time,log_return2_realized_volatility_150_mean_time,log_return2_realized_volatility_150_std_time,log_return2_realized_volatility_150_max_time,log_return2_realized_volatility_150_min_time,log_return2_realized_volatility_150_median_time,trade_log_return_realized_volatility_mean_time,trade_log_return_realized_volatility_std_time,trade_log_return_realized_volatility_max_time,trade_log_return_realized_volatility_min_time,trade_log_return_realized_volatility_median_time,trade_log_return_realized_volatility_450_mean_time,trade_log_return_realized_volatility_450_std_time,trade_log_return_realized_volatility_450_max_time,trade_log_return_realized_volatility_450_min_time,trade_log_return_realized_volatility_450_median_time,trade_log_return_realized_volatility_300_mean_time,trade_log_return_realized_volatility_300_std_time,trade_log_return_realized_volatility_300_max_time,trade_log_return_realized_volatility_300_min_time,trade_log_return_realized_volatility_300_median_time,trade_log_return_realized_volatility_150_mean_time,trade_log_return_realized_volatility_150_std_time,trade_log_return_realized_volatility_150_max_time,trade_log_return_realized_volatility_150_min_time,trade_log_return_realized_volatility_150_median_time,logtarget
0,0,5,0.004136,0-5,602.21423,1.003690,0.000702,1.003862,602.15405,1.003590,0.000829,1.003777,0.002292,0.004499,3.825914e-06,0.000184,0.0,0.002325,0.006999,3.881997e-06,0.000286,0.0,0.236105,0.000394,0.000303,0.000317,0.518973,0.000865,0.000212,0.000876,0.109890,0.000183,0.000166,0.000103,-0.078963,-0.000132,0.000111,-0.000103,187640,312.733333,137.593491,304.0,84124,140.206667,110.228465,119.0,150.53326,1.003555,0.000558,1.003731,150.51950,1.003463,0.000662,1.003721,-0.000361,0.001722,-2.409727e-06,0.000141,0.0,0.000068,0.004114,4.537046e-07,0.000337,0.0,0.048312,0.000322,0.000272,0.000262,0.115701,0.000771,0.000177,0.000876,0.034752,0.000232,0.000177,0.000103,-0.019135,-0.000128,0.000112,-0.000052,37829,252.193333,106.508890,255.5,24453,163.020000,80.862587,158.0,301.13525,1.003784,0.000496,1.003849,301.10052,1.003668,0.000578,1.003768,0.000157,0.002953,5.241972e-07,0.000171,0.0,0.000274,0.004864,9.122584e-07,0.000281,0.0,0.106716,0.000356,0.000269,0.000307,0.249618,0.000832,0.000237,0.000876,0.064952,0.000217,0.000169,0.000103,-0.038580,-0.000129,0.000113,-0.000052,84729,282.430000,133.923324,275.0,45347,151.156667,95.469683,124.0,451.72480,1.003833,0.000457,1.003917,451.68774,1.003751,0.000528,1.003843,0.000276,0.003796,6.131817e-07,0.000179,0.0,0.000003,0.006087,6.597903e-09,0.000287,0.0,0.168148,0.000374,...,14.0,74.428571,10.5,137.880502,1042.0,2.642857,2.0,2.023217,37.0,0.001308,21.0,75.571429,6.0,141.675888,1587.0,2.571429,2.0,2.292846,54.0,0.001701,30.0,68.966667,7.0,122.252560,2069.0,2.433333,2.0,2.062528,73.0,0.004459,0.003698,0.052704,0.000747,0.003302,0.006856,0.005494,0.086670,0.001347,0.005213,0.002020,0.001690,0.036490,0.000047,0.001527,0.003102,0.002308,0.028931,0.000000,0.002465,0.002973,0.002408,0.050501,0.000227,0.002270,0.004559,0.003414,0.047745,0.000454,0.003572,0.003751,0.003075,0.052446,0.000485,0.002818,0.005746,0.004383,0.059070,0.000941,0.004461,0.002330,0.001763,0.028551,0.000000,0.001791,0.001102,0.000860,0.008911,0.000000,0.000867,0.001613,0.001212,0.021736,0.000000,0.001258,0.002028,0.001545,0.027483,0.000000,0.001566,0.004583,0.002185,0.014391,0.001429,0.004141,0.006028,0.003248,0.024314,0.001970,0.005662,0.002144,0.001098,0.008361,0.000714,0.001917,0.002799,0.001415,0.008819,0.000841,0.002582,0.003033,0.001487,0.009931,0.000944,0.002755,0.003999,0.002142,0.015091,0.001343,0.003667,0.003884,0.001939,0.012437,0.001233,0.003543,0.005075,0.002795,0.020310,0.001693,0.004534,0.002675,0.000943,0.006251,0.001109,0.002532,0.001308,0.000504,0.003242,0.000543,0.001245,0.001820,0.000692,0.004595,0.000710,0.001664,0.002286,0.000836,0.005362,0.000888,0.002165,-5.488082
1,0,11,0.001445,0-11,600.11053,1.000184,0.000263,1.000196,600.09200,1.000153,0.000276,1.000117,0.000360,0.001204,6.014438e-07,0.000049,0.0,0.000801,0.002476,1.336801e-06,0.000101,0.0,0.123366,0.000206,0.000143,0.000212,0.259401,0.000432,0.000185,0.000402,0.078852,0.000131,0.000131,0.000050,-0.082809,-0.000138,0.000071,-0.000151,228378,380.630000,172.053743,350.5,77466,129.110000,94.455038,99.0,150.07066,1.000471,0.000218,1.000365,150.05269,1.000351,0.000303,1.000275,-0.000059,0.000918,-3.932587e-07,0.000075,0.0,0.000488,0.001883,3.252445e-06,0.000154,0.0,0.038899,0.000259,0.000140,0.000247,0.057944,0.000386,0.000164,0.000301,0.026803,0.000179,0.000210,0.000050,-0.020727,-0.000138,0.000066,-0.000151,62317,415.446667,189.278054,374.0,14745,98.300000,96.763099,78.0,300.11435,1.000381,0.000191,1.000321,300.09717,1.000324,0.000247,1.000360,0.000096,0.000981,3.213850e-07,0.000057,0.0,0.000413,0.002009,1.375524e-06,0.000116,0.0,0.070866,0.000236,0.000141,0.000247,0.109072,0.000364,0.000139,0.000351,0.041612,0.000139,0.000158,0.000050,-0.036486,-0.000122,0.000059,-0.000100,136900,456.333333,189.160376,456.5,37016,123.386667,102.993021,87.0,450.12970,1.000288,0.000208,1.000244,450.10610,1.000236,0.000258,1.000192,0.000298,0.001058,6.619052e-07,0.000050,0.0,0.000873,0.002262,1.939473e-06,0.000107,0.0,0.089617,0.000199,...,10.0,82.800000,19.0,107.246134,828.0,2.200000,1.0,2.097618,22.0,0.000587,16.0,56.250000,12.5,90.504144,900.0,2.250000,1.0,1.807392,36.0,0.000813,24.0,48.875000,5.5,83.807913,1173.0,2.041667,1.0,1.573674,49.0,0.004459,0.003698,0.052704,0.000747,0.003302,0.006856,0.005494,0.086670,0.001347,0.005213,0.002020,0.001690,0.036490,0.000047,0.001527,0.003102,0.002308,0.028931,0.000000,0.002465,0.002973,0.002408,0.050501,0.000227,0.002270,0.004559,0.003414,0.047745,0.000454,0.003572,0.003751,0.003075,0.052446,0.000485,0.002818,0.005746,0.004383,0.059070,0.000941,0.004461,0.002330,0.001763,0.028551,0.000000,0.001791,0.001102,0.000860,0.008911,0.000000,0.000867,0.001613,0.001212,0.021736,0.000000,0.001258,0.002028,0.001545,0.027483,0.000000,0.001566,0.002206,0.001292,0.007436,0.000509,0.001968,0.003193,0.001797,0.009370,0.000632,0.002794,0.001000,0.000582,0.003656,0.000174,0.000904,0.001455,0.000839,0.004079,0.000110,0.001292,0.001411,0.000759,0.003792,0.000291,0.001325,0.002073,0.001157,0.005398,0.000252,0.001880,0.001834,0.001080,0.005812,0.000407,0.001634,0.002695,0.001566,0.008323,0.000507,0.002269,0.001331,0.000747,0.005637,0.000000,0.001146,0.000621,0.000363,0.002701,0.000000,0.000568,0.000906,0.000460,0.002783,0.000000,0.000843,0.001140,0.000583,0.002851,0.000000,0.000975,-6.539932
2,0,16,0.002168,0-16,599.62950,0.999382,0.000926,0.999595,599.70780,0.999513,0.001005,0.999699,-0.002074,0.002369,-3.462679e-06,0.000097,0.0,-0.001493,0.004801,-2.492618e-06,0.000196,0.0,0.231060,0.000385,0.000261,0.000366,0.439923,0.000733,0.000159,0.000718,0.127955,0.000213,0.000203,0.000096,-0.142032,-0.000237,0.000187,-0.000192,250465,417.441667,127.822328,420.0,88737,147.895000,123.922147,111.0,149.70398,0.998027,0.000587,0.998210,149.72102,0.998140,0.000944,0.998397,-0.001469,0.001158,-9.795031e-06,0.000094,0.0,-0.001831,0.002972,-1.220757e-05,0.000243,0.0,0.060879,0.000406,0.000243,0.000379,0.091635,0.000611,0.000089,0.000671,0.047392,0.000316,0.000292,0.000096,-0.032791,-0.000219,0.000139,-0.000239,65240,434.933333,89.137980,426.0,33082,220.546667,115.800371,195.0,299.64136,0.998805,0.000923,0.999072,299.67490,0.998916,0.001043,0.999465,-0.002591,0.001295,-8.637301e-06,0.000074,0.0,-0.001549,0.003196,-5.163603e-06,0.000185,0.0,0.140363,0.000468,0.000250,0.000448,0.221500,0.000738,0.000164,0.000672,0.057395,0.000191,0.000242,0.000048,-0.090712,-0.000302,0.000186,-0.000239,126369,421.230000,113.050158,426.0,47815,159.383333,119.709751,121.0,449.59010,0.999089,0.000888,0.999297,449.65400,0.999231,0.000994,0.999465,-0.002854,0.002138,-6.343196e-06,0.000101,0.0,-0.002986,0.004019,-6.635058e-06,0.000190,0.0,0.195632,0.000435,...,9.0,120.555556,13.0,143.461764,1085.0,3.666667,3.0,2.915476,33.0,0.001137,12.0,99.083333,12.0,130.679663,1189.0,3.166667,2.5,2.691175,38.0,0.001621,20.0,100.500000,29.5,120.976509,2010.0,2.950000,2.0,2.459675,59.0,0.004459,0.003698,0.052704,0.000747,0.003302,0.006856,0.005494,0.086670,0.001347,0.005213,0.002020,0.001690,0.036490,0.000047,0.001527,0.003102,0.002308,0.028931,0.000000,0.002465,0.002973,0.002408,0.050501,0.000227,0.002270,0.004559,0.003414,0.047745,0.000454,0.003572,0.003751,0.003075,0.052446,0.000485,0.002818,0.005746,0.004383,0.059070,0.000941,0.004461,0.002330,0.001763,0.028551,0.000000,0.001791,0.001102,0.000860,0.008911,0.000000,0.000867,0.001613,0.001212,0.021736,0.000000,0.001258,0.002028,0.001545,0.027483,0.000000,0.001566,0.002289,0.000739,0.005226,0.001039,0.002203,0.003313,0.001356,0.012372,0.001104,0.002985,0.001150,0.000445,0.002957,0.000424,0.001067,0.001677,0.000643,0.003679,0.000612,0.001557,0.001627,0.000599,0.003883,0.000728,0.001527,0.002337,0.000956,0.008073,0.000775,0.002210,0.002003,0.000672,0.004962,0.000830,0.001894,0.002870,0.001161,0.010223,0.000955,0.002594,0.001541,0.000551,0.003609,0.000841,0.001424,0.000796,0.000371,0.002751,0.000114,0.000693,0.001100,0.000428,0.003082,0.000497,0.000999,0.001347,0.000484,0.003414,0.000717,0.001231,-6.133863
3,0,31,0.002195,0-31,599.26965,0.998783,0.000791,0.998615,599.18396,0.998640,0.000647,0.998568,-0.002828,0.002574,-4.721707e-06,0.000105,0.0,-0.002053,0.003637,-3.427948e-06,0.000149,0.0,0.233864,0.000390,0.000235,0.000419,0.538276,0.000897,0.000252,0.000973,0.094576,0.000158,0.000186,0.000093,-0.058204,-0.000097,0.000077,-0.000046,279314,465.523333,170.065163,454.0,73030,121.716667,111.004112,104.0,149.72840,0.998189,0.000367,0.998125,149.78554,0.998570,0.000417,0.998751,-0.000526,0.000993,-3.504679e-06,0.000081,0.0,-0.000882,0.001424,-5.880876e-06,0.000116,0.0,0.057724,0.000385,0.000246,0.000354,0.156023,0.001040,0.000063,0.001019,0.015872,0.000106,0.000036,0.000093,-0.008004,-0.000053,0.000017,-0.000046,90503,603.353333,186.573020,611.0,14847,98.980000,88.608669,88.5,299.50380,0.998346,0.000396,0.998397,299.53333,0.998444,0.000425,0.998568,-0.001179,0.001776,-3.929532e-06,0.000103,0.0,-0.000440,0.002713,-1.465964e-06,0.000157,0.0,0.105733,0.000352,0.000246,0.000354,0.268060,0.000894,0.000229,0.001019,0.049231,0.000164,0.000178,0.000093,-0.026143,-0.000087,0.000065,-0.000046,140791,469.303333,194.186489,376.5,35483,118.276667,85.061379,139.0,449.28284,0.998406,0.000354,0.998418,449.26535,0.998367,0.000399,0.998268,-0.001291,0.002196,-2.867828e-06,0.000104,0.0,-0.001112,0.003273,-2.470517e-06,0.000154,0.0,0.163870,0.000364,...,3.0,171.333333,59.0,242.838080,514.0,3.666667,2.0,3.785939,11.0,0.001089,9.0,172.888889,116.0,167.747909,1556.0,5.111111,4.0,4.702245,46.0,0.001401,11.0,148.272727,70.0,160.381477,1631.0,4.545455,3.0,4.412791,50.0,0.004459,0.003698,0.052704,0.000747,0.003302,0.006856,0.005494,0.086670,0.001347,0.005213,0.002020,0.001690,0.036490,0.000047,0.001527,0.003102,0.002308,0.028931,0.000000,0.002465,0.002973,0.002408,0.050501,0.000227,0.002270,0.004559,0.003414,0.047745,0.000454,0.003572,0.003751,0.003075,0.052446,0.000485,0.002818,0.005746,0.004383,0.059070,0.000941,0.004461,0.002330,0.001763,0.028551,0.000000,0.001791,0.001102,0.000860,0.008911,0.000000,0.000867,0.001613,0.001212,0.021736,0.000000,0.001258,0.002028,0.001545,0.027483,0.000000,0.001566,0.002598,0.001259,0.006787,0.000354,0.002232,0.003622,0.001779,0.009417,0.000488,0.003374,0.001191,0.000683,0.003717,0.000179,0.000999,0.001637,0.000872,0.004377,0.000277,0.001443,0.001714,0.000867,0.004712,0.000258,0.001507,0.002413,0.001211,0.006672,0.000359,0.002191,0.002203,0.001130,0.006071,0.000290,0.001937,0.003054,0.001541,0.008290,0.000407,0.002820,0.001561,0.000742,0.005395,0.000313,0.001356,0.000696,0.000452,0.003404,0.000000,0.000618,0.001052,0.000600,0.004218,0.000000,0.000934,0.001349,0.000698,0.004974,0.000269,0.001172,-6.121454
4,0,62,0.001747,0-62,599.77264,0.999621,0.000274,0.999585,599.80664,0.999678,0.000299,0.999807,-0.000002,0.001894,-2.985050e-09,0.000077,0.0,-0.000281,0.003257,-4.683512e-07,0.000133,0.0,0.150974,0.000252,0.000199,0.000230,0.240802,0.000401,0.000122,0.000373,0.114073,0.000190,0.000080,0.000187,-0.065728,-0.000110,0.000069,-0.000093,199573,332.621667,153.960932,316.0,67253,112.088333,101.350582,93.0,149.92055,0.999470,0.000274,0.999417,149.96729,0.999782,0.000187,0.999834,0.000397,0.001378,2.646369e-06,0.000113,0.0,-0.000298,0.000966,-1.988698e-06,0.000079,0.0,0.061375,0.000409,0.000160,0.000371,0.072794,0.000485,0.000127,0.000420,0.029652,0.000198,0.000026,0.000187,-0.021676,-0.000145,0.000067,-0.000186,56104,374.026667,118.762803,398.0,16796,111.973333,99.667565,85.0,299.84183,0.999473,0.000222,0.999427,299.90152,0.999672,0.000260,0.999606,0.000645,0.001520,2.150864e-06,0.000088,0.0,-0.000201,0.002188,-6.710789e-07,0.000127,0.0,0.090602,0.000302,0.000192,0.000324,0.131321,0.000438,0.000130,0.000420,0.058974,0.000197,0.000067,0.000187,-0.039530,-0.000132,0.000070,-0.000140,123184,410.613333,157.792942,399.0,29194,97.313333,92.291971,85.0,449.81912,0.999598,0.000269,0.999577,449.87457,0.999721,0.000265,0.999834,0.000491,0.001609,1.091611e-06,0.000076,0.0,0.000299,0.002927,6.640250e-07,0.000138,0.0,0.115498,0.000257,...,4.0,10.750000,4.0,15.585784,43.0,3.500000,1.5,4.358899,14.0,0.000453,11.0,110.818182,34.0,140.061285,1219.0,4.909091,2.0,4.887833,54.0,0.000550,16.0,98.125000,20.0,127.212093,1570.0,4.500000,2.0,4.412105,72.0,0.004459,0.003698,0.052704,0.000747,0.003302,0.006856,0.005494,0.086670,0.001347,0.005213,0.002020,0.001690,0.036490,0.000047,0.001527,0.003102,0.002308,0.028931,0.000000,0.002465,0.002973,0.002408,0.050501,0.000227,0.002270,0.004559,0.003414,0.047745,0.000454,0.003572,0.003751,0.003075,0.052446,0.000485,0.002818,0.005746,0.004383,0.059070,0.000941,0.004461,0.002330,0.001763,0.028551,0.000000,0.001791,0.001102,0.000860,0.008911,0.000000,0.000867,0.001613,0.001212,0.021736,0.000000,0.001258,0.002028,0.001545,0.027483,0.000000,0.001566,0.002041,0.000947,0.005626,0.000472,0.001857,0.003036,0.001572,0.008931,0.000640,0.002734,0.000937,0.000523,0.002687,0.000010,0.000827,0.001372,0.000746,0.004716,0.000155,0.001227,0.001360,0.000651,0.003832,0.000351,0.001180,0.002033,0.001057,0.005446,0.000432,0.001770,0.001697,0.000765,0.004734,0.000390,0.001503,0.002555,0.001333,0.006868,0.000507,0.002245,0.001222,0.000539,0.003759,0.000397,0.001068,0.000555,0.000282,0.001936,0.000158,0.000491,0.000812,0.000372,0.002470,0.000278,0.000726,0.001036,0.000466,0.003281,0.000317,0.000879,-6.349732
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
428927,126,32751,0.003461,126-32751,599.74090,0.999568,0.000471,0.999575,599.76700,0.999612,0.000629,0.999570,-0.000527,0.003691,-8.805515e-07,0.000151,0.0,-0.000960,0.005876,-1.602486e-06,0.000240,0.0,0.229176,0.000382,0.000288,0.000326,0.521890,0.000870,0.000223,0.000882,0.054663,0.000091,0.000115,0.000033,-0.124835,-0.000208,0.000158,-0.000229,251084,418.473333,152.901015,420.0,96898,161.496667,135.047361,109.0,149.89204,0.999280,0.000269,0.999267,149.86443,0.999096,0.000316,0.999087,0.000314,0.001701,2.090094e-06,0.000139,0.0,-0.000864,0.002461,-5.762912e-06,0.000202,0.0,0.050836,0.000339,0.000229,0.000229,0.125534,0.000837,0.000176,0.000866,0.013714,0.000091,0.000088,0.000033,-0.018449,-0.000123,0.000128,-0.000065,55169,367.793333,138.771663,322.0,18331,122.206667,81.899701,103.0,299.81550,0.999385,0.000301,0.999345,299.78455,0.999282,0.000347,0.999412,0.000327,0.002899,1.091175e-06,0.000168,0.0,-0.000449,0.003776,-1.496513e-06,0.000218,0.0,0.089975,0.000300,0.000242,0.000208,0.268271,0.000894,0.000214,0.000882,0.025339,0.000084,0.000114,0.000033,-0.047055,-0.000157,0.000119,-0.000196,118991,396.636667,133.090828,402.0,46521,155.070000,122.095849,106.5,449.71948,0.999377,0.000339,0.999452,449.73320,0.999407,0.000551,0.999445,-0.000350,0.003438,-7.788715e-07,0.000162,0.0,-0.000922,0.005201,-2.048826e-06,0.000245,0.0,0.177888,0.000395,...,12.0,40.916667,12.0,61.842113,491.0,1.833333,1.0,1.337116,22.0,0.001451,18.0,44.222222,14.5,57.245144,796.0,2.055556,1.5,1.392088,37.0,0.001924,27.0,52.814815,17.0,64.651752,1426.0,2.259259,2.0,1.654658,61.0,0.005800,0.004063,0.045786,0.001076,0.004609,0.008262,0.005659,0.072964,0.001539,0.006619,0.002682,0.001824,0.017742,0.000237,0.002175,0.003825,0.002492,0.024892,0.000293,0.003138,0.003896,0.002592,0.023843,0.000598,0.003157,0.005544,0.003544,0.040637,0.000866,0.004537,0.004881,0.003313,0.031950,0.000623,0.003921,0.006928,0.004505,0.044264,0.001151,0.005652,0.003117,0.002053,0.021485,0.000509,0.002513,0.001468,0.000996,0.010657,0.000002,0.001196,0.002149,0.001394,0.013680,0.000268,0.001768,0.002688,0.001744,0.019110,0.000339,0.002182,0.002975,0.001542,0.012393,0.000865,0.002633,0.004081,0.002084,0.014936,0.001205,0.003705,0.001499,0.000678,0.004133,0.000441,0.001289,0.002070,0.001052,0.006893,0.000624,0.001832,0.002036,0.000905,0.005720,0.000561,0.001874,0.002830,0.001397,0.009094,0.000927,0.002551,0.002589,0.001384,0.011390,0.000792,0.002361,0.003540,0.001848,0.013275,0.001087,0.003218,0.001805,0.000730,0.005121,0.000722,0.001646,0.000909,0.000372,0.003079,0.000000,0.000850,0.001261,0.000485,0.004049,0.000534,0.001164,0.001576,0.000651,0.004783,0.000647,0.001447,-5.666308
428928,126,32753,0.003113,126-32753,601.44480,1.002408,0.001165,1.002360,601.50560,1.002509,0.001204,1.002768,0.004436,0.004104,7.405183e-06,0.000168,0.0,0.004829,0.004991,8.061013e-06,0.000204,0.0,0.168830,0.000281,0.000216,0.000222,0.402075,0.000670,0.000217,0.000585,0.084885,0.000141,0.000139,0.000069,-0.072828,-0.000121,0.000112,-0.000069,133355,222.258333,176.419381,163.5,77605,129.341667,140.363938,76.0,150.57918,1.003861,0.000879,1.003464,150.58992,1.003933,0.000857,1.003535,0.002632,0.002613,1.754373e-05,0.000213,0.0,0.002500,0.002698,1.666703e-05,0.000220,0.0,0.033051,0.000220,0.000232,0.000125,0.095944,0.000640,0.000278,0.000516,0.014855,0.000099,0.000121,0.000034,-0.021403,-0.000143,0.000118,-0.000069,28422,189.480000,191.316973,71.0,13712,91.413333,132.452103,23.0,301.00390,1.003346,0.000833,1.003085,301.05185,1.003506,0.000768,1.003298,0.003337,0.003454,1.112384e-05,0.000199,0.0,0.003007,0.003402,1.002277e-05,0.000196,0.0,0.072718,0.000242,0.000210,0.000191,0.197961,0.000660,0.000252,0.000516,0.045218,0.000151,0.000157,0.000035,-0.042083,-0.000140,0.000121,-0.000103,56748,189.160000,197.275255,81.0,34716,115.720000,163.561782,23.0,451.27390,1.002831,0.001035,1.002875,451.31580,1.002924,0.001105,1.003084,0.004116,0.003972,9.147641e-06,0.000187,0.0,0.004016,0.004569,8.923740e-06,0.000215,0.0,0.122441,0.000272,...,13.0,25.076923,3.0,54.619077,326.0,1.769231,2.0,0.926809,23.0,0.001791,20.0,55.350000,19.5,80.625368,1107.0,3.550000,2.0,3.831655,71.0,0.002101,31.0,50.000000,18.0,70.259044,1550.0,3.161290,2.0,3.317597,98.0,0.005800,0.004063,0.045786,0.001076,0.004609,0.008262,0.005659,0.072964,0.001539,0.006619,0.002682,0.001824,0.017742,0.000237,0.002175,0.003825,0.002492,0.024892,0.000293,0.003138,0.003896,0.002592,0.023843,0.000598,0.003157,0.005544,0.003544,0.040637,0.000866,0.004537,0.004881,0.003313,0.031950,0.000623,0.003921,0.006928,0.004505,0.044264,0.001151,0.005652,0.003117,0.002053,0.021485,0.000509,0.002513,0.001468,0.000996,0.010657,0.000002,0.001196,0.002149,0.001394,0.013680,0.000268,0.001768,0.002688,0.001744,0.019110,0.000339,0.002182,0.002196,0.001329,0.010829,0.000517,0.001806,0.002963,0.001597,0.012168,0.000704,0.002618,0.001031,0.000668,0.004968,0.000146,0.000834,0.001404,0.000845,0.006510,0.000334,0.001169,0.001519,0.001033,0.008499,0.000361,0.001254,0.002054,0.001257,0.009971,0.000516,0.001741,0.001901,0.001229,0.010290,0.000449,0.001566,0.002568,0.001474,0.011509,0.000604,0.002225,0.001419,0.000869,0.008492,0.000454,0.001260,0.000684,0.000458,0.003531,0.000000,0.000594,0.001008,0.000687,0.006310,0.000329,0.000837,0.001241,0.000814,0.007915,0.000404,0.001064,-5.772267
428929,126,32758,0.004070,126-32758,600.56890,1.000948,0.000492,1.000837,600.54890,1.000915,0.000599,1.000828,0.001525,0.003117,2.545348e-06,0.000127,0.0,0.002525,0.006020,4.215600e-06,0.000246,0.0,0.209859,0.000350,0.000293,0.000288,0.452340,0.000754,0.000241,0.000790,0.096117,0.000160,0.000184,0.000049,-0.116510,-0.000194,0.000117,-0.000198,207530,345.883333,168.520468,335.0,153376,255.626667,162.607295,265.0,150.23146,1.001543,0.000314,1.001467,150.22218,1.001481,0.000637,1.001553,0.001962,0.001551,1.308319e-05,0.000126,0.0,0.001760,0.003079,1.173016e-05,0.000252,0.0,0.064624,0.000431,0.000349,0.000343,0.096819,0.000645,0.000260,0.000641,0.048826,0.000326,0.000243,0.000346,-0.036039,-0.000240,0.000120,-0.000247,54287,361.913333,201.137401,308.0,45953,306.353333,202.756578,218.0,300.37210,1.001240,0.000461,1.001366,300.37323,1.001244,0.000586,1.001224,0.002253,0.002792,7.511431e-06,0.000161,0.0,0.001732,0.005387,5.774980e-06,0.000311,0.0,0.125792,0.000419,0.000312,0.000343,0.207265,0.000691,0.000243,0.000788,0.068672,0.000229,0.000214,0.000173,-0.063336,-0.000211,0.000122,-0.000197,102642,342.140000,187.723398,327.0,73812,246.040000,191.583295,197.0,450.43927,1.000976,0.000550,1.000946,450.44330,1.000985,0.000652,1.000874,0.002049,0.002955,4.554322e-06,0.000139,0.0,0.002234,0.005654,4.963501e-06,0.000267,0.0,0.153097,0.000340,...,6.0,58.000000,59.0,53.669358,348.0,2.166667,1.5,1.940790,13.0,0.001580,24.0,114.583333,100.0,124.324581,2750.0,2.541667,2.0,1.955575,61.0,0.001913,31.0,112.677419,100.0,119.312304,3493.0,2.838710,2.0,1.984889,88.0,0.005800,0.004063,0.045786,0.001076,0.004609,0.008262,0.005659,0.072964,0.001539,0.006619,0.002682,0.001824,0.017742,0.000237,0.002175,0.003825,0.002492,0.024892,0.000293,0.003138,0.003896,0.002592,0.023843,0.000598,0.003157,0.005544,0.003544,0.040637,0.000866,0.004537,0.004881,0.003313,0.031950,0.000623,0.003921,0.006928,0.004505,0.044264,0.001151,0.005652,0.003117,0.002053,0.021485,0.000509,0.002513,0.001468,0.000996,0.010657,0.000002,0.001196,0.002149,0.001394,0.013680,0.000268,0.001768,0.002688,0.001744,0.019110,0.000339,0.002182,0.002402,0.000809,0.004503,0.000900,0.002315,0.003509,0.001562,0.010416,0.001095,0.003267,0.001195,0.000514,0.003381,0.000347,0.001115,0.001720,0.000831,0.004654,0.000422,0.001580,0.001665,0.000642,0.003826,0.000553,0.001514,0.002420,0.001113,0.006426,0.000736,0.002303,0.002064,0.000729,0.004044,0.000778,0.002004,0.003048,0.001458,0.010074,0.000913,0.002766,0.001491,0.000465,0.002850,0.000000,0.001517,0.000740,0.000320,0.001669,0.000000,0.000743,0.001055,0.000376,0.001995,0.000000,0.001040,0.001306,0.000422,0.002566,0.000000,0.001295,-5.504192
428930,126,32763,0.003357,126-32763,601.07590,1.001793,0.000468,1.001763,601.06866,1.001781,0.000501,1.001822,0.000256,0.003661,4.271871e-07,0.000150,0.0,0.000804,0.005362,1.341685e-06,0.000219,0.0,0.136448,0.000227,0.000176,0.000195,0.315773,0.000526,0.000160,0.000526,0.092835,0.000155,0.000122,0.000132,-0.079795,-0.000133,0.000099,-0.000066,262649,437.748333,162.905972,436.5,89365,148.941667,113.937048,119.5,150.24767,1.001651,0.000443,1.001684,150.23717,1.001581,0.000493,1.001655,-0.000914,0.001704,-6.090981e-06,0.000139,0.0,-0.000223,0.001979,-1.485572e-06,0.000162,0.0,0.025439,0.000170,0.000136,0.000126,0.068747,0.000458,0.000152,0.000460,0.022056,0.000147,0.000117,0.000066,-0.019687,-0.000131,0.000111,-0.000066,71068,473.786667,161.669461,500.0,24396,162.640000,109.212943,160.0,300.53995,1.001800,0.000486,1.001853,300.53055,1.001769,0.000508,1.001846,-0.001759,0.002379,-5.861896e-06,0.000137,0.0,-0.001379,0.003182,-4.596904e-06,0.000184,0.0,0.055616,0.000185,0.000144,0.000145,0.147859,0.000493,0.000164,0.000460,0.049182,0.000164,0.000141,0.000066,-0.035289,-0.000118,0.000090,-0.000066,144603,482.010000,154.771954,501.0,49615,165.383333,111.073975,153.5,450.83005,1.001845,0.000479,1.001853,450.81820,1.001818,0.000516,1.001859,-0.001867,0.003042,-4.149686e-06,0.000144,0.0,-0.001585,0.004462,-3.521339e-06,0.000211,0.0,0.090938,0.000202,...,22.0,104.545455,100.0,124.796874,2300.0,2.727273,2.0,2.333643,60.0,0.001520,43.0,119.767442,100.0,152.541772,5150.0,2.813953,2.0,2.280934,121.0,0.001714,62.0,117.112903,100.0,147.661343,7261.0,2.822581,2.0,2.378346,175.0,0.005800,0.004063,0.045786,0.001076,0.004609,0.008262,0.005659,0.072964,0.001539,0.006619,0.002682,0.001824,0.017742,0.000237,0.002175,0.003825,0.002492,0.024892,0.000293,0.003138,0.003896,0.002592,0.023843,0.000598,0.003157,0.005544,0.003544,0.040637,0.000866,0.004537,0.004881,0.003313,0.031950,0.000623,0.003921,0.006928,0.004505,0.044264,0.001151,0.005652,0.003117,0.002053,0.021485,0.000509,0.002513,0.001468,0.000996,0.010657,0.000002,0.001196,0.002149,0.001394,0.013680,0.000268,0.001768,0.002688,0.001744,0.019110,0.000339,0.002182,0.003117,0.001291,0.007572,0.001271,0.002807,0.004316,0.001883,0.011422,0.001557,0.003843,0.001550,0.000738,0.004069,0.000595,0.001357,0.002132,0.001055,0.006886,0.000713,0.001835,0.002170,0.000968,0.005387,0.000874,0.001994,0.003007,0.001374,0.008491,0.000986,0.002696,0.002678,0.001160,0.007137,0.001142,0.002422,0.003703,0.001634,0.010415,0.001324,0.003282,0.002105,0.000784,0.007343,0.001122,0.001948,0.001062,0.000423,0.003270,0.000400,0.001007,0.001474,0.000591,0.005284,0.000686,0.001373,0.001839,0.000731,0.006914,0.001004,0.001690,-5.696792


In [17]:
feature_cols = [c for c in train.columns if c not in ['row_id', 'target', 'time_id', 'stock_id', 'target', 'logtarget']]
wap1_cols = [c for c in feature_cols if c.split('_')[0]=='wap1']
feature_cols = [c for c in feature_cols if c not in wap1_cols]
print(f"# features: {len(feature_cols)}")

params = {
    'random_state': SEED,
    'objective': 'rmse',  
    'boosting_type': 'gbdt',
    'num_leaves': 100,
    'learning_rate': 0.1,
    'colsample_bytree': 0.8,
    'subsample': 0.8,
    'n_estimators': 10000,
    'min_child_samples': int(0.01*train.shape[0])
}

scores_by_seed = []
for j, s in enumerate(SEEDS):
    print(f"shuffle train with seed {s}")
    train_shuffled = train.sample(frac=1, random_state=s).reset_index(drop=True)
    oof_predictions = np.zeros(train.shape[0])
    kfold = GroupKFold(n_splits=5)
    for fold, (trn_ind, val_ind) in enumerate(kfold.split(train_shuffled, groups=train_shuffled.time_id)):
        print(f'Training fold {fold}')
        x_train, x_val = train_shuffled.loc[trn_ind, feature_cols], train_shuffled.loc[val_ind, feature_cols]
        y_train, y_val = train_shuffled.loc[trn_ind, 'target'], train_shuffled.loc[val_ind, 'target']
        
        # Root mean squared percentage error weights
        train_weights = 1 / np.square(y_train)
        val_weights = 1 / np.square(y_val)

        # Fit with sklearn API
        model = lgb.LGBMRegressor(**params)
        model.fit(x_train, 
                  y_train, 
                  sample_weight=train_weights,
                  eval_set=[(x_val, y_val)],
                  eval_sample_weight=[val_weights],
                  eval_metric='rmse',
                  early_stopping_rounds=100,
                  verbose=False)

        # Add predictions to the out of folds array
        oof_predictions[val_ind] = model.predict(x_val)
    oof_score = rmspe(train_shuffled['target'], oof_predictions)
    scores_by_seed.append(oof_score)

    print(f"seed {s} oof rmspe: {oof_score}") # 0.2262, 0.2263, 0.2260
print(f"score averaged by {len(SEEDS)} seeds: {np.mean(scores_by_seed)}")

# features: 328
shuffle train with seed 42
Training fold 0
Training fold 1
Training fold 2
Training fold 3
Training fold 4
seed 42 oof rmspe: 0.22625313580807158
score averaged by seed: 0.22625313580807158


In [8]:
df_importance = pd.DataFrame({"feature": model.feature_name_, "importance": model.feature_importances_})
df_importance = df_importance.sort_values(by=["importance"], ascending=False).reset_index(drop=True)
df_importance

Unnamed: 0,feature,importance
0,log_return1_realized_volatility,138
1,trade_log_return_realized_volatility_450_media...,133
2,log_return1_realized_volatility_450_median_stock,109
3,log_return2_realized_volatility_450_min_time,106
4,trade_log_return_realized_volatility_450_min_time,92
...,...,...
323,wap_balance_std_450,0
324,wap_balance_sum_450,0
325,log_return2_median_450,0
326,log_return1_median_450,0
