In [1]:
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import KFold
from sklearn.metrics import accuracy_score
# optuna経由でLightGBMをインポート
import optuna.integration.lightgbm as lgb_o

In [2]:
# csvファイルからPandas DataFrameへ読み込み
train = pd.read_csv('train.csv', delimiter=',', low_memory=False)

# 冒頭を表示して確認
train.head()

Unnamed: 0,id,feature_0,feature_1,feature_2,feature_3,feature_4,feature_5,feature_6,feature_7,feature_8,...,feature_66,feature_67,feature_68,feature_69,feature_70,feature_71,feature_72,feature_73,feature_74,target
0,0,0,0,6,1,0,0,0,0,7,...,0,0,0,0,0,0,2,0,0,Class_6
1,1,0,0,0,0,0,0,0,0,0,...,2,0,0,0,0,0,0,1,0,Class_6
2,2,0,0,0,0,0,1,0,3,0,...,0,0,0,0,1,0,0,0,0,Class_2
3,3,0,0,7,0,1,5,2,2,0,...,0,4,0,2,2,0,4,3,0,Class_8
4,4,1,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Class_2


In [3]:
# trainのtargetをカテゴリーに変換
train.target = train.target.astype('category')

train.dtypes

id               int64
feature_0        int64
feature_1        int64
feature_2        int64
feature_3        int64
                ...   
feature_71       int64
feature_72       int64
feature_73       int64
feature_74       int64
target        category
Length: 77, dtype: object

In [4]:
# ラベルエンコーディング（LabelEncoder）
le = LabelEncoder()
encoded = le.fit_transform(train.target.values)
decoded = le.inverse_transform(encoded)
train.target = encoded

# 冒頭を表示して確認
train.target.head()

0    5
1    5
2    1
3    7
4    1
Name: target, dtype: int64

In [5]:
# 訓練データとテストデータに分割
from sklearn.model_selection import train_test_split

train_set, test_set = train_test_split(train, test_size=0.2, random_state = 0)

# 表示して確認
(train_set.shape, test_set.shape)

((160000, 77), (40000, 77))

In [6]:
# 訓練データとラベルを分割する
X_train, y_train = train_set.drop(['target'], axis=1).drop(['id'], axis=1).values, train_set.target.values

# 評価データとラベルを分割する
X_test, y_test = test_set.drop(['target'], axis=1).drop(['id'], axis=1).values, test_set.target.values

# 表示して確認
(X_train.shape, y_train.shape, X_test.shape, y_test.shape)

((160000, 75), (160000,), (40000, 75), (40000,))

In [7]:
# データをセット
# 訓練データ
lgb_train = lgb_o.Dataset(X_train, y_train)
# 評価データ
lgb_eval = lgb_o.Dataset(X_test, y_test)

In [8]:
# lightgbmを実装して識別を行う--------------------------------------------------

# ハイパーパラメータサーチ&モデル構築
params = {'objective': 'multiclass',
          'num_class': 9,
          'metric': 'multi_error',
          'random_seed': 0} 

# Optunaでのパラメータ探索
gbm_o = lgb_o.train(params,
                    lgb_train,
                    valid_sets=lgb_eval,
                    early_stopping_rounds=100,
                    verbose_eval=100,)

[32m[I 2021-06-30 00:09:48,038][0m A new study created in memory with name: no-name-f35b93c2-5954-454f-9c2b-e96ec8402c09[0m
feature_fraction, val_score: inf:   0%|          | 0/7 [00:00<?, ?it/s]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.638325


feature_fraction, val_score: 0.636475:  14%|#4        | 1/7 [00:12<01:17, 12.84s/it][32m[I 2021-06-30 00:10:00,901][0m Trial 0 finished with value: 0.636475 and parameters: {'feature_fraction': 0.8999999999999999}. Best is trial 0 with value: 0.636475.[0m
feature_fraction, val_score: 0.636475:  14%|#4        | 1/7 [00:12<01:17, 12.84s/it]

Early stopping, best iteration is:
[55]	valid_0's multi_error: 0.636475
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63715


feature_fraction, val_score: 0.635950:  29%|##8       | 2/7 [00:27<01:06, 13.32s/it][32m[I 2021-06-30 00:10:15,347][0m Trial 1 finished with value: 0.63595 and parameters: {'feature_fraction': 0.8}. Best is trial 1 with value: 0.63595.[0m
feature_fraction, val_score: 0.635950:  29%|##8       | 2/7 [00:27<01:06, 13.32s/it]

Early stopping, best iteration is:
[53]	valid_0's multi_error: 0.63595
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63715


feature_fraction, val_score: 0.635950:  43%|####2     | 3/7 [00:54<01:10, 17.60s/it][32m[I 2021-06-30 00:10:42,947][0m Trial 2 finished with value: 0.6362 and parameters: {'feature_fraction': 0.6}. Best is trial 1 with value: 0.63595.[0m
feature_fraction, val_score: 0.635950:  43%|####2     | 3/7 [00:54<01:10, 17.60s/it]

Early stopping, best iteration is:
[71]	valid_0's multi_error: 0.6362
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6364


feature_fraction, val_score: 0.635075:  57%|#####7    | 4/7 [01:31<01:10, 23.34s/it][32m[I 2021-06-30 00:11:19,661][0m Trial 3 finished with value: 0.635075 and parameters: {'feature_fraction': 0.4}. Best is trial 3 with value: 0.635075.[0m
feature_fraction, val_score: 0.635075:  57%|#####7    | 4/7 [01:31<01:10, 23.34s/it]

Early stopping, best iteration is:
[54]	valid_0's multi_error: 0.635075
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.637075


feature_fraction, val_score: 0.635075:  71%|#######1  | 5/7 [01:55<00:47, 23.54s/it][32m[I 2021-06-30 00:11:43,669][0m Trial 4 finished with value: 0.6363 and parameters: {'feature_fraction': 1.0}. Best is trial 3 with value: 0.635075.[0m
feature_fraction, val_score: 0.635075:  71%|#######1  | 5/7 [01:55<00:47, 23.54s/it]

Early stopping, best iteration is:
[65]	valid_0's multi_error: 0.6363
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63645


feature_fraction, val_score: 0.634825:  86%|########5 | 6/7 [02:28<00:26, 26.49s/it][32m[I 2021-06-30 00:12:17,050][0m Trial 5 finished with value: 0.634825 and parameters: {'feature_fraction': 0.5}. Best is trial 5 with value: 0.634825.[0m
feature_fraction, val_score: 0.634825:  86%|########5 | 6/7 [02:28<00:26, 26.49s/it]

Early stopping, best iteration is:
[34]	valid_0's multi_error: 0.634825
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636525


feature_fraction, val_score: 0.634775: 100%|##########| 7/7 [02:42<00:00, 22.63s/it][32m[I 2021-06-30 00:12:30,665][0m Trial 6 finished with value: 0.634775 and parameters: {'feature_fraction': 0.7}. Best is trial 6 with value: 0.634775.[0m
feature_fraction, val_score: 0.634775: 100%|##########| 7/7 [02:42<00:00, 23.23s/it]
num_leaves, val_score: 0.634775:   0%|          | 0/20 [00:00<?, ?it/s]

Early stopping, best iteration is:
[50]	valid_0's multi_error: 0.634775
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.644875
Early stopping, best iteration is:
[28]	valid_0's multi_error: 0.637125


num_leaves, val_score: 0.634775:   5%|5         | 1/20 [00:23<07:33, 23.86s/it][32m[I 2021-06-30 00:12:54,540][0m Trial 7 finished with value: 0.637125 and parameters: {'num_leaves': 205}. Best is trial 7 with value: 0.637125.[0m
num_leaves, val_score: 0.634775:   5%|5         | 1/20 [00:23<07:33, 23.86s/it]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636625


num_leaves, val_score: 0.634775:  10%|#         | 2/20 [00:37<06:15, 20.86s/it][32m[I 2021-06-30 00:13:08,410][0m Trial 8 finished with value: 0.635225 and parameters: {'num_leaves': 32}. Best is trial 8 with value: 0.635225.[0m
num_leaves, val_score: 0.634775:  10%|#         | 2/20 [00:37<06:15, 20.86s/it]

Early stopping, best iteration is:
[68]	valid_0's multi_error: 0.635225
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.64335
Early stopping, best iteration is:
[28]	valid_0's multi_error: 0.63855


num_leaves, val_score: 0.634775:  15%|#5        | 3/20 [01:05<06:30, 22.97s/it][32m[I 2021-06-30 00:13:36,313][0m Trial 9 finished with value: 0.63855 and parameters: {'num_leaves': 186}. Best is trial 8 with value: 0.635225.[0m
num_leaves, val_score: 0.634775:  15%|#5        | 3/20 [01:05<06:30, 22.97s/it]

You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6366


num_leaves, val_score: 0.634775:  20%|##        | 4/20 [01:25<05:52, 22.04s/it][32m[I 2021-06-30 00:13:56,192][0m Trial 10 finished with value: 0.636025 and parameters: {'num_leaves': 22}. Best is trial 8 with value: 0.635225.[0m
num_leaves, val_score: 0.634775:  20%|##        | 4/20 [01:25<05:52, 22.04s/it]

Early stopping, best iteration is:
[90]	valid_0's multi_error: 0.636025
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.64225


num_leaves, val_score: 0.634775:  25%|##5       | 5/20 [01:47<05:30, 22.00s/it][32m[I 2021-06-30 00:14:18,089][0m Trial 11 finished with value: 0.638025 and parameters: {'num_leaves': 115}. Best is trial 8 with value: 0.635225.[0m
num_leaves, val_score: 0.634775:  25%|##5       | 5/20 [01:47<05:30, 22.00s/it]

Early stopping, best iteration is:
[29]	valid_0's multi_error: 0.638025
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


num_leaves, val_score: 0.633975:  30%|###       | 6/20 [02:01<04:33, 19.54s/it][32m[I 2021-06-30 00:14:31,868][0m Trial 12 finished with value: 0.633975 and parameters: {'num_leaves': 19}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  30%|###       | 6/20 [02:01<04:33, 19.54s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.645
Early stopping, best iteration is:
[17]	valid_0's multi_error: 0.638625


num_leaves, val_score: 0.633975:  35%|###5      | 7/20 [02:23<04:25, 20.39s/it][32m[I 2021-06-30 00:14:54,243][0m Trial 13 finished with value: 0.638625 and parameters: {'num_leaves': 229}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  35%|###5      | 7/20 [02:23<04:25, 20.39s/it]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.64245


num_leaves, val_score: 0.633975:  40%|####      | 8/20 [02:50<04:27, 22.27s/it]

Early stopping, best iteration is:
[24]	valid_0's multi_error: 0.6379


[32m[I 2021-06-30 00:15:20,927][0m Trial 14 finished with value: 0.6379 and parameters: {'num_leaves': 161}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  40%|####      | 8/20 [02:50<04:27, 22.27s/it]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63545


num_leaves, val_score: 0.633975:  45%|####5     | 9/20 [03:02<03:33, 19.37s/it][32m[I 2021-06-30 00:15:33,504][0m Trial 15 finished with value: 0.63475 and parameters: {'num_leaves': 20}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  45%|####5     | 9/20 [03:02<03:33, 19.37s/it]

Early stopping, best iteration is:
[73]	valid_0's multi_error: 0.63475
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.64735


num_leaves, val_score: 0.633975:  50%|#####     | 10/20 [03:26<03:25, 20.55s/it][32m[I 2021-06-30 00:15:56,823][0m Trial 16 finished with value: 0.6382 and parameters: {'num_leaves': 236}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  50%|#####     | 10/20 [03:26<03:25, 20.55s/it]

Early stopping, best iteration is:
[18]	valid_0's multi_error: 0.6382
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.640175


num_leaves, val_score: 0.633975:  55%|#####5    | 11/20 [03:42<02:53, 19.32s/it][32m[I 2021-06-30 00:16:13,280][0m Trial 17 finished with value: 0.636825 and parameters: {'num_leaves': 83}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  55%|#####5    | 11/20 [03:42<02:53, 19.32s/it]

Early stopping, best iteration is:
[33]	valid_0's multi_error: 0.636825
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.639675


num_leaves, val_score: 0.633975:  60%|######    | 12/20 [03:56<02:22, 17.77s/it][32m[I 2021-06-30 00:16:27,405][0m Trial 18 finished with value: 0.636575 and parameters: {'num_leaves': 66}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  60%|######    | 12/20 [03:56<02:22, 17.77s/it]

Early stopping, best iteration is:
[31]	valid_0's multi_error: 0.636575
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635875
[200]	valid_0's multi_error: 0.6347


num_leaves, val_score: 0.633975:  65%|######5   | 13/20 [04:07<01:48, 15.52s/it][32m[I 2021-06-30 00:16:37,698][0m Trial 19 finished with value: 0.634175 and parameters: {'num_leaves': 2}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  65%|######5   | 13/20 [04:07<01:48, 15.52s/it]

Early stopping, best iteration is:
[155]	valid_0's multi_error: 0.634175
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6362
[200]	valid_0's multi_error: 0.63575
[300]	valid_0's multi_error: 0.635725


num_leaves, val_score: 0.633975:  70%|#######   | 14/20 [04:24<01:36, 16.14s/it][32m[I 2021-06-30 00:16:55,275][0m Trial 20 finished with value: 0.634875 and parameters: {'num_leaves': 3}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  70%|#######   | 14/20 [04:24<01:36, 16.14s/it]

Early stopping, best iteration is:
[266]	valid_0's multi_error: 0.634875
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6387


num_leaves, val_score: 0.633975:  75%|#######5  | 15/20 [04:39<01:19, 15.90s/it][32m[I 2021-06-30 00:17:10,600][0m Trial 21 finished with value: 0.6352 and parameters: {'num_leaves': 57}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  75%|#######5  | 15/20 [04:39<01:19, 15.90s/it]

Early stopping, best iteration is:
[43]	valid_0's multi_error: 0.6352
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.64035
Early stopping, best iteration is:
[37]	valid_0's multi_error: 0.63665


num_leaves, val_score: 0.633975:  80%|########  | 16/20 [04:58<01:06, 16.73s/it][32m[I 2021-06-30 00:17:29,278][0m Trial 22 finished with value: 0.63665 and parameters: {'num_leaves': 101}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  80%|########  | 16/20 [04:58<01:06, 16.73s/it]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6362
[200]	valid_0's multi_error: 0.63575
[300]	valid_0's multi_error: 0.635725


num_leaves, val_score: 0.633975:  85%|########5 | 17/20 [05:16<00:51, 17.10s/it][32m[I 2021-06-30 00:17:47,243][0m Trial 23 finished with value: 0.634875 and parameters: {'num_leaves': 3}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  85%|########5 | 17/20 [05:16<00:51, 17.10s/it]

Early stopping, best iteration is:
[266]	valid_0's multi_error: 0.634875
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.637175


num_leaves, val_score: 0.633975:  90%|######### | 18/20 [05:30<00:32, 16.15s/it][32m[I 2021-06-30 00:18:01,186][0m Trial 24 finished with value: 0.63555 and parameters: {'num_leaves': 44}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  90%|######### | 18/20 [05:30<00:32, 16.15s/it]

Early stopping, best iteration is:
[31]	valid_0's multi_error: 0.63555
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.644975
Early stopping, best iteration is:
[37]	valid_0's multi_error: 0.638525


num_leaves, val_score: 0.633975:  95%|#########5| 19/20 [05:51<00:17, 17.64s/it][32m[I 2021-06-30 00:18:22,301][0m Trial 25 finished with value: 0.638525 and parameters: {'num_leaves': 149}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975:  95%|#########5| 19/20 [05:51<00:17, 17.64s/it]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635875
[200]	valid_0's multi_error: 0.6347


num_leaves, val_score: 0.633975: 100%|##########| 20/20 [06:02<00:00, 15.58s/it][32m[I 2021-06-30 00:18:33,069][0m Trial 26 finished with value: 0.634175 and parameters: {'num_leaves': 2}. Best is trial 12 with value: 0.633975.[0m
num_leaves, val_score: 0.633975: 100%|##########| 20/20 [06:02<00:00, 18.12s/it]
bagging, val_score: 0.633975:   0%|          | 0/10 [00:00<?, ?it/s]

Early stopping, best iteration is:
[155]	valid_0's multi_error: 0.634175
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636725


bagging, val_score: 0.633975:  10%|#         | 1/10 [00:15<02:16, 15.12s/it][32m[I 2021-06-30 00:18:48,205][0m Trial 27 finished with value: 0.635975 and parameters: {'bagging_fraction': 0.9699812750727377, 'bagging_freq': 7}. Best is trial 27 with value: 0.635975.[0m
bagging, val_score: 0.633975:  10%|#         | 1/10 [00:15<02:16, 15.12s/it]

Early stopping, best iteration is:
[50]	valid_0's multi_error: 0.635975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636475


bagging, val_score: 0.633975:  20%|##        | 2/10 [00:29<01:59, 14.95s/it][32m[I 2021-06-30 00:19:02,760][0m Trial 28 finished with value: 0.63585 and parameters: {'bagging_fraction': 0.7286334134319907, 'bagging_freq': 1}. Best is trial 28 with value: 0.63585.[0m
bagging, val_score: 0.633975:  20%|##        | 2/10 [00:29<01:59, 14.95s/it]

Early stopping, best iteration is:
[97]	valid_0's multi_error: 0.63585
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6381


bagging, val_score: 0.633975:  30%|###       | 3/10 [00:42<01:39, 14.19s/it][32m[I 2021-06-30 00:19:15,167][0m Trial 29 finished with value: 0.6367 and parameters: {'bagging_fraction': 0.5452216407481592, 'bagging_freq': 3}. Best is trial 28 with value: 0.63585.[0m
bagging, val_score: 0.633975:  30%|###       | 3/10 [00:42<01:39, 14.19s/it]

Early stopping, best iteration is:
[35]	valid_0's multi_error: 0.6367
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.637075


bagging, val_score: 0.633975:  40%|####      | 4/10 [00:55<01:24, 14.03s/it][32m[I 2021-06-30 00:19:28,815][0m Trial 30 finished with value: 0.636175 and parameters: {'bagging_fraction': 0.6449310260934901, 'bagging_freq': 4}. Best is trial 28 with value: 0.63585.[0m
bagging, val_score: 0.633975:  40%|####      | 4/10 [00:55<01:24, 14.03s/it]

Early stopping, best iteration is:
[49]	valid_0's multi_error: 0.636175
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63665
[200]	valid_0's multi_error: 0.639175
Early stopping, best iteration is:
[102]	valid_0's mult

bagging, val_score: 0.633975:  50%|#####     | 5/10 [01:13<01:15, 15.12s/it][32m[I 2021-06-30 00:19:46,474][0m Trial 31 finished with value: 0.636425 and parameters: {'bagging_fraction': 0.7396272996014521, 'bagging_freq': 7}. Best is trial 28 with value: 0.63585.[0m
bagging, val_score: 0.633975:  50%|#####     | 5/10 [01:13<01:15, 15.12s/it]

You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6395


bagging, val_score: 0.633975:  60%|######    | 6/10 [01:28<01:00, 15.06s/it][32m[I 2021-06-30 00:20:01,388][0m Trial 32 finished with value: 0.637775 and parameters: {'bagging_fraction': 0.40529948306809854, 'bagging_freq': 1}. Best is trial 28 with value: 0.63585.[0m
bagging, val_score: 0.633975:  60%|######    | 6/10 [01:28<01:00, 15.06s/it]

Early stopping, best iteration is:
[35]	valid_0's multi_error: 0.637775
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636025


bagging, val_score: 0.633975:  70%|#######   | 7/10 [01:45<00:47, 15.73s/it][32m[I 2021-06-30 00:20:18,706][0m Trial 33 finished with value: 0.634725 and parameters: {'bagging_fraction': 0.8941409087474881, 'bagging_freq': 7}. Best is trial 33 with value: 0.634725.[0m
bagging, val_score: 0.633975:  70%|#######   | 7/10 [01:45<00:47, 15.73s/it]

Early stopping, best iteration is:
[74]	valid_0's multi_error: 0.634725
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636575


bagging, val_score: 0.633975:  80%|########  | 8/10 [02:02<00:32, 16.20s/it][32m[I 2021-06-30 00:20:35,990][0m Trial 34 finished with value: 0.6349 and parameters: {'bagging_fraction': 0.9230948881476997, 'bagging_freq': 3}. Best is trial 33 with value: 0.634725.[0m
bagging, val_score: 0.633975:  80%|########  | 8/10 [02:02<00:32, 16.20s/it]

Early stopping, best iteration is:
[56]	valid_0's multi_error: 0.6349
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.638225


bagging, val_score: 0.633975:  90%|######### | 9/10 [02:18<00:15, 15.98s/it][32m[I 2021-06-30 00:20:51,458][0m Trial 35 finished with value: 0.63605 and parameters: {'bagging_fraction': 0.6978055019986031, 'bagging_freq': 6}. Best is trial 33 with value: 0.634725.[0m
bagging, val_score: 0.633975:  90%|######### | 9/10 [02:18<00:15, 15.98s/it]

Early stopping, best iteration is:
[55]	valid_0's multi_error: 0.63605
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.639725


bagging, val_score: 0.633975: 100%|##########| 10/10 [02:31<00:00, 15.04s/it][32m[I 2021-06-30 00:21:04,319][0m Trial 36 finished with value: 0.6377 and parameters: {'bagging_fraction': 0.45439132886394173, 'bagging_freq': 7}. Best is trial 33 with value: 0.634725.[0m
bagging, val_score: 0.633975: 100%|##########| 10/10 [02:31<00:00, 15.12s/it]
feature_fraction_stage2, val_score: 0.633975:   0%|          | 0/6 [00:00<?, ?it/s]

Early stopping, best iteration is:
[28]	valid_0's multi_error: 0.6377
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63675


feature_fraction_stage2, val_score: 0.633975:  17%|#6        | 1/6 [00:16<01:22, 16.55s/it][32m[I 2021-06-30 00:21:20,889][0m Trial 37 finished with value: 0.63615 and parameters: {'feature_fraction': 0.748}. Best is trial 37 with value: 0.63615.[0m
feature_fraction_stage2, val_score: 0.633975:  17%|#6        | 1/6 [00:16<01:22, 16.55s/it]

Early stopping, best iteration is:
[85]	valid_0's multi_error: 0.63615
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63645


feature_fraction_stage2, val_score: 0.633975:  33%|###3      | 2/6 [00:32<01:04, 16.25s/it][32m[I 2021-06-30 00:21:36,443][0m Trial 38 finished with value: 0.635875 and parameters: {'feature_fraction': 0.652}. Best is trial 38 with value: 0.635875.[0m
feature_fraction_stage2, val_score: 0.633975:  33%|###3      | 2/6 [00:32<01:04, 16.25s/it]

Early stopping, best iteration is:
[80]	valid_0's multi_error: 0.635875
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63525


feature_fraction_stage2, val_score: 0.633975:  50%|#####     | 3/6 [00:50<00:51, 17.02s/it][32m[I 2021-06-30 00:21:55,273][0m Trial 39 finished with value: 0.634525 and parameters: {'feature_fraction': 0.62}. Best is trial 39 with value: 0.634525.[0m
feature_fraction_stage2, val_score: 0.633975:  50%|#####     | 3/6 [00:50<00:51, 17.02s/it]

Early stopping, best iteration is:
[69]	valid_0's multi_error: 0.634525
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635875
[200]	valid_0's multi_error: 0.63745


feature_fraction_stage2, val_score: 0.633975:  67%|######6   | 4/6 [01:04<00:32, 16.06s/it][32m[I 2021-06-30 00:22:09,073][0m Trial 40 finished with value: 0.6352 and parameters: {'feature_fraction': 0.6839999999999999}. Best is trial 39 with value: 0.634525.[0m
feature_fraction_stage2, val_score: 0.633975:  67%|######6   | 4/6 [01:04<00:32, 16.06s/it]

Early stopping, best iteration is:
[105]	valid_0's multi_error: 0.6352
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.634925


feature_fraction_stage2, val_score: 0.633975:  83%|########3 | 5/6 [01:17<00:14, 14.99s/it][32m[I 2021-06-30 00:22:21,572][0m Trial 41 finished with value: 0.63415 and parameters: {'feature_fraction': 0.7799999999999999}. Best is trial 41 with value: 0.63415.[0m
feature_fraction_stage2, val_score: 0.633975:  83%|########3 | 5/6 [01:17<00:14, 14.99s/it]

Early stopping, best iteration is:
[81]	valid_0's multi_error: 0.63415
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63555


feature_fraction_stage2, val_score: 0.633975: 100%|##########| 6/6 [01:31<00:00, 14.81s/it][32m[I 2021-06-30 00:22:35,961][0m Trial 42 finished with value: 0.6346 and parameters: {'feature_fraction': 0.716}. Best is trial 41 with value: 0.63415.[0m
feature_fraction_stage2, val_score: 0.633975: 100%|##########| 6/6 [01:31<00:00, 15.27s/it]
regularization_factors, val_score: 0.633975:   0%|          | 0/20 [00:00<?, ?it/s]

Early stopping, best iteration is:
[59]	valid_0's multi_error: 0.6346
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635525


regularization_factors, val_score: 0.633975:   5%|5         | 1/20 [00:16<05:07, 16.19s/it][32m[I 2021-06-30 00:22:52,163][0m Trial 43 finished with value: 0.635475 and parameters: {'lambda_l1': 2.200727780899263e-05, 'lambda_l2': 0.5194656353014179}. Best is trial 43 with value: 0.635475.[0m
regularization_factors, val_score: 0.633975:   5%|5         | 1/20 [00:16<05:07, 16.19s/it]

Early stopping, best iteration is:
[99]	valid_0's multi_error: 0.635475
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  10%|#         | 2/20 [00:29<04:38, 15.46s/it][32m[I 2021-06-30 00:23:05,923][0m Trial 44 finished with value: 0.633975 and parameters: {'lambda_l1': 1.4777805050741642e-07, 'lambda_l2': 1.069139832806073e-08}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  10%|#         | 2/20 [00:29<04:38, 15.46s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6353


regularization_factors, val_score: 0.633975:  15%|#5        | 3/20 [00:46<04:28, 15.80s/it][32m[I 2021-06-30 00:23:22,527][0m Trial 45 finished with value: 0.63495 and parameters: {'lambda_l1': 1.5159989752582712, 'lambda_l2': 0.00042375529460374813}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  15%|#5        | 3/20 [00:46<04:28, 15.80s/it]

Early stopping, best iteration is:
[85]	valid_0's multi_error: 0.63495
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63595
[200]	valid_0's multi_error: 0.638125


regularization_factors, val_score: 0.633975:  20%|##        | 4/20 [01:04<04:23, 16.50s/it][32m[I 2021-06-30 00:23:40,647][0m Trial 46 finished with value: 0.635875 and parameters: {'lambda_l1': 0.11513264675707735, 'lambda_l2': 0.0023517787625033024}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  20%|##        | 4/20 [01:04<04:23, 16.50s/it]

Early stopping, best iteration is:
[133]	valid_0's multi_error: 0.635875
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63585


regularization_factors, val_score: 0.633975:  25%|##5       | 5/20 [01:21<04:08, 16.57s/it][32m[I 2021-06-30 00:23:57,376][0m Trial 47 finished with value: 0.634925 and parameters: {'lambda_l1': 0.5659829571600496, 'lambda_l2': 7.933585999145839}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  25%|##5       | 5/20 [01:21<04:08, 16.57s/it]

Early stopping, best iteration is:
[65]	valid_0's multi_error: 0.634925
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  30%|###       | 6/20 [01:47<04:31, 19.39s/it][32m[I 2021-06-30 00:24:23,341][0m Trial 48 finished with value: 0.633975 and parameters: {'lambda_l1': 1.3479676497356033e-06, 'lambda_l2': 4.933195728557726e-07}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  30%|###       | 6/20 [01:47<04:31, 19.39s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635275


regularization_factors, val_score: 0.633975:  35%|###5      | 7/20 [02:00<03:49, 17.62s/it][32m[I 2021-06-30 00:24:36,835][0m Trial 49 finished with value: 0.633975 and parameters: {'lambda_l1': 9.627187674023124e-05, 'lambda_l2': 0.4723108185862983}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  35%|###5      | 7/20 [02:00<03:49, 17.62s/it]

Early stopping, best iteration is:
[64]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63525


regularization_factors, val_score: 0.633975:  40%|####      | 8/20 [02:14<03:18, 16.53s/it][32m[I 2021-06-30 00:24:50,835][0m Trial 50 finished with value: 0.634575 and parameters: {'lambda_l1': 0.005769878132021392, 'lambda_l2': 1.7230064744112648e-06}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  40%|####      | 8/20 [02:14<03:18, 16.53s/it]

Early stopping, best iteration is:
[77]	valid_0's multi_error: 0.634575
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.636775


regularization_factors, val_score: 0.633975:  45%|####5     | 9/20 [02:29<02:54, 15.85s/it][32m[I 2021-06-30 00:25:05,086][0m Trial 51 finished with value: 0.6353 and parameters: {'lambda_l1': 0.0028491274516079627, 'lambda_l2': 3.1101941092978434e-05}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  45%|####5     | 9/20 [02:29<02:54, 15.85s/it]

Early stopping, best iteration is:
[50]	valid_0's multi_error: 0.6353
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63585


regularization_factors, val_score: 0.633975:  50%|#####     | 10/20 [02:41<02:29, 14.93s/it][32m[I 2021-06-30 00:25:17,857][0m Trial 52 finished with value: 0.6346 and parameters: {'lambda_l1': 0.483834261251929, 'lambda_l2': 2.0927330805963532e-05}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  50%|#####     | 10/20 [02:41<02:29, 14.93s/it]

Early stopping, best iteration is:
[62]	valid_0's multi_error: 0.6346
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  55%|#####5    | 11/20 [02:56<02:13, 14.82s/it][32m[I 2021-06-30 00:25:32,420][0m Trial 53 finished with value: 0.633975 and parameters: {'lambda_l1': 1.9556775606108463e-08, 'lambda_l2': 2.2059792236696343e-08}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  55%|#####5    | 11/20 [02:56<02:13, 14.82s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  60%|######    | 12/20 [03:14<02:07, 15.88s/it][32m[I 2021-06-30 00:25:50,796][0m Trial 54 finished with value: 0.633975 and parameters: {'lambda_l1': 1.638475036907605e-07, 'lambda_l2': 2.597584345894281e-08}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  60%|######    | 12/20 [03:14<02:07, 15.88s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  65%|######5   | 13/20 [03:28<01:47, 15.32s/it][32m[I 2021-06-30 00:26:04,812][0m Trial 55 finished with value: 0.633975 and parameters: {'lambda_l1': 8.954776480946923e-07, 'lambda_l2': 3.7215077493264554e-07}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  65%|######5   | 13/20 [03:28<01:47, 15.32s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  70%|#######   | 14/20 [03:42<01:29, 14.85s/it][32m[I 2021-06-30 00:26:18,552][0m Trial 56 finished with value: 0.633975 and parameters: {'lambda_l1': 2.6675692360367713e-06, 'lambda_l2': 2.3308411220255027e-08}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  70%|#######   | 14/20 [03:42<01:29, 14.85s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  75%|#######5  | 15/20 [03:56<01:13, 14.65s/it][32m[I 2021-06-30 00:26:32,733][0m Trial 57 finished with value: 0.633975 and parameters: {'lambda_l1': 2.1084320888817302e-08, 'lambda_l2': 5.984799941673662e-07}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  75%|#######5  | 15/20 [03:56<01:13, 14.65s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  80%|########  | 16/20 [04:10<00:56, 14.24s/it][32m[I 2021-06-30 00:26:46,030][0m Trial 58 finished with value: 0.633975 and parameters: {'lambda_l1': 5.544030580540719e-06, 'lambda_l2': 1.2941175435709873e-08}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  80%|########  | 16/20 [04:10<00:56, 14.24s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  85%|########5 | 17/20 [04:23<00:41, 13.95s/it][32m[I 2021-06-30 00:26:59,306][0m Trial 59 finished with value: 0.633975 and parameters: {'lambda_l1': 1.379807701084494e-07, 'lambda_l2': 2.2643380278631868e-07}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  85%|########5 | 17/20 [04:23<00:41, 13.95s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975:  90%|######### | 18/20 [04:36<00:27, 13.82s/it][32m[I 2021-06-30 00:27:12,811][0m Trial 60 finished with value: 0.633975 and parameters: {'lambda_l1': 1.1567211678647001e-07, 'lambda_l2': 9.225840637944367e-06}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  90%|######### | 18/20 [04:36<00:27, 13.82s/it]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635875


regularization_factors, val_score: 0.633975:  95%|#########5| 19/20 [04:49<00:13, 13.33s/it][32m[I 2021-06-30 00:27:25,010][0m Trial 61 finished with value: 0.635075 and parameters: {'lambda_l1': 1.5293425980076164e-08, 'lambda_l2': 0.002500883332790761}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975:  95%|#########5| 19/20 [04:49<00:13, 13.33s/it]

Early stopping, best iteration is:
[76]	valid_0's multi_error: 0.635075
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6348


regularization_factors, val_score: 0.633975: 100%|##########| 20/20 [05:02<00:00, 13.31s/it][32m[I 2021-06-30 00:27:38,283][0m Trial 62 finished with value: 0.633975 and parameters: {'lambda_l1': 1.840280065821245e-07, 'lambda_l2': 1.4556512924300431e-07}. Best is trial 44 with value: 0.633975.[0m
regularization_factors, val_score: 0.633975: 100%|##########| 20/20 [05:02<00:00, 15.12s/it]
min_data_in_leaf, val_score: 0.633975:   0%|          | 0/5 [00:00<?, ?it/s]

Early stopping, best iteration is:
[93]	valid_0's multi_error: 0.633975
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.63605
[200]	valid_0's multi_error: 0.636175
Early stopping, best iteration is:
[103]	valid_0's mult

min_data_in_leaf, val_score: 0.633975:  20%|##        | 1/5 [00:14<00:57, 14.30s/it][32m[I 2021-06-30 00:27:52,591][0m Trial 63 finished with value: 0.6355 and parameters: {'min_child_samples': 50}. Best is trial 63 with value: 0.6355.[0m
min_data_in_leaf, val_score: 0.633975:  20%|##        | 1/5 [00:14<00:57, 14.30s/it]

You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635625


min_data_in_leaf, val_score: 0.633975:  40%|####      | 2/5 [00:26<00:40, 13.57s/it][32m[I 2021-06-30 00:28:04,469][0m Trial 64 finished with value: 0.634925 and parameters: {'min_child_samples': 100}. Best is trial 64 with value: 0.634925.[0m
min_data_in_leaf, val_score: 0.633975:  40%|####      | 2/5 [00:26<00:40, 13.57s/it]

Early stopping, best iteration is:
[62]	valid_0's multi_error: 0.634925
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635725
[200]	valid_0's multi_error: 0.638275


min_data_in_leaf, val_score: 0.633975:  60%|######    | 3/5 [00:40<00:27, 13.69s/it][32m[I 2021-06-30 00:28:18,427][0m Trial 65 finished with value: 0.6356 and parameters: {'min_child_samples': 5}. Best is trial 64 with value: 0.634925.[0m
min_data_in_leaf, val_score: 0.633975:  60%|######    | 3/5 [00:40<00:27, 13.69s/it]

Early stopping, best iteration is:
[109]	valid_0's multi_error: 0.6356
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.635625


min_data_in_leaf, val_score: 0.633975:  80%|########  | 4/5 [00:51<00:13, 13.03s/it][32m[I 2021-06-30 00:28:29,932][0m Trial 66 finished with value: 0.634675 and parameters: {'min_child_samples': 25}. Best is trial 66 with value: 0.634675.[0m
min_data_in_leaf, val_score: 0.633975:  80%|########  | 4/5 [00:51<00:13, 13.03s/it]

Early stopping, best iteration is:
[62]	valid_0's multi_error: 0.634675
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3288
[LightGBM] [Info] Number of data points in the train set: 160000, number of used features: 75
[LightGBM] [Info] Start training from score -3.086615
[LightGBM] [Info] Start training from score -2.096791
[LightGBM] [Info] Start training from score -2.601750
[LightGBM] [Info] Start training from score -3.752885
[LightGBM] [Info] Start training from score -4.183176
[LightGBM] [Info] Start training from score -1.351507
[LightGBM] [Info] Start training from score -2.606566
[LightGBM] [Info] Start training from score -1.353174
[LightGBM] [Info] Start training from score -2.058904
Training until validation scores don't improve for 100 rounds
[100]	valid_0's multi_error: 0.6359


min_data_in_leaf, val_score: 0.633975: 100%|##########| 5/5 [01:03<00:00, 12.53s/it][32m[I 2021-06-30 00:28:41,307][0m Trial 67 finished with value: 0.6352 and parameters: {'min_child_samples': 10}. Best is trial 66 with value: 0.634675.[0m
min_data_in_leaf, val_score: 0.633975: 100%|##########| 5/5 [01:03<00:00, 12.60s/it]

Early stopping, best iteration is:
[63]	valid_0's multi_error: 0.6352





In [9]:
# ベストパラメータの取得
best_params = gbm_o.params
print("  Params: ")
for key, value in best_params.items():
    print("    {}: {}".format(key, value))

  Params: 
    objective: multiclass
    num_class: 9
    metric: multi_error
    random_seed: 0
    feature_pre_filter: False
    lambda_l1: 0.0
    lambda_l2: 0.0
    num_leaves: 19
    feature_fraction: 0.7
    bagging_fraction: 1.0
    bagging_freq: 0
    min_child_samples: 20
    num_iterations: 1000
    early_stopping_round: 100


In [10]:
# 調整後モデルで予測の実行
Y_pred = gbm_o.predict(X_test, num_iteration = gbm_o.best_iteration)

# 予測確率を整数へ
y_pred = np.argmax(Y_pred, axis=1)

# 識別率を求める
score = accuracy_score(y_test, y_pred)
print(f'score: {score}')

score: 0.366025


In [11]:
from sklearn.metrics import confusion_matrix
# 混同行列を表示
cmx = confusion_matrix(y_test, y_pred)
cmx

array([[   0,  436,    1,    1,    0,  457,    0,  909,    9],
       [   0, 2376,    6,    0,    1,  992,    2, 1368,   30],
       [   0, 1127,    3,    1,    2,  698,    0, 1084,   20],
       [   0,  226,    2,    0,    0,  257,    0,  459,    8],
       [   0,  129,    0,    1,    0,  156,    0,  330,    8],
       [   1,  857,    3,    0,    0, 5408,    0, 4105,   21],
       [   1,  317,    1,    1,    0,  789,    0, 1842,   12],
       [   1,  781,    8,    1,    0, 2750,    2, 6830,   43],
       [   0, 1177,    6,    1,    1, 1384,    2, 2532,   24]])

In [12]:
# csvファイルからPandas DataFrameへ読み込み
submit_data = pd.read_csv('test.csv', delimiter=',', low_memory=False)

# 冒頭を表示して確認
submit_data.head()

Unnamed: 0,id,feature_0,feature_1,feature_2,feature_3,feature_4,feature_5,feature_6,feature_7,feature_8,...,feature_65,feature_66,feature_67,feature_68,feature_69,feature_70,feature_71,feature_72,feature_73,feature_74
0,200000,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
1,200001,1,2,0,0,0,0,0,0,0,...,3,1,3,0,0,0,0,3,0,0
2,200002,0,1,7,1,0,0,0,0,6,...,3,0,0,0,0,3,0,2,0,0
3,200003,0,0,0,4,3,1,0,0,0,...,0,0,0,1,0,0,0,4,0,0
4,200004,0,0,5,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,1,0


In [13]:
# 提出データを適用できる形にする
x_submit = submit_data.drop(['id'], axis=1)

# 冒頭を表示して確認
x_submit.head()

Unnamed: 0,feature_0,feature_1,feature_2,feature_3,feature_4,feature_5,feature_6,feature_7,feature_8,feature_9,...,feature_65,feature_66,feature_67,feature_68,feature_69,feature_70,feature_71,feature_72,feature_73,feature_74
0,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
1,1,2,0,0,0,0,0,0,0,0,...,3,1,3,0,0,0,0,3,0,0
2,0,1,7,1,0,0,0,0,6,0,...,3,0,0,0,0,3,0,2,0,0
3,0,0,0,4,3,1,0,0,0,0,...,0,0,0,1,0,0,0,4,0,0
4,0,0,5,0,0,0,0,0,0,8,...,0,0,0,0,0,0,0,0,1,0


In [14]:
# 提出データを予測する
predictions = gbm_o.predict(x_submit, num_iteration = gbm_o.best_iteration)

# データの形を確認
predictions.shape

(100000, 9)

In [15]:
# 結果を提出形式に変形
df_predictions = pd.DataFrame(predictions)
df_predictions.columns = ['Class_1', 'Class_2', 'Class_3', 'Class_4', 'Class_5', 'Class_6', 'Class_7', 'Class_8', 'Class_9']
submit_data = pd.concat([submit_data.id,df_predictions],axis=1)
submit_data = submit_data.set_index('id')
submit_data.head()

Unnamed: 0_level_0,Class_1,Class_2,Class_3,Class_4,Class_5,Class_6,Class_7,Class_8,Class_9
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
200000,0.047166,0.386004,0.16352,0.025399,0.013095,0.173671,0.025002,0.053809,0.112334
200001,0.044906,0.084482,0.087967,0.020954,0.011719,0.221131,0.080786,0.322586,0.12547
200002,0.028194,0.033264,0.024879,0.013417,0.008328,0.672826,0.034104,0.12819,0.056798
200003,0.057256,0.082436,0.08239,0.048024,0.015027,0.248217,0.062445,0.241977,0.162228
200004,0.037939,0.116377,0.082335,0.028219,0.014011,0.285166,0.054686,0.235892,0.145374


In [16]:
# CSVファイルとして出力
submit_data.to_csv("submission_LGBM_optuna.csv")