In [46]:
#ライブラリ
import pandas as pd
import numpy as np
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.impute import SimpleImputer
from sklearn.decomposition import PCA
from sklearn.metrics import log_loss
import optuna
from sklearn.model_selection import KFold
from sklearn.model_selection import StratifiedKFold

#検証方法：クロスバリデーション
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import GridSearchCV

#モデル
import lightgbm as lgb

In [29]:
#データ準備
train =pd.read_table('data/train.tsv', index_col=0)
test = pd.read_table('data/test.tsv',index_col=0)
sample = pd.read_table('data/sample_submit.tsv' , index_col=0, header=None)

In [30]:
train= train.reset_index(drop=True)
train

Unnamed: 0,survived,pclass,sex,age,sibsp,parch,fare,embarked
0,1,1,female,35.0,1,0,53.1000,S
1,0,3,male,35.0,0,0,8.0500,S
2,0,3,male,2.0,3,1,21.0750,S
3,1,2,female,14.0,1,0,30.0708,C
4,1,1,female,58.0,0,0,26.5500,S
...,...,...,...,...,...,...,...,...
440,0,3,male,47.0,0,0,9.0000,S
441,1,2,female,28.0,1,0,24.0000,C
442,1,1,female,56.0,0,1,83.1583,C
443,0,3,male,25.0,0,0,7.0500,S


In [31]:
test = test.reset_index(drop=True)
test

Unnamed: 0,pclass,sex,age,sibsp,parch,fare,embarked
0,3,male,22.0,1,0,7.2500,S
1,1,female,38.0,1,0,71.2833,C
2,3,female,26.0,0,0,7.9250,S
3,3,male,,0,0,8.4583,Q
4,1,male,54.0,0,0,51.8625,S
...,...,...,...,...,...,...,...
441,3,female,39.0,0,5,29.1250,Q
442,2,male,27.0,0,0,13.0000,S
443,1,female,19.0,0,0,30.0000,S
444,1,male,26.0,0,0,30.0000,C


In [32]:
#データの確認と前処理　テストデータ
print(train.shape)
train.head()

(445, 8)


Unnamed: 0,survived,pclass,sex,age,sibsp,parch,fare,embarked
0,1,1,female,35.0,1,0,53.1,S
1,0,3,male,35.0,0,0,8.05,S
2,0,3,male,2.0,3,1,21.075,S
3,1,2,female,14.0,1,0,30.0708,C
4,1,1,female,58.0,0,0,26.55,S


In [33]:
#説明変数と目的変数に分ける
train_x = train.drop('survived',axis = 1)
train_y = train.iloc[:,0]
print(train_x.shape)
print(train_y.shape)

(445, 7)
(445,)


In [34]:
#trainデータ：one-hot-encoding
train_ohe = pd.get_dummies(train_x,dummy_na=True)
train_ohe.head()

Unnamed: 0,pclass,age,sibsp,parch,fare,sex_female,sex_male,sex_nan,embarked_C,embarked_Q,embarked_S,embarked_nan
0,1,35.0,1,0,53.1,1,0,0,0,0,1,0
1,3,35.0,0,0,8.05,0,1,0,0,0,1,0
2,3,2.0,3,1,21.075,0,1,0,0,0,1,0
3,2,14.0,1,0,30.0708,1,0,0,1,0,0,0
4,1,58.0,0,0,26.55,1,0,0,0,0,1,0


In [35]:
#trainデータ：欠損値の補完
#インピュータークラスのインスタンス化と（列平均）の学習
imp = SimpleImputer()
imp.fit(train_ohe)

#学習済みimputerの適用：各列欠損値の置換
train_fin = pd.DataFrame(imp.transform(train_ohe) , columns = train_ohe.columns.values)

#結果表示
display(train_fin.iloc[10:20,1])

10    38.000000
11    29.211583
12    29.211583
13    29.211583
14    29.211583
15    66.000000
16    29.211583
17    27.000000
18    29.211583
19     3.000000
Name: age, dtype: float64

In [36]:
#family sizeのみ追加
train_fin['FamilySize'] = train_fin['sibsp'] + train_fin['parch'] + 1
train_fin['IsAlone'] = 0
train_fin.loc[train_fin['FamilySize'] == 1 , 'IsAlone']  = 1
train_fin.iloc[30:40,-1]

30    0
31    1
32    1
33    0
34    1
35    1
36    1
37    1
38    0
39    1
Name: IsAlone, dtype: int64

In [37]:
#testデータ：one_hot_encoding
test_ohe = pd.get_dummies(test,dummy_na=True)
test_ohe.head()

Unnamed: 0,pclass,age,sibsp,parch,fare,sex_female,sex_male,sex_nan,embarked_C,embarked_Q,embarked_S,embarked_nan
0,3,22.0,1,0,7.25,0,1,0,0,0,1,0
1,1,38.0,1,0,71.2833,1,0,0,1,0,0,0
2,3,26.0,0,0,7.925,1,0,0,0,0,1,0
3,3,,0,0,8.4583,0,1,0,0,1,0,0
4,1,54.0,0,0,51.8625,0,1,0,0,0,1,0


In [38]:
#testデータ：欠損値の補完
#インピュータークラスのインスタンス化と（列平均）の学習
imp = SimpleImputer()
imp.fit(test_ohe)

#学習済みimputerの適用：各列欠損値の置換
test_fin = pd.DataFrame(imp.transform(test_ohe) , columns = test_ohe.columns.values)

#結果表示
display(test_fin.iloc[10:20,1])

10    30.194915
11    31.000000
12    35.000000
13    34.000000
14    15.000000
15    19.000000
16    40.000000
17    30.194915
18    28.000000
19    42.000000
Name: age, dtype: float64

In [39]:
#特徴量追加
test_fin['FamilySize'] = test_fin['sibsp'] + test_fin['parch'] + 1
test_fin['IsAlone'] = 0
test_fin.loc[test_fin['FamilySize'] == 1 , 'IsAlone']  = 1
test_fin.iloc[30:40,-1]

30    0
31    0
32    1
33    1
34    0
35    1
36    0
37    1
38    0
39    0
Name: IsAlone, dtype: int64

In [40]:
#columnsのデータ項目を確認
cols_train = set(train_fin.columns.values)
cols_test = set(test_fin.columns.values)

#trainにあってtestにないデータ項目
diff1 = cols_train -cols_test
print('trainのみ：%s' % diff1)

#testにあってtrainにないデータ項目
diff2 = cols_test - cols_train
print('testのみ：%s' % diff2)

trainのみ：set()
testのみ：set()


#パラメータ探索
def objective(trial):
    param = {
    'objective':'binary',
    'max_bin': trial.suggest_int('max_bin',255,500) ,
    'learning_rate': 0.001,
    'num_leaves': trial.suggest_int('num_leaves',32,128)}
    
    #XGBoostClassifierのインスタンス作成
    lgb_train = lgb.Dataset(x_train,y_train)
    lgb_eval = lgb.Dataset(x_valid,y_valid, reference=lgb_train)

    #モデルフィッティング
    model = lgb.train(param,
                      lgb_train,
                      valid_sets=[lgb_train,lgb_eval],
                      verbose_eval=10,
                      num_boost_round=1000,
                      early_stopping_rounds=10
                     )

    y_pred_valid = model.predict(x_valid,num_iteration=model.best_iteration)
    score = log_loss(y_valid , y_pred_valid)
    return score


study = optuna.create_study(sampler=optuna.samplers.RandomSampler(seed=1))
study.optimize(objective,n_trials=40)
study.best_params

In [41]:
print(train_fin.shape)
print(train_y.shape)

(445, 14)
(445,)


In [42]:
train_y[3]

1

In [47]:
#交差検証法の実装
y_preds = []
models = []
oof_train = np.zeros((len(train_fin),))
cv = StratifiedKFold(n_splits=5,shuffle=True,random_state=1)

params = {
    'objective':'binary',
    'max_bin': 357 ,
    'learning_rate': 0.001,
    'num_leaves': 101
}

#StratifiedKFldを利用する事で正例と負例の割合を均一に保つ
for fold_id , (train_index ,valid_index) in enumerate(cv.split(train_fin,train_y)):
    x_tr = train_fin.loc[train_index, :]
    x_val = train_fin.loc[valid_index, :]
    y_tr = train_y[train_index]
    y_val = train_y[valid_index]
    
    lgb_train = lgb.Dataset(x_tr,y_tr)
    lgb_eval = lgb.Dataset(x_val,y_val,
                          reference=lgb_train)
    
    model = lgb.train(params,lgb_train,
                     valid_sets=[lgb_train,lgb_eval],
                     verbose_eval=10,
                      num_boost_round=1000,
                     early_stopping_rounds=10)
    
    oof_train[valid_index] = model.predict(x_val,num_iteration=model.best_iteration)
    y_pred = model.predict(test_fin,num_iteration=model.best_iteration)
    
    y_preds.append(y_pred)
    models.append(model)



[LightGBM] [Info] Number of positive: 143, number of negative: 213
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 164
[LightGBM] [Info] Number of data points in the train set: 356, number of used features: 12
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.401685 -> initscore=-0.398448
[LightGBM] [Info] Start training from score -0.398448
Training until validation scores don't improve for 10 rounds
[10]	training's binary_logloss: 0.66955	valid_1's binary_logloss: 0.670771
[20]	training's binary_logloss: 0.665498	valid_1's binary_logloss: 0.666817
[30]	training's binary_logloss: 0.661531	valid_1's binary_logloss: 0.662944
[40]	training's binary_logloss: 0.657645	valid_1's binary_logloss: 0.65915
[50]	training's binary_logloss: 0.653838	valid_1's binary_logloss: 0.655321
[60]	training's binary_logloss: 0.650107	valid_1's binary_logloss: 0.65154
[70]	training's binary_logloss: 0.64645

[100]	training's binary_logloss: 0.635902	valid_1's binary_logloss: 0.637131
[110]	training's binary_logloss: 0.632521	valid_1's binary_logloss: 0.633698
[120]	training's binary_logloss: 0.629204	valid_1's binary_logloss: 0.630329
[130]	training's binary_logloss: 0.62595	valid_1's binary_logloss: 0.627022
[140]	training's binary_logloss: 0.622757	valid_1's binary_logloss: 0.623776
[150]	training's binary_logloss: 0.619623	valid_1's binary_logloss: 0.62059
[160]	training's binary_logloss: 0.616548	valid_1's binary_logloss: 0.617462
[170]	training's binary_logloss: 0.61353	valid_1's binary_logloss: 0.61439
[180]	training's binary_logloss: 0.610566	valid_1's binary_logloss: 0.611373
[190]	training's binary_logloss: 0.607657	valid_1's binary_logloss: 0.60841
[200]	training's binary_logloss: 0.6048	valid_1's binary_logloss: 0.6055
[210]	training's binary_logloss: 0.601995	valid_1's binary_logloss: 0.602641
[220]	training's binary_logloss: 0.59924	valid_1's binary_logloss: 0.599832
[230]	tra

[250]	training's binary_logloss: 0.591264	valid_1's binary_logloss: 0.591719
[260]	training's binary_logloss: 0.588699	valid_1's binary_logloss: 0.589099
[270]	training's binary_logloss: 0.586178	valid_1's binary_logloss: 0.586524
[280]	training's binary_logloss: 0.583702	valid_1's binary_logloss: 0.583993
[290]	training's binary_logloss: 0.581268	valid_1's binary_logloss: 0.581503
[300]	training's binary_logloss: 0.578876	valid_1's binary_logloss: 0.579055
[310]	training's binary_logloss: 0.576524	valid_1's binary_logloss: 0.576657
[320]	training's binary_logloss: 0.574202	valid_1's binary_logloss: 0.574298
[330]	training's binary_logloss: 0.571861	valid_1's binary_logloss: 0.571978
[340]	training's binary_logloss: 0.569558	valid_1's binary_logloss: 0.569696
[350]	training's binary_logloss: 0.567302	valid_1's binary_logloss: 0.567451
[360]	training's binary_logloss: 0.565072	valid_1's binary_logloss: 0.565241


[370]	training's binary_logloss: 0.562878	valid_1's binary_logloss: 0.563068
[380]	training's binary_logloss: 0.560719	valid_1's binary_logloss: 0.560929
[390]	training's binary_logloss: 0.558594	valid_1's binary_logloss: 0.558823
[400]	training's binary_logloss: 0.556511	valid_1's binary_logloss: 0.556751
[410]	training's binary_logloss: 0.554452	valid_1's binary_logloss: 0.554711
[420]	training's binary_logloss: 0.552425	valid_1's binary_logloss: 0.552704
[430]	training's binary_logloss: 0.550429	valid_1's binary_logloss: 0.550728
[440]	training's binary_logloss: 0.548465	valid_1's binary_logloss: 0.548783
[450]	training's binary_logloss: 0.54653	valid_1's binary_logloss: 0.546821
[460]	training's binary_logloss: 0.544625	valid_1's binary_logloss: 0.544878
[470]	training's binary_logloss: 0.542754	valid_1's binary_logloss: 0.542933
[480]	training's binary_logloss: 0.540913	valid_1's binary_logloss: 0.541039
[490]	training's binary_logloss: 0.539101	valid_1's binary_logloss: 0.539164


[500]	training's binary_logloss: 0.537317	valid_1's binary_logloss: 0.537307
[510]	training's binary_logloss: 0.535561	valid_1's binary_logloss: 0.53548
[520]	training's binary_logloss: 0.533833	valid_1's binary_logloss: 0.533692
[530]	training's binary_logloss: 0.532132	valid_1's binary_logloss: 0.531921
[540]	training's binary_logloss: 0.530458	valid_1's binary_logloss: 0.530177
[550]	training's binary_logloss: 0.528809	valid_1's binary_logloss: 0.528471
[560]	training's binary_logloss: 0.527186	valid_1's binary_logloss: 0.52678
[570]	training's binary_logloss: 0.525588	valid_1's binary_logloss: 0.525115
[580]	training's binary_logloss: 0.524009	valid_1's binary_logloss: 0.523475
[590]	training's binary_logloss: 0.522453	valid_1's binary_logloss: 0.521846


[600]	training's binary_logloss: 0.520919	valid_1's binary_logloss: 0.520238
[610]	training's binary_logloss: 0.519409	valid_1's binary_logloss: 0.518663
[620]	training's binary_logloss: 0.517922	valid_1's binary_logloss: 0.517116
[630]	training's binary_logloss: 0.516457	valid_1's binary_logloss: 0.515579
[640]	training's binary_logloss: 0.515013	valid_1's binary_logloss: 0.514064
[650]	training's binary_logloss: 0.513593	valid_1's binary_logloss: 0.512585
[660]	training's binary_logloss: 0.512183	valid_1's binary_logloss: 0.511121
[670]	training's binary_logloss: 0.510765	valid_1's binary_logloss: 0.509669
[680]	training's binary_logloss: 0.509162	valid_1's binary_logloss: 0.508305
[690]	training's binary_logloss: 0.507584	valid_1's binary_logloss: 0.506971
[700]	training's binary_logloss: 0.506001	valid_1's binary_logloss: 0.505689
[710]	training's binary_logloss: 0.50444	valid_1's binary_logloss: 0.504418
[720]	training's binary_logloss: 0.502903	valid_1's binary_logloss: 0.503168


[790]	training's binary_logloss: 0.492753	valid_1's binary_logloss: 0.49502
[800]	training's binary_logloss: 0.491386	valid_1's binary_logloss: 0.493925
[810]	training's binary_logloss: 0.490043	valid_1's binary_logloss: 0.492834
[820]	training's binary_logloss: 0.488713	valid_1's binary_logloss: 0.491731
[830]	training's binary_logloss: 0.487401	valid_1's binary_logloss: 0.490647
[840]	training's binary_logloss: 0.486109	valid_1's binary_logloss: 0.489554
[850]	training's binary_logloss: 0.484834	valid_1's binary_logloss: 0.48847
[860]	training's binary_logloss: 0.483585	valid_1's binary_logloss: 0.487401
[870]	training's binary_logloss: 0.482352	valid_1's binary_logloss: 0.486368
[880]	training's binary_logloss: 0.481139	valid_1's binary_logloss: 0.485392
[890]	training's binary_logloss: 0.479942	valid_1's binary_logloss: 0.484422


[900]	training's binary_logloss: 0.478765	valid_1's binary_logloss: 0.483473
[910]	training's binary_logloss: 0.477601	valid_1's binary_logloss: 0.482535
[920]	training's binary_logloss: 0.476454	valid_1's binary_logloss: 0.481619
[930]	training's binary_logloss: 0.475321	valid_1's binary_logloss: 0.48071
[940]	training's binary_logloss: 0.474205	valid_1's binary_logloss: 0.479805
[950]	training's binary_logloss: 0.473107	valid_1's binary_logloss: 0.478935
[960]	training's binary_logloss: 0.472021	valid_1's binary_logloss: 0.47808
[970]	training's binary_logloss: 0.470949	valid_1's binary_logloss: 0.477219
[980]	training's binary_logloss: 0.469892	valid_1's binary_logloss: 0.476375
[990]	training's binary_logloss: 0.468848	valid_1's binary_logloss: 0.475545
[1000]	training's binary_logloss: 0.467819	valid_1's binary_logloss: 0.474735
Did not meet early stopping. Best iteration is:
[1000]	training's binary_logloss: 0.467819	valid_1's binary_logloss: 0.474735


[LightGBM] [Info] Number of positive: 143, number of negative: 213
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 160
[LightGBM] [Info] Number of data points in the train set: 356, number of used features: 12
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.401685 -> initscore=-0.398448
[LightGBM] [Info] Start training from score -0.398448
Training until validation scores don't improve for 10 rounds
[10]	training's binary_logloss: 0.669306	valid_1's binary_logloss: 0.670785
[20]	training's binary_logloss: 0.665026	valid_1's binary_logloss: 0.666864
[30]	training's binary_logloss: 0.660837	valid_1's binary_logloss: 0.663084
[40]	training's binary_logloss: 0.656734	valid_1's binary_logloss: 0.659374
[50]	training's binary_logloss: 0.652713	valid_1's binary_logloss: 0.655744
[60]	training's binary_logloss: 0.648772	valid_1's binary_logloss: 0.6522
[70]	training's binary_logloss: 0.6449

[110]	training's binary_logloss: 0.630193	valid_1's binary_logloss: 0.635679
[120]	training's binary_logloss: 0.626688	valid_1's binary_logloss: 0.632581
[130]	training's binary_logloss: 0.62325	valid_1's binary_logloss: 0.629517
[140]	training's binary_logloss: 0.619875	valid_1's binary_logloss: 0.626516
[150]	training's binary_logloss: 0.616563	valid_1's binary_logloss: 0.623534
[160]	training's binary_logloss: 0.613312	valid_1's binary_logloss: 0.620609
[170]	training's binary_logloss: 0.610119	valid_1's binary_logloss: 0.617755
[180]	training's binary_logloss: 0.606983	valid_1's binary_logloss: 0.61498
[190]	training's binary_logloss: 0.603904	valid_1's binary_logloss: 0.612237
[200]	training's binary_logloss: 0.60088	valid_1's binary_logloss: 0.609566
[210]	training's binary_logloss: 0.597908	valid_1's binary_logloss: 0.606963
[220]	training's binary_logloss: 0.594989	valid_1's binary_logloss: 0.604382
[230]	training's binary_logloss: 0.592112	valid_1's binary_logloss: 0.601902
[2

[290]	training's binary_logloss: 0.575802	valid_1's binary_logloss: 0.588273
[300]	training's binary_logloss: 0.573243	valid_1's binary_logloss: 0.586159
[310]	training's binary_logloss: 0.570723	valid_1's binary_logloss: 0.584113
[320]	training's binary_logloss: 0.568248	valid_1's binary_logloss: 0.582059
[330]	training's binary_logloss: 0.565811	valid_1's binary_logloss: 0.5801
[340]	training's binary_logloss: 0.563417	valid_1's binary_logloss: 0.578173
[350]	training's binary_logloss: 0.561059	valid_1's binary_logloss: 0.576284
[360]	training's binary_logloss: 0.558742	valid_1's binary_logloss: 0.57441
[370]	training's binary_logloss: 0.55646	valid_1's binary_logloss: 0.572589
[380]	training's binary_logloss: 0.554217	valid_1's binary_logloss: 0.570806


[390]	training's binary_logloss: 0.552008	valid_1's binary_logloss: 0.569075
[400]	training's binary_logloss: 0.549835	valid_1's binary_logloss: 0.567356
[410]	training's binary_logloss: 0.547699	valid_1's binary_logloss: 0.565625
[420]	training's binary_logloss: 0.545599	valid_1's binary_logloss: 0.563892
[430]	training's binary_logloss: 0.543534	valid_1's binary_logloss: 0.562196
[440]	training's binary_logloss: 0.541502	valid_1's binary_logloss: 0.560517
[450]	training's binary_logloss: 0.539501	valid_1's binary_logloss: 0.558843
[460]	training's binary_logloss: 0.537531	valid_1's binary_logloss: 0.557242
[470]	training's binary_logloss: 0.535589	valid_1's binary_logloss: 0.555639
[480]	training's binary_logloss: 0.533679	valid_1's binary_logloss: 0.554075
[490]	training's binary_logloss: 0.531797	valid_1's binary_logloss: 0.552562
[500]	training's binary_logloss: 0.529944	valid_1's binary_logloss: 0.551049
[510]	training's binary_logloss: 0.528119	valid_1's binary_logloss: 0.549572

[600]	training's binary_logloss: 0.512242	valid_1's binary_logloss: 0.538991
[610]	training's binary_logloss: 0.510615	valid_1's binary_logloss: 0.537973
[620]	training's binary_logloss: 0.509013	valid_1's binary_logloss: 0.536987
[630]	training's binary_logloss: 0.507426	valid_1's binary_logloss: 0.535968
[640]	training's binary_logloss: 0.505856	valid_1's binary_logloss: 0.534955
[650]	training's binary_logloss: 0.50431	valid_1's binary_logloss: 0.533955
[660]	training's binary_logloss: 0.502786	valid_1's binary_logloss: 0.532988
[670]	training's binary_logloss: 0.501288	valid_1's binary_logloss: 0.532045
[680]	training's binary_logloss: 0.499808	valid_1's binary_logloss: 0.531112
[690]	training's binary_logloss: 0.498351	valid_1's binary_logloss: 0.530207
[700]	training's binary_logloss: 0.496917	valid_1's binary_logloss: 0.529329
[710]	training's binary_logloss: 0.495504	valid_1's binary_logloss: 0.528478


[720]	training's binary_logloss: 0.494115	valid_1's binary_logloss: 0.527668
[730]	training's binary_logloss: 0.492681	valid_1's binary_logloss: 0.526591
[740]	training's binary_logloss: 0.491174	valid_1's binary_logloss: 0.525135
[750]	training's binary_logloss: 0.489691	valid_1's binary_logloss: 0.523721
[760]	training's binary_logloss: 0.488229	valid_1's binary_logloss: 0.522317
[770]	training's binary_logloss: 0.486791	valid_1's binary_logloss: 0.520946
[780]	training's binary_logloss: 0.485366	valid_1's binary_logloss: 0.519609
[790]	training's binary_logloss: 0.483955	valid_1's binary_logloss: 0.518308
[800]	training's binary_logloss: 0.482565	valid_1's binary_logloss: 0.517013
[810]	training's binary_logloss: 0.481192	valid_1's binary_logloss: 0.515759
[820]	training's binary_logloss: 0.479842	valid_1's binary_logloss: 0.514512


[830]	training's binary_logloss: 0.478508	valid_1's binary_logloss: 0.513283
[840]	training's binary_logloss: 0.477193	valid_1's binary_logloss: 0.512064
[850]	training's binary_logloss: 0.475896	valid_1's binary_logloss: 0.510873
[860]	training's binary_logloss: 0.474618	valid_1's binary_logloss: 0.5097
[870]	training's binary_logloss: 0.473357	valid_1's binary_logloss: 0.508537
[880]	training's binary_logloss: 0.472115	valid_1's binary_logloss: 0.507395
[890]	training's binary_logloss: 0.470886	valid_1's binary_logloss: 0.506414
[900]	training's binary_logloss: 0.469714	valid_1's binary_logloss: 0.505589
[910]	training's binary_logloss: 0.468572	valid_1's binary_logloss: 0.504843
[920]	training's binary_logloss: 0.46743	valid_1's binary_logloss: 0.504064
[930]	training's binary_logloss: 0.4663	valid_1's binary_logloss: 0.503283
[940]	training's binary_logloss: 0.465258	valid_1's binary_logloss: 0.502852
[950]	training's binary_logloss: 0.46423	valid_1's binary_logloss: 0.502429
[960]

[LightGBM] [Info] Number of positive: 143, number of negative: 213
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 165
[LightGBM] [Info] Number of data points in the train set: 356, number of used features: 12
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.401685 -> initscore=-0.398448
[LightGBM] [Info] Start training from score -0.398448
Training until validation scores don't improve for 10 rounds
[10]	training's binary_logloss: 0.66936	valid_1's binary_logloss: 0.670502
[20]	training's binary_logloss: 0.665157	valid_1's binary_logloss: 0.666349
[30]	training's binary_logloss: 0.661042	valid_1's binary_logloss: 0.662286
[40]	training's binary_logloss: 0.657006	valid_1's binary_logloss: 0.658302
[50]	training's binary_logloss: 0.65306	valid_1's binary_logloss: 0.654413
[60]	training's binary_logloss: 0.649187	valid_1's binary_logloss: 0.650597
[70]	training's binary_logloss: 0.6453

[140]	training's binary_logloss: 0.620826	valid_1's binary_logloss: 0.622782
[150]	training's binary_logloss: 0.617577	valid_1's binary_logloss: 0.619608
[160]	training's binary_logloss: 0.614388	valid_1's binary_logloss: 0.616496
[170]	training's binary_logloss: 0.611259	valid_1's binary_logloss: 0.613452
[180]	training's binary_logloss: 0.608191	valid_1's binary_logloss: 0.610483
[190]	training's binary_logloss: 0.605174	valid_1's binary_logloss: 0.607562
[200]	training's binary_logloss: 0.602211	valid_1's binary_logloss: 0.604691
[210]	training's binary_logloss: 0.599303	valid_1's binary_logloss: 0.601876
[220]	training's binary_logloss: 0.596433	valid_1's binary_logloss: 0.5991
[230]	training's binary_logloss: 0.593626	valid_1's binary_logloss: 0.596394
[240]	training's binary_logloss: 0.590863	valid_1's binary_logloss: 0.59373
[250]	training's binary_logloss: 0.588142	valid_1's binary_logloss: 0.591108
[260]	training's binary_logloss: 0.585474	valid_1's binary_logloss: 0.588542
[2

[290]	training's binary_logloss: 0.577707	valid_1's binary_logloss: 0.58122
[300]	training's binary_logloss: 0.575202	valid_1's binary_logloss: 0.578871
[310]	training's binary_logloss: 0.572739	valid_1's binary_logloss: 0.576565
[320]	training's binary_logloss: 0.570319	valid_1's binary_logloss: 0.574296
[330]	training's binary_logloss: 0.567937	valid_1's binary_logloss: 0.572073
[340]	training's binary_logloss: 0.565595	valid_1's binary_logloss: 0.56989
[350]	training's binary_logloss: 0.56329	valid_1's binary_logloss: 0.567726
[360]	training's binary_logloss: 0.561031	valid_1's binary_logloss: 0.565612
[370]	training's binary_logloss: 0.558807	valid_1's binary_logloss: 0.56351
[380]	training's binary_logloss: 0.556613	valid_1's binary_logloss: 0.56145
[390]	training's binary_logloss: 0.554436	valid_1's binary_logloss: 0.559442
[400]	training's binary_logloss: 0.552299	valid_1's binary_logloss: 0.557452
[410]	training's binary_logloss: 0.550192	valid_1's binary_logloss: 0.555506
[420

[450]	training's binary_logloss: 0.542171	valid_1's binary_logloss: 0.548018
[460]	training's binary_logloss: 0.540251	valid_1's binary_logloss: 0.546226
[470]	training's binary_logloss: 0.538362	valid_1's binary_logloss: 0.544466
[480]	training's binary_logloss: 0.536505	valid_1's binary_logloss: 0.542675
[490]	training's binary_logloss: 0.534562	valid_1's binary_logloss: 0.540812
[500]	training's binary_logloss: 0.532637	valid_1's binary_logloss: 0.538976
[510]	training's binary_logloss: 0.530744	valid_1's binary_logloss: 0.537172
[520]	training's binary_logloss: 0.528881	valid_1's binary_logloss: 0.535392
[530]	training's binary_logloss: 0.527048	valid_1's binary_logloss: 0.533625
[540]	training's binary_logloss: 0.525243	valid_1's binary_logloss: 0.531896
[550]	training's binary_logloss: 0.523467	valid_1's binary_logloss: 0.530197
[560]	training's binary_logloss: 0.521718	valid_1's binary_logloss: 0.528527
[570]	training's binary_logloss: 0.519998	valid_1's binary_logloss: 0.526879

[600]	training's binary_logloss: 0.51493	valid_1's binary_logloss: 0.522257
[610]	training's binary_logloss: 0.513265	valid_1's binary_logloss: 0.520916
[620]	training's binary_logloss: 0.511626	valid_1's binary_logloss: 0.51963
[630]	training's binary_logloss: 0.510011	valid_1's binary_logloss: 0.518368
[640]	training's binary_logloss: 0.508422	valid_1's binary_logloss: 0.517122
[650]	training's binary_logloss: 0.506842	valid_1's binary_logloss: 0.515872
[660]	training's binary_logloss: 0.505211	valid_1's binary_logloss: 0.514451
[670]	training's binary_logloss: 0.503616	valid_1's binary_logloss: 0.513085
[680]	training's binary_logloss: 0.502061	valid_1's binary_logloss: 0.511792
[690]	training's binary_logloss: 0.500529	valid_1's binary_logloss: 0.51052
[700]	training's binary_logloss: 0.49903	valid_1's binary_logloss: 0.509244
[710]	training's binary_logloss: 0.497421	valid_1's binary_logloss: 0.508033
[720]	training's binary_logloss: 0.495818	valid_1's binary_logloss: 0.50684
[730

[740]	training's binary_logloss: 0.4927	valid_1's binary_logloss: 0.50453
[750]	training's binary_logloss: 0.491188	valid_1's binary_logloss: 0.503411
[760]	training's binary_logloss: 0.489674	valid_1's binary_logloss: 0.502388
[770]	training's binary_logloss: 0.488181	valid_1's binary_logloss: 0.501382
[780]	training's binary_logloss: 0.486711	valid_1's binary_logloss: 0.500335
[790]	training's binary_logloss: 0.485263	valid_1's binary_logloss: 0.499175
[800]	training's binary_logloss: 0.483826	valid_1's binary_logloss: 0.498076
[810]	training's binary_logloss: 0.482407	valid_1's binary_logloss: 0.49704
[820]	training's binary_logloss: 0.480999	valid_1's binary_logloss: 0.496006
[830]	training's binary_logloss: 0.479644	valid_1's binary_logloss: 0.494974
[840]	training's binary_logloss: 0.478292	valid_1's binary_logloss: 0.49397
[850]	training's binary_logloss: 0.476979	valid_1's binary_logloss: 0.492982
[860]	training's binary_logloss: 0.475638	valid_1's binary_logloss: 0.492082


[870]	training's binary_logloss: 0.474311	valid_1's binary_logloss: 0.491245
[880]	training's binary_logloss: 0.472987	valid_1's binary_logloss: 0.490424
[890]	training's binary_logloss: 0.471697	valid_1's binary_logloss: 0.489622
[900]	training's binary_logloss: 0.470411	valid_1's binary_logloss: 0.488828
[910]	training's binary_logloss: 0.469165	valid_1's binary_logloss: 0.48807
[920]	training's binary_logloss: 0.467923	valid_1's binary_logloss: 0.487348
[930]	training's binary_logloss: 0.466699	valid_1's binary_logloss: 0.486644
[940]	training's binary_logloss: 0.465507	valid_1's binary_logloss: 0.485957
[950]	training's binary_logloss: 0.464319	valid_1's binary_logloss: 0.485287
[960]	training's binary_logloss: 0.463148	valid_1's binary_logloss: 0.484635
[970]	training's binary_logloss: 0.462007	valid_1's binary_logloss: 0.483997
[980]	training's binary_logloss: 0.460869	valid_1's binary_logloss: 0.483377
[990]	training's binary_logloss: 0.459767	valid_1's binary_logloss: 0.482716


[LightGBM] [Info] Number of positive: 143, number of negative: 213
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 162
[LightGBM] [Info] Number of data points in the train set: 356, number of used features: 12
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.401685 -> initscore=-0.398448
[LightGBM] [Info] Start training from score -0.398448
Training until validation scores don't improve for 10 rounds
[10]	training's binary_logloss: 0.669293	valid_1's binary_logloss: 0.670803
[20]	training's binary_logloss: 0.664987	valid_1's binary_logloss: 0.666881
[30]	training's binary_logloss: 0.660769	valid_1's binary_logloss: 0.663045
[40]	training's binary_logloss: 0.65664	valid_1's binary_logloss: 0.659299
[50]	training's binary_logloss: 0.652593	valid_1's binary_logloss: 0.655636
[60]	training's binary_logloss: 0.648629	valid_1's binary_logloss: 0.652062
[70]	training's binary_logloss: 0.644

[150]	training's binary_logloss: 0.61625	valid_1's binary_logloss: 0.623065
[160]	training's binary_logloss: 0.612949	valid_1's binary_logloss: 0.620137
[170]	training's binary_logloss: 0.609713	valid_1's binary_logloss: 0.617267
[180]	training's binary_logloss: 0.606535	valid_1's binary_logloss: 0.614453
[190]	training's binary_logloss: 0.603415	valid_1's binary_logloss: 0.611694
[200]	training's binary_logloss: 0.600347	valid_1's binary_logloss: 0.608987
[210]	training's binary_logloss: 0.59734	valid_1's binary_logloss: 0.606341
[220]	training's binary_logloss: 0.594384	valid_1's binary_logloss: 0.603737
[230]	training's binary_logloss: 0.59148	valid_1's binary_logloss: 0.601183
[240]	training's binary_logloss: 0.588629	valid_1's binary_logloss: 0.598685
[250]	training's binary_logloss: 0.585826	valid_1's binary_logloss: 0.596225
[260]	training's binary_logloss: 0.583072	valid_1's binary_logloss: 0.593812
[270]	training's binary_logloss: 0.580367	valid_1's binary_logloss: 0.59144
[28

[290]	training's binary_logloss: 0.575093	valid_1's binary_logloss: 0.586828
[300]	training's binary_logloss: 0.572524	valid_1's binary_logloss: 0.584594
[310]	training's binary_logloss: 0.569996	valid_1's binary_logloss: 0.582418
[320]	training's binary_logloss: 0.56751	valid_1's binary_logloss: 0.580282
[330]	training's binary_logloss: 0.565065	valid_1's binary_logloss: 0.578186
[340]	training's binary_logloss: 0.562661	valid_1's binary_logloss: 0.576129
[350]	training's binary_logloss: 0.560297	valid_1's binary_logloss: 0.57411
[360]	training's binary_logloss: 0.557971	valid_1's binary_logloss: 0.572127
[370]	training's binary_logloss: 0.555683	valid_1's binary_logloss: 0.570184
[380]	training's binary_logloss: 0.553432	valid_1's binary_logloss: 0.56827
[390]	training's binary_logloss: 0.551218	valid_1's binary_logloss: 0.566398
[400]	training's binary_logloss: 0.549039	valid_1's binary_logloss: 0.564582
[410]	training's binary_logloss: 0.546895	valid_1's binary_logloss: 0.562797
[4

[440]	training's binary_logloss: 0.540666	valid_1's binary_logloss: 0.557656
[450]	training's binary_logloss: 0.538654	valid_1's binary_logloss: 0.556001
[460]	training's binary_logloss: 0.536673	valid_1's binary_logloss: 0.554376
[470]	training's binary_logloss: 0.534722	valid_1's binary_logloss: 0.552776
[480]	training's binary_logloss: 0.532804	valid_1's binary_logloss: 0.551217
[490]	training's binary_logloss: 0.530912	valid_1's binary_logloss: 0.549678
[500]	training's binary_logloss: 0.529059	valid_1's binary_logloss: 0.548215
[510]	training's binary_logloss: 0.527239	valid_1's binary_logloss: 0.546806
[520]	training's binary_logloss: 0.525449	valid_1's binary_logloss: 0.545421
[530]	training's binary_logloss: 0.523689	valid_1's binary_logloss: 0.544066
[540]	training's binary_logloss: 0.521884	valid_1's binary_logloss: 0.54271
[550]	training's binary_logloss: 0.520079	valid_1's binary_logloss: 0.541373


[560]	training's binary_logloss: 0.518314	valid_1's binary_logloss: 0.540038
[570]	training's binary_logloss: 0.516624	valid_1's binary_logloss: 0.538624
[580]	training's binary_logloss: 0.51496	valid_1's binary_logloss: 0.537246
[590]	training's binary_logloss: 0.513323	valid_1's binary_logloss: 0.535903
[600]	training's binary_logloss: 0.51172	valid_1's binary_logloss: 0.534634
[610]	training's binary_logloss: 0.510147	valid_1's binary_logloss: 0.53341
[620]	training's binary_logloss: 0.508593	valid_1's binary_logloss: 0.532198
[630]	training's binary_logloss: 0.507025	valid_1's binary_logloss: 0.531028
[640]	training's binary_logloss: 0.505441	valid_1's binary_logloss: 0.529895
[650]	training's binary_logloss: 0.503882	valid_1's binary_logloss: 0.528782
[660]	training's binary_logloss: 0.502347	valid_1's binary_logloss: 0.527693
[670]	training's binary_logloss: 0.500835	valid_1's binary_logloss: 0.526622
[680]	training's binary_logloss: 0.499347	valid_1's binary_logloss: 0.525575
[6

[700]	training's binary_logloss: 0.496439	valid_1's binary_logloss: 0.523539
[710]	training's binary_logloss: 0.495019	valid_1's binary_logloss: 0.522547
[720]	training's binary_logloss: 0.493602	valid_1's binary_logloss: 0.521581
[730]	training's binary_logloss: 0.492203	valid_1's binary_logloss: 0.52055
[740]	training's binary_logloss: 0.490826	valid_1's binary_logloss: 0.519488
[750]	training's binary_logloss: 0.489489	valid_1's binary_logloss: 0.518431
[760]	training's binary_logloss: 0.488169	valid_1's binary_logloss: 0.517391
[770]	training's binary_logloss: 0.486866	valid_1's binary_logloss: 0.516358
[780]	training's binary_logloss: 0.485582	valid_1's binary_logloss: 0.515352
[790]	training's binary_logloss: 0.484316	valid_1's binary_logloss: 0.514361
[800]	training's binary_logloss: 0.483065	valid_1's binary_logloss: 0.513381
[810]	training's binary_logloss: 0.481827	valid_1's binary_logloss: 0.51242
[820]	training's binary_logloss: 0.480554	valid_1's binary_logloss: 0.511549
[

[840]	training's binary_logloss: 0.477958	valid_1's binary_logloss: 0.510041
[850]	training's binary_logloss: 0.47673	valid_1's binary_logloss: 0.509283
[860]	training's binary_logloss: 0.475523	valid_1's binary_logloss: 0.508563
[870]	training's binary_logloss: 0.474346	valid_1's binary_logloss: 0.507868
[880]	training's binary_logloss: 0.473185	valid_1's binary_logloss: 0.507181
[890]	training's binary_logloss: 0.472034	valid_1's binary_logloss: 0.506506
[900]	training's binary_logloss: 0.470891	valid_1's binary_logloss: 0.505847
[910]	training's binary_logloss: 0.469769	valid_1's binary_logloss: 0.50519
[920]	training's binary_logloss: 0.46866	valid_1's binary_logloss: 0.504554
[930]	training's binary_logloss: 0.467552	valid_1's binary_logloss: 0.503879
[940]	training's binary_logloss: 0.466314	valid_1's binary_logloss: 0.502835
[950]	training's binary_logloss: 0.465089	valid_1's binary_logloss: 0.501809
[960]	training's binary_logloss: 0.463961	valid_1's binary_logloss: 0.500953
[9

[1000]	training's binary_logloss: 0.459697	valid_1's binary_logloss: 0.498155
Did not meet early stopping. Best iteration is:
[1000]	training's binary_logloss: 0.459697	valid_1's binary_logloss: 0.498155
[LightGBM] [Info] Number of positive: 144, number of negative: 212
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 159
[LightGBM] [Info] Number of data points in the train set: 356, number of used features: 12
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.404494 -> initscore=-0.386773
[LightGBM] [Info] Start training from score -0.386773
Training until validation scores don't improve for 10 rounds
[10]	training's binary_logloss: 0.670242	valid_1's binary_logloss: 0.666697
[20]	training's binary_logloss: 0.665787	valid_1's binary_logloss: 0.66303
[30]	training's binary_logloss: 0.661423	valid_1's binary_logloss: 0.659469
[40]	training's binary_logloss: 0.657148	valid_1's binary_log

[200]	training's binary_logloss: 0.599001	valid_1's binary_logloss: 0.60947
[210]	training's binary_logloss: 0.595915	valid_1's binary_logloss: 0.607043
[220]	training's binary_logloss: 0.592884	valid_1's binary_logloss: 0.604661
[230]	training's binary_logloss: 0.589907	valid_1's binary_logloss: 0.602327
[240]	training's binary_logloss: 0.586983	valid_1's binary_logloss: 0.600039
[250]	training's binary_logloss: 0.58411	valid_1's binary_logloss: 0.597802
[260]	training's binary_logloss: 0.581288	valid_1's binary_logloss: 0.595604
[270]	training's binary_logloss: 0.578514	valid_1's binary_logloss: 0.593449
[280]	training's binary_logloss: 0.575789	valid_1's binary_logloss: 0.591336
[290]	training's binary_logloss: 0.573111	valid_1's binary_logloss: 0.589267
[300]	training's binary_logloss: 0.570479	valid_1's binary_logloss: 0.587237
[310]	training's binary_logloss: 0.567892	valid_1's binary_logloss: 0.585245
[320]	training's binary_logloss: 0.565349	valid_1's binary_logloss: 0.583293
[

[360]	training's binary_logloss: 0.555598	valid_1's binary_logloss: 0.575854
[370]	training's binary_logloss: 0.553261	valid_1's binary_logloss: 0.574087
[380]	training's binary_logloss: 0.550963	valid_1's binary_logloss: 0.57235
[390]	training's binary_logloss: 0.548703	valid_1's binary_logloss: 0.570648
[400]	training's binary_logloss: 0.54648	valid_1's binary_logloss: 0.568977
[410]	training's binary_logloss: 0.544293	valid_1's binary_logloss: 0.567337
[420]	training's binary_logloss: 0.542141	valid_1's binary_logloss: 0.565728
[430]	training's binary_logloss: 0.540024	valid_1's binary_logloss: 0.56415
[440]	training's binary_logloss: 0.53794	valid_1's binary_logloss: 0.5626
[450]	training's binary_logloss: 0.535889	valid_1's binary_logloss: 0.56108
[460]	training's binary_logloss: 0.533871	valid_1's binary_logloss: 0.559588
[470]	training's binary_logloss: 0.531833	valid_1's binary_logloss: 0.558224
[480]	training's binary_logloss: 0.529759	valid_1's binary_logloss: 0.557014
[490]	

[510]	training's binary_logloss: 0.523738	valid_1's binary_logloss: 0.553495
[520]	training's binary_logloss: 0.521786	valid_1's binary_logloss: 0.552383
[530]	training's binary_logloss: 0.519877	valid_1's binary_logloss: 0.551261
[540]	training's binary_logloss: 0.517982	valid_1's binary_logloss: 0.550196
[550]	training's binary_logloss: 0.516114	valid_1's binary_logloss: 0.549154
[560]	training's binary_logloss: 0.514289	valid_1's binary_logloss: 0.548136
[570]	training's binary_logloss: 0.512461	valid_1's binary_logloss: 0.547197
[580]	training's binary_logloss: 0.510635	valid_1's binary_logloss: 0.546321
[590]	training's binary_logloss: 0.508834	valid_1's binary_logloss: 0.54546
[600]	training's binary_logloss: 0.50706	valid_1's binary_logloss: 0.544619
[610]	training's binary_logloss: 0.50521	valid_1's binary_logloss: 0.543795
[620]	training's binary_logloss: 0.503321	valid_1's binary_logloss: 0.542972
[630]	training's binary_logloss: 0.501459	valid_1's binary_logloss: 0.542171
[6

[650]	training's binary_logloss: 0.497819	valid_1's binary_logloss: 0.54064
[660]	training's binary_logloss: 0.49604	valid_1's binary_logloss: 0.539904
[670]	training's binary_logloss: 0.494287	valid_1's binary_logloss: 0.539182
[680]	training's binary_logloss: 0.492557	valid_1's binary_logloss: 0.538477
[690]	training's binary_logloss: 0.490834	valid_1's binary_logloss: 0.537782
[700]	training's binary_logloss: 0.489137	valid_1's binary_logloss: 0.537096
[710]	training's binary_logloss: 0.487464	valid_1's binary_logloss: 0.536422
[720]	training's binary_logloss: 0.485815	valid_1's binary_logloss: 0.535784
[730]	training's binary_logloss: 0.484191	valid_1's binary_logloss: 0.535157
[740]	training's binary_logloss: 0.48259	valid_1's binary_logloss: 0.534543
[750]	training's binary_logloss: 0.481012	valid_1's binary_logloss: 0.533959


[760]	training's binary_logloss: 0.479457	valid_1's binary_logloss: 0.53338
[770]	training's binary_logloss: 0.477924	valid_1's binary_logloss: 0.532829
[780]	training's binary_logloss: 0.476413	valid_1's binary_logloss: 0.532278
[790]	training's binary_logloss: 0.474924	valid_1's binary_logloss: 0.53175
[800]	training's binary_logloss: 0.473483	valid_1's binary_logloss: 0.531238
[810]	training's binary_logloss: 0.47207	valid_1's binary_logloss: 0.53073
[820]	training's binary_logloss: 0.470676	valid_1's binary_logloss: 0.53024
[830]	training's binary_logloss: 0.469302	valid_1's binary_logloss: 0.52976
[840]	training's binary_logloss: 0.46794	valid_1's binary_logloss: 0.529296
[850]	training's binary_logloss: 0.466604	valid_1's binary_logloss: 0.528854
[860]	training's binary_logloss: 0.465286	valid_1's binary_logloss: 0.52841
[870]	training's binary_logloss: 0.463987	valid_1's binary_logloss: 0.527994


[880]	training's binary_logloss: 0.462706	valid_1's binary_logloss: 0.527569
[890]	training's binary_logloss: 0.461442	valid_1's binary_logloss: 0.527135
[900]	training's binary_logloss: 0.460154	valid_1's binary_logloss: 0.526692
[910]	training's binary_logloss: 0.458789	valid_1's binary_logloss: 0.526307
[920]	training's binary_logloss: 0.457427	valid_1's binary_logloss: 0.52595
[930]	training's binary_logloss: 0.456071	valid_1's binary_logloss: 0.525628
[940]	training's binary_logloss: 0.454763	valid_1's binary_logloss: 0.525263
[950]	training's binary_logloss: 0.453452	valid_1's binary_logloss: 0.524944
[960]	training's binary_logloss: 0.452157	valid_1's binary_logloss: 0.524639
[970]	training's binary_logloss: 0.450886	valid_1's binary_logloss: 0.524336
[980]	training's binary_logloss: 0.449623	valid_1's binary_logloss: 0.524049
[990]	training's binary_logloss: 0.448376	valid_1's binary_logloss: 0.523789
[1000]	training's binary_logloss: 0.447151	valid_1's binary_logloss: 0.523516

In [48]:
scores = [
    m.best_score['valid_1']['binary_logloss'] for m in models
]
score = sum(scores) / len(scores)
print('===CV scores===')
print(scores)
print(score)

===CV scores===
[0.4747349192688233, 0.49839142060163505, 0.48202954600856535, 0.49815527277434113, 0.5235159121141884]
0.49536541415351065


In [53]:
y_preds[0]

array([0.16148024, 0.78257918, 0.51382929, 0.33266366, 0.476259  ,
       0.43473274, 0.38472533, 0.19229033, 0.51785077, 0.66268578,
       0.31772435, 0.3809209 , 0.18543091, 0.22333822, 0.55562387,
       0.43601714, 0.41999877, 0.75167726, 0.43601714, 0.476259  ,
       0.1690397 , 0.38472533, 0.55562387, 0.43473274, 0.32246416,
       0.20760048, 0.28763458, 0.38472533, 0.47091458, 0.1690397 ,
       0.78257918, 0.476259  , 0.37364392, 0.28003729, 0.476259  ,
       0.38105202, 0.34098484, 0.66268578, 0.51785077, 0.38472533,
       0.31332294, 0.16096273, 0.25827974, 0.32246416, 0.47091458,
       0.43473274, 0.31064553, 0.3809209 , 0.16838872, 0.31772048,
       0.476259  , 0.41233792, 0.43601714, 0.51382929, 0.25827974,
       0.43601714, 0.22959841, 0.19314699, 0.26892454, 0.2432576 ,
       0.22916929, 0.49606106, 0.43869377, 0.22510311, 0.43601714,
       0.31244848, 0.476259  , 0.16096273, 0.3809209 , 0.66268578,
       0.49606106, 0.51785077, 0.38472533, 0.18512697, 0.20386

In [54]:
#提出用関数
sample[1] = y_preds[0]
sample.to_csv(f'submit/lightgbm3.tsv',sep='\t', header=None)