In [1]:
import lightgbm as lgb
import pandas as pd


df_train = pd.read_csv("./regression.train", header=None, sep="\t")
y = df_train[0]
X = df_train.drop(0, axis=1)


df_test = pd.read_csv("./regression.test", header=None, sep="\t")
y_test = df_train[0]
X_test = df_train.drop(0, axis=1)

train_data = lgb.Dataset(data=X, label=y)
lgb_eval = lgb.Dataset(X_test, y_test, reference=train_data)

params = {'boosting_type': 'gbdt',
          'objective': 'regression',
          'metric': {'l2', 'l1'},
         'num_leaves': 24,
        'feature_fraction': 0.7,
        'bagging_fraction': 0.85,
        'max_depth': 5,
         'learning_rate': 0.02,
        'lambda_l1': 1,
        'lambda_l2': 1,
        'min_split_gain': 0.01,
        'min_child_weight': 10}

gbm = lgb.train(params, train_data, num_boost_round=3000, valid_sets=lgb_eval, early_stopping_rounds=10)

y_pred = gbm.predict(X_test, num_iteration=gbm.best_iteration)
print("the shape of y_pred", y_pred.shape)
print("the shape of y_truth", y_test.shape)
print(sum((y_pred > 0.5) == y_test))
                                    

[1]	valid_0's l1: 0.496232	valid_0's l2: 0.247204
Training until validation scores don't improve for 10 rounds.
[2]	valid_0's l1: 0.494701	valid_0's l2: 0.245712
[3]	valid_0's l1: 0.493282	valid_0's l2: 0.244335
[4]	valid_0's l1: 0.492212	valid_0's l2: 0.243313
[5]	valid_0's l1: 0.490486	valid_0's l2: 0.24168
[6]	valid_0's l1: 0.488977	valid_0's l2: 0.240275
[7]	valid_0's l1: 0.48754	valid_0's l2: 0.238944
[8]	valid_0's l1: 0.486135	valid_0's l2: 0.237652
[9]	valid_0's l1: 0.48488	valid_0's l2: 0.236514
[10]	valid_0's l1: 0.483417	valid_0's l2: 0.235205
[11]	valid_0's l1: 0.482388	valid_0's l2: 0.234288
[12]	valid_0's l1: 0.480743	valid_0's l2: 0.232852
[13]	valid_0's l1: 0.480059	valid_0's l2: 0.232223
[14]	valid_0's l1: 0.478711	valid_0's l2: 0.231065
[15]	valid_0's l1: 0.477369	valid_0's l2: 0.229923
[16]	valid_0's l1: 0.476113	valid_0's l2: 0.228854
[17]	valid_0's l1: 0.474724	valid_0's l2: 0.227705
[18]	valid_0's l1: 0.473703	valid_0's l2: 0.226831
[19]	valid_0's l1: 0.472454	vali

[206]	valid_0's l1: 0.364592	valid_0's l2: 0.160888
[207]	valid_0's l1: 0.364252	valid_0's l2: 0.160731
[208]	valid_0's l1: 0.363996	valid_0's l2: 0.160566
[209]	valid_0's l1: 0.363833	valid_0's l2: 0.160481
[210]	valid_0's l1: 0.363637	valid_0's l2: 0.160381
[211]	valid_0's l1: 0.363417	valid_0's l2: 0.160256
[212]	valid_0's l1: 0.363287	valid_0's l2: 0.160191
[213]	valid_0's l1: 0.363051	valid_0's l2: 0.160024
[214]	valid_0's l1: 0.362905	valid_0's l2: 0.159927
[215]	valid_0's l1: 0.362732	valid_0's l2: 0.159828
[216]	valid_0's l1: 0.362481	valid_0's l2: 0.159676
[217]	valid_0's l1: 0.362303	valid_0's l2: 0.15957
[218]	valid_0's l1: 0.362159	valid_0's l2: 0.159477
[219]	valid_0's l1: 0.361875	valid_0's l2: 0.159297
[220]	valid_0's l1: 0.361758	valid_0's l2: 0.15923
[221]	valid_0's l1: 0.361577	valid_0's l2: 0.159104
[222]	valid_0's l1: 0.361276	valid_0's l2: 0.158945
[223]	valid_0's l1: 0.361015	valid_0's l2: 0.158776
[224]	valid_0's l1: 0.360778	valid_0's l2: 0.158647
[225]	valid_0'

[377]	valid_0's l1: 0.337516	valid_0's l2: 0.144056
[378]	valid_0's l1: 0.337415	valid_0's l2: 0.14398
[379]	valid_0's l1: 0.337343	valid_0's l2: 0.143932
[380]	valid_0's l1: 0.337255	valid_0's l2: 0.143865
[381]	valid_0's l1: 0.337117	valid_0's l2: 0.143766
[382]	valid_0's l1: 0.336953	valid_0's l2: 0.143655
[383]	valid_0's l1: 0.336911	valid_0's l2: 0.143624
[384]	valid_0's l1: 0.336787	valid_0's l2: 0.14354
[385]	valid_0's l1: 0.336664	valid_0's l2: 0.143458
[386]	valid_0's l1: 0.3366	valid_0's l2: 0.143427
[387]	valid_0's l1: 0.336528	valid_0's l2: 0.143368
[388]	valid_0's l1: 0.336285	valid_0's l2: 0.143225
[389]	valid_0's l1: 0.336155	valid_0's l2: 0.14316
[390]	valid_0's l1: 0.336061	valid_0's l2: 0.143108
[391]	valid_0's l1: 0.335907	valid_0's l2: 0.143007
[392]	valid_0's l1: 0.335836	valid_0's l2: 0.142952
[393]	valid_0's l1: 0.335767	valid_0's l2: 0.142894
[394]	valid_0's l1: 0.335684	valid_0's l2: 0.142828
[395]	valid_0's l1: 0.33552	valid_0's l2: 0.142725
[396]	valid_0's l1

[546]	valid_0's l1: 0.318853	valid_0's l2: 0.131161
[547]	valid_0's l1: 0.318735	valid_0's l2: 0.131065
[548]	valid_0's l1: 0.318639	valid_0's l2: 0.131006
[549]	valid_0's l1: 0.318493	valid_0's l2: 0.1309
[550]	valid_0's l1: 0.318402	valid_0's l2: 0.130834
[551]	valid_0's l1: 0.318291	valid_0's l2: 0.130742
[552]	valid_0's l1: 0.318211	valid_0's l2: 0.130691
[553]	valid_0's l1: 0.318074	valid_0's l2: 0.130591
[554]	valid_0's l1: 0.317939	valid_0's l2: 0.130492
[555]	valid_0's l1: 0.317801	valid_0's l2: 0.130396
[556]	valid_0's l1: 0.317674	valid_0's l2: 0.130302
[557]	valid_0's l1: 0.317597	valid_0's l2: 0.13025
[558]	valid_0's l1: 0.317519	valid_0's l2: 0.130193
[559]	valid_0's l1: 0.31746	valid_0's l2: 0.130144
[560]	valid_0's l1: 0.31741	valid_0's l2: 0.130107
[561]	valid_0's l1: 0.317268	valid_0's l2: 0.129995
[562]	valid_0's l1: 0.317196	valid_0's l2: 0.129955
[563]	valid_0's l1: 0.317139	valid_0's l2: 0.129911
[564]	valid_0's l1: 0.317083	valid_0's l2: 0.129865
[565]	valid_0's l

[744]	valid_0's l1: 0.29982	valid_0's l2: 0.117907
[745]	valid_0's l1: 0.299695	valid_0's l2: 0.11782
[746]	valid_0's l1: 0.299578	valid_0's l2: 0.117733
[747]	valid_0's l1: 0.299427	valid_0's l2: 0.117634
[748]	valid_0's l1: 0.299368	valid_0's l2: 0.117588
[749]	valid_0's l1: 0.299295	valid_0's l2: 0.117539
[750]	valid_0's l1: 0.299169	valid_0's l2: 0.117458
[751]	valid_0's l1: 0.299102	valid_0's l2: 0.117421
[752]	valid_0's l1: 0.299051	valid_0's l2: 0.117384
[753]	valid_0's l1: 0.29892	valid_0's l2: 0.117296
[754]	valid_0's l1: 0.298792	valid_0's l2: 0.117216
[755]	valid_0's l1: 0.29866	valid_0's l2: 0.117124
[756]	valid_0's l1: 0.298544	valid_0's l2: 0.117032
[757]	valid_0's l1: 0.298439	valid_0's l2: 0.116959
[758]	valid_0's l1: 0.298373	valid_0's l2: 0.116915
[759]	valid_0's l1: 0.298259	valid_0's l2: 0.116834
[760]	valid_0's l1: 0.298166	valid_0's l2: 0.116775
[761]	valid_0's l1: 0.298064	valid_0's l2: 0.116687
[762]	valid_0's l1: 0.297991	valid_0's l2: 0.116634
[763]	valid_0's 

[931]	valid_0's l1: 0.283074	valid_0's l2: 0.106413
[932]	valid_0's l1: 0.283019	valid_0's l2: 0.106379
[933]	valid_0's l1: 0.282908	valid_0's l2: 0.106303
[934]	valid_0's l1: 0.282793	valid_0's l2: 0.106223
[935]	valid_0's l1: 0.282662	valid_0's l2: 0.106139
[936]	valid_0's l1: 0.282604	valid_0's l2: 0.106104
[937]	valid_0's l1: 0.282538	valid_0's l2: 0.10606
[938]	valid_0's l1: 0.282405	valid_0's l2: 0.105985
[939]	valid_0's l1: 0.282369	valid_0's l2: 0.105961
[940]	valid_0's l1: 0.282276	valid_0's l2: 0.105905
[941]	valid_0's l1: 0.282184	valid_0's l2: 0.105847
[942]	valid_0's l1: 0.282078	valid_0's l2: 0.105774
[943]	valid_0's l1: 0.281948	valid_0's l2: 0.105697
[944]	valid_0's l1: 0.281879	valid_0's l2: 0.105652
[945]	valid_0's l1: 0.281794	valid_0's l2: 0.105592
[946]	valid_0's l1: 0.281689	valid_0's l2: 0.105522
[947]	valid_0's l1: 0.281586	valid_0's l2: 0.105464
[948]	valid_0's l1: 0.281531	valid_0's l2: 0.105425
[949]	valid_0's l1: 0.281458	valid_0's l2: 0.105374
[950]	valid_0

[1178]	valid_0's l1: 0.262751	valid_0's l2: 0.0931867
[1179]	valid_0's l1: 0.262656	valid_0's l2: 0.0931224
[1180]	valid_0's l1: 0.262545	valid_0's l2: 0.0930568
[1181]	valid_0's l1: 0.262454	valid_0's l2: 0.0930016
[1182]	valid_0's l1: 0.262365	valid_0's l2: 0.092942
[1183]	valid_0's l1: 0.262261	valid_0's l2: 0.0928692
[1184]	valid_0's l1: 0.262198	valid_0's l2: 0.0928313
[1185]	valid_0's l1: 0.26211	valid_0's l2: 0.092768
[1186]	valid_0's l1: 0.262018	valid_0's l2: 0.0927053
[1187]	valid_0's l1: 0.261951	valid_0's l2: 0.0926585
[1188]	valid_0's l1: 0.261924	valid_0's l2: 0.092639
[1189]	valid_0's l1: 0.261809	valid_0's l2: 0.0925701
[1190]	valid_0's l1: 0.261721	valid_0's l2: 0.0925197
[1191]	valid_0's l1: 0.261603	valid_0's l2: 0.0924528
[1192]	valid_0's l1: 0.261526	valid_0's l2: 0.0923909
[1193]	valid_0's l1: 0.261444	valid_0's l2: 0.0923358
[1194]	valid_0's l1: 0.261374	valid_0's l2: 0.0922913
[1195]	valid_0's l1: 0.261289	valid_0's l2: 0.0922313
[1196]	valid_0's l1: 0.261201	va

[1342]	valid_0's l1: 0.249674	valid_0's l2: 0.0849754
[1343]	valid_0's l1: 0.249594	valid_0's l2: 0.0849223
[1344]	valid_0's l1: 0.249509	valid_0's l2: 0.0848662
[1345]	valid_0's l1: 0.249405	valid_0's l2: 0.0847967
[1346]	valid_0's l1: 0.249368	valid_0's l2: 0.0847748
[1347]	valid_0's l1: 0.249273	valid_0's l2: 0.0847145
[1348]	valid_0's l1: 0.249205	valid_0's l2: 0.0846729
[1349]	valid_0's l1: 0.249135	valid_0's l2: 0.0846307
[1350]	valid_0's l1: 0.249029	valid_0's l2: 0.0845647
[1351]	valid_0's l1: 0.248936	valid_0's l2: 0.0845103
[1352]	valid_0's l1: 0.248889	valid_0's l2: 0.0844844
[1353]	valid_0's l1: 0.248819	valid_0's l2: 0.0844383
[1354]	valid_0's l1: 0.24874	valid_0's l2: 0.0843858
[1355]	valid_0's l1: 0.248656	valid_0's l2: 0.0843365
[1356]	valid_0's l1: 0.248607	valid_0's l2: 0.0843053
[1357]	valid_0's l1: 0.248542	valid_0's l2: 0.0842648
[1358]	valid_0's l1: 0.248468	valid_0's l2: 0.0842181
[1359]	valid_0's l1: 0.248408	valid_0's l2: 0.0841749
[1360]	valid_0's l1: 0.248319

[1500]	valid_0's l1: 0.238403	valid_0's l2: 0.0780935
[1501]	valid_0's l1: 0.238329	valid_0's l2: 0.078048
[1502]	valid_0's l1: 0.238245	valid_0's l2: 0.0780006
[1503]	valid_0's l1: 0.238172	valid_0's l2: 0.0779559
[1504]	valid_0's l1: 0.238106	valid_0's l2: 0.0779136
[1505]	valid_0's l1: 0.238025	valid_0's l2: 0.0778722
[1506]	valid_0's l1: 0.237995	valid_0's l2: 0.0778526
[1507]	valid_0's l1: 0.237917	valid_0's l2: 0.0778082
[1508]	valid_0's l1: 0.237849	valid_0's l2: 0.0777725
[1509]	valid_0's l1: 0.237793	valid_0's l2: 0.0777375
[1510]	valid_0's l1: 0.237701	valid_0's l2: 0.0776842
[1511]	valid_0's l1: 0.237599	valid_0's l2: 0.0776306
[1512]	valid_0's l1: 0.237516	valid_0's l2: 0.0775808
[1513]	valid_0's l1: 0.23742	valid_0's l2: 0.0775294
[1514]	valid_0's l1: 0.237361	valid_0's l2: 0.077499
[1515]	valid_0's l1: 0.23728	valid_0's l2: 0.0774535
[1516]	valid_0's l1: 0.237175	valid_0's l2: 0.0773979
[1517]	valid_0's l1: 0.237114	valid_0's l2: 0.0773628
[1518]	valid_0's l1: 0.237039	va

[1662]	valid_0's l1: 0.228031	valid_0's l2: 0.0719163
[1663]	valid_0's l1: 0.227983	valid_0's l2: 0.0718917
[1664]	valid_0's l1: 0.227897	valid_0's l2: 0.0718411
[1665]	valid_0's l1: 0.227835	valid_0's l2: 0.0717987
[1666]	valid_0's l1: 0.227763	valid_0's l2: 0.071751
[1667]	valid_0's l1: 0.227714	valid_0's l2: 0.0717221
[1668]	valid_0's l1: 0.227647	valid_0's l2: 0.0716778
[1669]	valid_0's l1: 0.227577	valid_0's l2: 0.0716363
[1670]	valid_0's l1: 0.227532	valid_0's l2: 0.0716112
[1671]	valid_0's l1: 0.22747	valid_0's l2: 0.0715715
[1672]	valid_0's l1: 0.227391	valid_0's l2: 0.0715225
[1673]	valid_0's l1: 0.227334	valid_0's l2: 0.0714939
[1674]	valid_0's l1: 0.227291	valid_0's l2: 0.07147
[1675]	valid_0's l1: 0.227217	valid_0's l2: 0.0714238
[1676]	valid_0's l1: 0.227144	valid_0's l2: 0.0713791
[1677]	valid_0's l1: 0.227067	valid_0's l2: 0.0713326
[1678]	valid_0's l1: 0.227015	valid_0's l2: 0.0713054
[1679]	valid_0's l1: 0.226941	valid_0's l2: 0.0712595
[1680]	valid_0's l1: 0.226872	va

[1853]	valid_0's l1: 0.216277	valid_0's l2: 0.065206
[1854]	valid_0's l1: 0.216232	valid_0's l2: 0.065182
[1855]	valid_0's l1: 0.216159	valid_0's l2: 0.065141
[1856]	valid_0's l1: 0.216098	valid_0's l2: 0.0651079
[1857]	valid_0's l1: 0.216044	valid_0's l2: 0.0650763
[1858]	valid_0's l1: 0.215977	valid_0's l2: 0.0650359
[1859]	valid_0's l1: 0.215919	valid_0's l2: 0.0650023
[1860]	valid_0's l1: 0.215883	valid_0's l2: 0.0649746
[1861]	valid_0's l1: 0.215821	valid_0's l2: 0.0649393
[1862]	valid_0's l1: 0.215742	valid_0's l2: 0.0648922
[1863]	valid_0's l1: 0.215687	valid_0's l2: 0.0648614
[1864]	valid_0's l1: 0.215627	valid_0's l2: 0.0648301
[1865]	valid_0's l1: 0.215538	valid_0's l2: 0.0647843
[1866]	valid_0's l1: 0.215477	valid_0's l2: 0.0647502
[1867]	valid_0's l1: 0.215406	valid_0's l2: 0.0647124
[1868]	valid_0's l1: 0.215326	valid_0's l2: 0.0646688
[1869]	valid_0's l1: 0.21526	valid_0's l2: 0.0646304
[1870]	valid_0's l1: 0.21519	valid_0's l2: 0.064591
[1871]	valid_0's l1: 0.2151	valid_

[2188]	valid_0's l1: 0.196777	valid_0's l2: 0.0546186
[2189]	valid_0's l1: 0.196743	valid_0's l2: 0.0546025
[2190]	valid_0's l1: 0.196673	valid_0's l2: 0.0545681
[2191]	valid_0's l1: 0.196603	valid_0's l2: 0.054532
[2192]	valid_0's l1: 0.19658	valid_0's l2: 0.0545194
[2193]	valid_0's l1: 0.196515	valid_0's l2: 0.0544852
[2194]	valid_0's l1: 0.196464	valid_0's l2: 0.0544588
[2195]	valid_0's l1: 0.196419	valid_0's l2: 0.0544368
[2196]	valid_0's l1: 0.196365	valid_0's l2: 0.0544077
[2197]	valid_0's l1: 0.196321	valid_0's l2: 0.0543848
[2198]	valid_0's l1: 0.19628	valid_0's l2: 0.0543665
[2199]	valid_0's l1: 0.196231	valid_0's l2: 0.0543398
[2200]	valid_0's l1: 0.196161	valid_0's l2: 0.0543097
[2201]	valid_0's l1: 0.196102	valid_0's l2: 0.0542827
[2202]	valid_0's l1: 0.196058	valid_0's l2: 0.0542593
[2203]	valid_0's l1: 0.196	valid_0's l2: 0.0542279
[2204]	valid_0's l1: 0.195938	valid_0's l2: 0.0542018
[2205]	valid_0's l1: 0.195881	valid_0's l2: 0.0541695
[2206]	valid_0's l1: 0.195836	vali

In [2]:
gbm.best_score

defaultdict(dict,
            {'valid_0': {'l1': 0.1944152325749874,
              'l2': 0.053404592286744504}})