forked from allenai/allennlp
-
Notifications
You must be signed in to change notification settings - Fork 0
/
latest_results_old
410 lines (384 loc) · 14.8 KB
/
latest_results_old
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
/data/tagger/chunk-iobes_conll02_tagger_crf_template
training_duration 02:25:47
training_start_epoch 0
training_epochs 38
training_precision-overall 0.9998878274037653
training_recall-overall 0.9998878274037653
training_f1-measure-overall 0.9998878274037153
training_loss 0.5204149484634399
validation_precision-overall 0.9316013628620102
validation_recall-overall 0.9400085947571981
validation_f1-measure-overall 0.9357860962566347
validation_loss 240.97845458984375
test_precision-overall 0.934309554973822
test_recall-overall 0.9348448882704429
test_f1-measure-overall 0.9345771449612855
/data/tagger/chunk-iobes_conll03_tagger_crf_template
training_duration 01:18:24
training_start_epoch 0
training_epochs 14
training_precision-overall 0.999310013799724
training_recall-overall 0.999359980799424
training_f1-measure-overall 0.9993349966749333
training_loss 1.5395371913909912
validation_precision-overall 0.9056926364872742
validation_recall-overall 0.9056222558961806
validation_f1-measure-overall 0.9056574448243205
validation_loss 187.4296112060547
test_precision-overall 0.8982826345117384
test_recall-overall 0.8931425976385104
test_f1-measure-overall 0.8957052420639843
/data/tagger/com_broadcast1_tagger_crf_template
training_duration 00:04:15
training_start_epoch 0
training_epochs 13
training_precision-overall 0.8698769334989274
training_recall-overall 0.8698769334989274
training_f1-measure-overall 0.8698769334988774
training_loss 175.78018188476562
validation_precision-overall 0.6795774647887324
validation_recall-overall 0.6795774647887324
validation_f1-measure-overall 0.6795774647886824
validation_loss 321.7848815917969
test_precision-overall 0.7348484848484849
test_recall-overall 0.7348484848484849
test_f1-measure-overall 0.7348484848484348
/data/tagger/com_broadcast2_tagger_crf_template
training_duration 00:04:20
training_start_epoch 0
training_epochs 13
training_precision-overall 0.8921563083187242
training_recall-overall 0.8921563083187242
training_f1-measure-overall 0.8921563083186742
training_loss 135.85646057128906
validation_precision-overall 0.7580739870816207
validation_recall-overall 0.7580739870816207
validation_f1-measure-overall 0.7580739870815707
validation_loss 247.6552734375
test_precision-overall 0.7869654817104585
test_recall-overall 0.7869654817104585
test_f1-measure-overall 0.7869654817104086
/data/tagger/com_broadcast3_tagger_crf_template
training_duration 00:07:10
training_start_epoch 0
training_epochs 23
training_precision-overall 0.9620539501215857
training_recall-overall 0.9620539501215857
training_f1-measure-overall 0.9620539501215357
training_loss 63.20952606201172
validation_precision-overall 0.6881972988843218
validation_recall-overall 0.6881972988843218
validation_f1-measure-overall 0.6881972988842718
validation_loss 633.2294311523438
test_precision-overall 0.6725914477073673
test_recall-overall 0.6725914477073673
test_f1-measure-overall 0.6725914477073174
/data/tagger/ner-iobes_conll03_tagger_crf_template
training_duration 01:49:22
training_start_epoch 0
training_epochs 34
training_precision-overall 0.9998297727466168
training_recall-overall 0.9997872249882974
training_f1-measure-overall 0.9998084984147424
training_loss 0.04951019212603569
validation_precision-overall 0.9295633260833194
validation_recall-overall 0.9350387075058902
validation_f1-measure-overall 0.9322929775987417
validation_loss 73.9247055053711
test_precision-overall 0.8734353268428373
test_recall-overall 0.8895184135977338
test_f1-measure-overall 0.8814035087718799
/data/tagger/ner_conll03_tagger_crf_template
training_duration 01:36:22
training_start_epoch 0
training_epochs 23
training_precision-overall 0.9998723186925434
training_recall-overall 0.9997446699859569
training_f1-measure-overall 0.9998084902648718
training_loss 0.048641666769981384
validation_precision-overall 0.9191213180229656
validation_recall-overall 0.9294850218781555
validation_f1-measure-overall 0.9242741193205091
validation_loss 60.833248138427734
test_precision-overall 0.864321608040201
test_recall-overall 0.8831444759206799
test_f1-measure-overall 0.873631666520661
/data/tagger/supsense_streusle_tagger_crf_template
training_duration 00:43:23
training_start_epoch 0
training_epochs 42
training_precision-overall 0.9997770966843131
training_recall-overall 0.9998328131966117
training_f1-measure-overall 0.9998049541641786
training_loss 2.6690115928649902
validation_precision-overall 0.6803435114503816
validation_recall-overall 0.6672905942910622
validation_f1-measure-overall 0.6737538388849016
validation_loss 313.3295593261719
test_precision-overall 0.6746987951807228
test_recall-overall 0.6548175865294668
test_f1-measure-overall 0.6646095418940872
/data/tagger/mwe_streusle_tagger_crf_template
training_duration 00:12:36
training_start_epoch 0
training_epochs 15
training_precision-overall 0.9773391812865497
training_recall-overall 0.9705284552845529
training_f1-measure-overall 0.9739219114218615
training_loss 11.303165435791016
validation_precision-overall 0.5502793296089384
validation_recall-overall 0.49127182044887774
validation_f1-measure-overall 0.5191040843214259
validation_loss 176.8157958984375
test_precision-overall 0.5483870967741935
test_recall-overall 0.5071599045346061
test_f1-measure-overall 0.5269683818970363
/data/tagger/smwe_streusle_tagger_crf_template
training_duration 00:18:28
training_start_epoch 0
training_epochs 21
training_precision-overall 0.9994757077944775
training_recall-overall 0.9982544946762087
training_f1-measure-overall 0.9988647279713062
training_loss 0.7053992748260498
validation_precision-overall 0.5620567375886524
validation_recall-overall 0.478129713423831
validation_f1-measure-overall 0.516707416462868
validation_loss 266.6455993652344
test_precision-overall 0.559618441971383
test_recall-overall 0.5325264750378214
test_f1-measure-overall 0.545736434108477
/data/tagger/sem_semcor_tagger_crf_template
training_duration 02:04:49
training_start_epoch 0
training_epochs 20
training_precision-overall 0.9913848486405921
training_recall-overall 0.9913593729924194
training_f1-measure-overall 0.9913721106527916
training_loss 13.041400909423828
validation_precision-overall 0.738763899663822
validation_recall-overall 0.7415252037585007
validation_f1-measure-overall 0.7401419762681505
validation_loss 489.9003601074219
test_precision-overall 0.747529297402387
test_recall-overall 0.7486411206360367
test_f1-measure-overall 0.7480847959141814
/data/tagger/semtr_semtraits_tagger_crf_template
training_duration 01:13:42
training_start_epoch 0
training_epochs 15
training_precision-overall 0.9902525349148651
training_recall-overall 0.9901388782615349
training_f1-measure-overall 0.9901957033267152
training_loss 10.7341947555542
validation_precision-overall 0.7254643656962192
validation_recall-overall 0.7283428117973813
validation_f1-measure-overall 0.7269007391762964
validation_loss 651.2142944335938
test_precision-overall 0.740308019118428
test_recall-overall 0.7424107935380792
test_f1-measure-overall 0.7413579152632012
/data/tagger/multitagger_multi_xpos
training_duration 02:19:31
training_start_epoch 0
training_epochs 16
training_f1-measure-overall 0.9988322579362915
training_xpos-f1-measure-overall 0.9988322579362915
training_loss 3.6433939933776855
validation_f1-measure-overall 0.9464983395193874
validation_xpos-f1-measure-overall 0.9464983395193874
validation_loss 120.0270767211914
test_f1-measure-overall 0.9446250260036946
test_xpos-f1-measure-overall 0.9446250260036946
/data/tagger/multitagger_multi_upos
training_duration 01:57:47
training_start_epoch 0
training_epochs 28
training_f1-measure-overall 0.9861582260715648
training_upos-f1-measure-overall 0.9861582260715648
training_loss 11.012274742126465
validation_f1-measure-overall 0.937757841660614
validation_upos-f1-measure-overall 0.937757841660614
validation_loss 115.06605529785156
test_f1-measure-overall 0.9382485152737631
test_upos-f1-measure-overall 0.9382485152737631
/data/tagger/multitagger_multi_uni
training_duration 04:08:01
training_start_epoch 0
training_epochs 24
training_f1-measure-overall 0.9999266812000321
training_upos-f1-measure-overall 0.9999169053600431
training_xpos-f1-measure-overall 0.9999364570400212
training_loss 0.3747028410434723
validation_f1-measure-overall 0.9473516780658002
validation_upos-f1-measure-overall 0.94850485128037
validation_xpos-f1-measure-overall 0.9461985048512305
validation_loss 125.09725189208984
test_f1-measure-overall 0.9514065986610912
test_upos-f1-measure-overall 0.9538571883965072
test_xpos-f1-measure-overall 0.9489560089256752
/data/tagger/multitagger_multi_conll03
training_duration 04:04:48
training_start_epoch 0
training_epochs 33
training_f1-measure-overall 0.9997491886010651
training_xpos-f1-measure-overall 0.9998133787771881
training_chunk-f1-measure-overall 0.9996849984249421
training_loss 1.5664803981781006
validation_f1-measure-overall 0.9350369297372303
validation_xpos-f1-measure-overall 0.9547136014952189
validation_chunk-f1-measure-overall 0.9153602579792417
validation_loss 152.3376007080078
test_f1-measure-overall 0.9260302811989182
test_xpos-f1-measure-overall 0.950942177236948
test_chunk-f1-measure-overall 0.9011183851608884
/data/tagger/taskembtagger_task_embedding_tagger_xpos
training_duration 06:50:42
training_start_epoch 0
training_epochs 53
training_precision-overall 0.9996688822125732
training_recall-overall 0.9996688822125732
training_f1-measure-overall 0.9996688822125233
training_loss 0.7365136742591858
validation_precision-overall 0.9505274467669467
validation_recall-overall 0.9505274467669467
validation_f1-measure-overall 0.9505274467668967
validation_loss 179.13174438476562
test_precision-overall 0.9481095277719992
test_recall-overall 0.9481095277719992
test_f1-measure-overall 0.9481095277719492
/data/tagger/taskembtagger_task_embedding_tagger_upos
training_duration 03:10:43
training_start_epoch 0
training_epochs 28
training_precision-overall 0.9998716869160752
training_recall-overall 0.9998716869160752
training_f1-measure-overall 0.9998716869160252
training_loss 0.3576161563396454
validation_precision-overall 0.951771331281514
validation_recall-overall 0.951771331281514
validation_f1-measure-overall 0.9517713312814641
validation_loss 143.30697631835938
test_precision-overall 0.9542605899530794
test_recall-overall 0.9542605899530794
test_f1-measure-overall 0.9542605899530294
/data/tagger/taskembtagger_task_embedding_tagger_uni
training_duration 02:59:44
training_start_epoch 0
training_epochs 25
training_precision-overall 0.9998851338801287
training_recall-overall 0.9998851338801287
training_f1-measure-overall 0.9998851338800787
training_loss 0.26874402165412903
validation_precision-overall 0.9496779067917925
validation_recall-overall 0.9496779067917925
validation_f1-measure-overall 0.9496779067917427
validation_loss 181.84857177734375
test_precision-overall 0.9522633088938476
test_recall-overall 0.9522633088938476
test_f1-measure-overall 0.9522633088937976
/data/tagger/taskembtagger_task_embedding_tagger_conll03
training_duration 04:08:34
training_start_epoch 0
training_epochs 32
training_precision-overall 0.9997463976945244
training_recall-overall 0.9997694471342279
training_f1-measure-overall 0.9997579222814749
training_loss 0.8358157277107239
validation_precision-overall 0.9438297098625938
validation_recall-overall 0.9425932891477191
validation_f1-measure-overall 0.9432110943106764
validation_loss 188.56341552734375
test_precision-overall 0.9369850584636998
test_recall-overall 0.9353151705499964
test_f1-measure-overall 0.9361493698277128
/data/tagger/taskembtagger_task_embedding_tagger_uposchunk
training_duration 03:28:51
training_start_epoch 0
training_epochs 32
training_precision-overall 0.9997785380946573
training_recall-overall 0.9997849558999115
training_f1-measure-overall 0.9997817469869351
training_loss 0.8021429181098938
validation_precision-overall 0.9475553868264772
validation_recall-overall 0.9499768914987902
validation_f1-measure-overall 0.9487645940808623
validation_loss 164.17059326171875
test_precision-overall 0.9495742059878957
test_recall-overall 0.950312223621794
test_f1-measure-overall 0.9499430714620088
/data/tagger/taskembtagger_task_prepend_embedding_tagger_xpos
training_duration 04:55:49
training_start_epoch 0
training_epochs 52
training_precision-overall 0.9998115401579855
training_recall-overall 0.9998115401579855
training_f1-measure-overall 0.9998115401579355
training_loss 0.2840873897075653
validation_precision-overall 0.9498395651889202
validation_recall-overall 0.9498395651889202
validation_f1-measure-overall 0.9498395651888702
validation_loss 148.66958618164062
test_precision-overall 0.951701282934672
test_recall-overall 0.951701282934672
test_f1-measure-overall 0.9517012829346221
/data/tagger/taskembtagger_task_prepend_embedding_tagger_upos
training_duration 02:11:23
training_start_epoch 0
training_epochs 25
training_precision-overall 0.9998957456193112
training_recall-overall 0.9998957456193112
training_f1-measure-overall 0.9998957456192612
training_loss 0.24794122576713562
validation_precision-overall 0.951181978914282
validation_recall-overall 0.951181978914282
validation_f1-measure-overall 0.9511819789142321
validation_loss 157.90658569335938
test_precision-overall 0.9541293434393149
test_recall-overall 0.9541293434393149
test_f1-measure-overall 0.9541293434392648
/data/tagger/taskembtagger_task_prepend_embedding_tagger_uni
training_duration 03:42:18
training_start_epoch 0
training_epochs 23
training_precision-overall 0.9998778020001369
training_recall-overall 0.9998778020001369
training_f1-measure-overall 0.9998778020000869
training_loss 0.24902941286563873
validation_precision-overall 0.9492404962621283
validation_recall-overall 0.9492404962621283
validation_f1-measure-overall 0.9492404962620783
validation_loss 173.94241333007812
test_precision-overall 0.9528003028431392
test_recall-overall 0.9527813197322282
test_f1-measure-overall 0.9527908111930803
/data/tagger/taskembtagger_task_prepend_embedding_tagger_conll03
training_duration 04:03:29
training_start_epoch 0
training_epochs 26
training_precision-overall 0.9995290180850468
training_recall-overall 0.9995388942684558
training_f1-measure-overall 0.9995339561523051
training_loss 1.0640742778778076
validation_precision-overall 0.9426486058260497
validation_recall-overall 0.9414259588321509
validation_f1-measure-overall 0.9420368856181929
validation_loss 186.9593048095703
test_precision-overall 0.9369745437501831
test_recall-overall 0.9344971148929954
test_f1-measure-overall 0.9357341895281409
/data/tagger/taskembtagger_task_prepend_embedding_tagger_uposchunk
training_duration 04:02:23
training_start_epoch 0
training_epochs 34
training_precision-overall 0.9997977975986058
training_recall-overall 0.9998138424208188
training_f1-measure-overall 0.9998058199452908
training_loss 0.6707249879837036
validation_precision-overall 0.9482047944462523
validation_recall-overall 0.9506021803550553
validation_f1-measure-overall 0.949401973961041
validation_loss 170.69989013671875
test_precision-overall 0.9488182646444075
test_recall-overall 0.9489454077667301
test_f1-measure-overall 0.9488818319464601