# Extract hidden representations from flair's pretrained Chunking model

In [6]:
from flair.data import Sentence
from flair.models import SequenceTagger
from flair.models import TextClassifier

from flair.data import TaggedCorpus
from flair.data_fetcher import  NLPTaskDataFetcher, NLPTask
import torch

In [7]:
from pymongo import MongoClient

# MongoClient() is called without arguments, so pymongo's default connection
# settings are used (no host, port or credentials are configured here).
client = MongoClient()

# Database handle; the 'flair_chunk' collection used by this notebook lives in it.
db = client['glvis_db']

In [8]:
# Collection that the extraction loop further down fills with one document per
# predicted span (text, tag, score, token count and averaged hidden state).
db_col = db['flair_chunk']

In [4]:
# Load flair's pretrained 'chunk' sequence tagger. On first use the weights are
# downloaded (about 248 MB in the recorded log) and cached under ~/.flair/models.
chunk_tagger = SequenceTagger.load('chunk')

2019-03-20 12:40:07,155 https://s3.eu-central-1.amazonaws.com/alan-nlp/resources/models-v0.2/NP-conll2000--h256-l1-b32-%2Bnews-forward%2Bnews-backward--v0.2/en-chunk-conll2000-v0.2.pt not found in cache, downloading to /tmp/tmp0l09i918


100%|██████████| 247739475/247739475 [00:59<00:00, 4161783.21B/s]

2019-03-20 12:41:07,279 copying /tmp/tmp0l09i918 to cache at /home/snie/.flair/models/en-chunk-conll2000-v0.2.pt
2019-03-20 12:41:07,430 removing temp file /tmp/tmp0l09i918
2019-03-20 12:41:07,431 loading file /home/snie/.flair/models/en-chunk-conll2000-v0.2.pt





In [3]:
# Load the CoNLL-2000 corpus through flair's data fetcher. The recorded log
# shows a train file and a test file but no dev file ("Dev: None").
corpus: TaggedCorpus = NLPTaskDataFetcher.load_corpus(NLPTask.CONLL_2000)

2019-03-20 13:13:10,586 Reading data from /home/snie/.flair/datasets/conll_2000
2019-03-20 13:13:10,586 Train: /home/snie/.flair/datasets/conll_2000/train.txt
2019-03-20 13:13:10,586 Dev: None
2019-03-20 13:13:10,587 Test: /home/snie/.flair/datasets/conll_2000/test.txt


In [4]:
# Tag type that the extraction loop passes to sentence.get_spans() to read the
# predicted spans back from each sentence.
tag_type = 'np'
# NOTE(review): tag_dictionary is not used by the extraction cells of this
# section; the training section further down builds its own copy.
tag_dictionary = corpus.make_tag_dictionary(tag_type=tag_type)

In [9]:
# Distinct 'tag' values over every document currently stored in the collection.
tag_set = {record['tag'] for record in db_col.find()}

In [11]:
# Show the distinct tags in sorted order. Iteration order of a set of strings
# can change between kernel sessions (string hashing is randomised), so sorting
# keeps the displayed list reproducible across re-runs.
sorted(tag_set)

['VP',
 'CONJP',
 'PRT',
 'ADVP',
 'UCP',
 'SBAR',
 'NP',
 'LST',
 'PP',
 'INTJ',
 'ADJP']

In [10]:
# Number of sentences returned by corpus.get_all_sentences() (10948 in the
# recorded output); this is also the number of iterations of the extraction loop.
print(len(corpus.get_all_sentences()))

10948


In [23]:
# WARNING: destructive. Drops the whole 'flair_chunk' collection, presumably so
# that the extraction loop below starts from an empty collection.
# NOTE(review): the recorded execution counts (In [23] here, In [9]/In [11] for
# the tag listing above) show the cells were not run top to bottom.
db_col.drop()

In [None]:
# For every sentence of the corpus: run the pretrained chunk tagger, capture the
# tensor that enters the tagger's final linear layer, and store one MongoDB
# document per predicted span.
for i, sentence in enumerate(corpus.get_all_sentences()):
    print(f'Start sentence {i}')

    # Buffer that receives the input of the final linear layer. Its width is read
    # from the layer itself instead of being hard-coded (it was 512 originally).
    # Assumes predict() feeds the sentence as a batch of one, so the layer input
    # is (len(sentence), 1, in_features); copy_ raises if the shape differs.
    hidden_states = torch.zeros(len(sentence), 1, chunk_tagger.linear.in_features)

    def hook(module, inputs):
        """Forward pre-hook: copy the linear layer's input into hidden_states."""
        # `inputs` is the tuple of positional arguments given to the layer; the
        # parameter is no longer called `i`, which shadowed the loop index.
        hidden_states.copy_(inputs[0].data)

    h = chunk_tagger.linear.register_forward_pre_hook(hook)
    try:
        chunk_tagger.predict(sentence)
    finally:
        # Always detach the hook, even if predict() raises or the cell is
        # interrupted; a leftover hook would also fire on later predictions.
        h.remove()

    spans = sentence.get_spans(tag_type)

    # Information to store: the predicted spans, their labels, scores and hidden states.
    # If a span covers several tokens, store the mean of their hidden states
    # and record the number of tokens in the span.
    entries = []
    for span in spans:
        entry = {}
        entry['text'] = span.text
        entry['tag'] = span.tag
        entry['score'] = span.score
        entry['token_num'] = len(span.tokens)

        # The -1 turns token.idx into a 0-based row index of hidden_states
        # (assumes flair numbers tokens from 1).
        idx = [token.idx - 1 for token in span.tokens]
        entry['linear_layer_state'] = hidden_states[idx, :, :].mean(dim=0).squeeze().tolist()

        entries.append(entry)

    # One database round trip per sentence instead of one per span. insert_many
    # rejects an empty list, so sentences without spans are skipped.
    if entries:
        db_col.insert_many(entries)

    print(f'Finish sentence {i}')

# Train chunk model

In [1]:
from flair.data import TaggedCorpus
from flair.data_fetcher import  NLPTaskDataFetcher, NLPTask
from flair.embeddings import TokenEmbeddings, WordEmbeddings, StackedEmbeddings, FlairEmbeddings
from typing import List

Better speed can be achieved with apex installed from https://www.github.com/nvidia/apex.


In [2]:
# 1. get the corpus: CoNLL-2000 via flair's data fetcher. The recorded log shows
#    a train file and a test file but no dev file ("Dev: None").
corpus: TaggedCorpus = NLPTaskDataFetcher.load_corpus(NLPTask.CONLL_2000)

2019-03-17 23:28:59,562 Reading data from /home/snie/.flair/datasets/conll_2000
2019-03-17 23:28:59,562 Train: /home/snie/.flair/datasets/conll_2000/train.txt
2019-03-17 23:28:59,563 Dev: None
2019-03-17 23:28:59,563 Test: /home/snie/.flair/datasets/conll_2000/test.txt


In [3]:
# 2. what tag do we want to predict? This value is passed both to
#    make_tag_dictionary() and to the SequenceTagger constructor below.
#    NOTE(review): presumably 'np' names the chunk-label column of the
#    CoNLL-2000 corpus -- confirm against flair's column mapping.
tag_type = 'np'

In [4]:
# 3. make the tag dictionary from the corpus for the chosen tag_type; it is
#    handed to the SequenceTagger constructor below.
tag_dictionary = corpus.make_tag_dictionary(tag_type=tag_type)

In [5]:
# initialize embeddings: one word-level embedding ('extvec') followed by the
# forward and backward Flair language-model embeddings, stacked in that order
embedding_types: List[TokenEmbeddings] = [WordEmbeddings('extvec')]
embedding_types += [
    FlairEmbeddings(lm_name) for lm_name in ('news-forward', 'news-backward')
]

embeddings: StackedEmbeddings = StackedEmbeddings(embeddings=embedding_types)

In [6]:
# initialize sequence tagger
# NOTE(review): this import sits in the middle of the notebook; the import cell
# at the top of the section is the conventional place for it.
from flair.models import SequenceTagger

# Build the tagger from the stacked embeddings and the tag dictionary created
# above, with hidden_size=256.
# NOTE(review): the pretrained model file loaded in the extraction section is
# named "...-h256-l1-...", which suggests the same hidden size -- confirm.
tagger: SequenceTagger = SequenceTagger(hidden_size=256,
                                        embeddings=embeddings,
                                        tag_dictionary=tag_dictionary,
                                        tag_type=tag_type)

In [7]:
# initialize trainer
# NOTE(review): this import sits in the middle of the notebook; the import cell
# at the top of the section is the conventional place for it.
from flair.trainers import ModelTrainer

trainer: ModelTrainer = ModelTrainer(tagger, corpus)

# Train for at most 150 epochs; 'models/flair/np-chunking' is passed as the
# first argument (presumably the output directory -- confirm). The call is the
# cell's last expression, so its return value is displayed: in the recorded
# output, a dict with 'test_score' and 'dev_score_history'.
trainer.train('models/flair/np-chunking',
              max_epochs=150)

2019-03-17 23:29:17,911 ----------------------------------------------------------------------------------------------------
2019-03-17 23:29:17,911 Evaluation method: MICRO_F1_SCORE
2019-03-17 23:29:17,945 ----------------------------------------------------------------------------------------------------
2019-03-17 23:29:18,634 epoch 1 - iter 0/252 - loss 115.07946777
2019-03-17 23:29:35,887 epoch 1 - iter 25/252 - loss 59.17966197
2019-03-17 23:29:53,432 epoch 1 - iter 50/252 - loss 43.37734552
2019-03-17 23:30:10,464 epoch 1 - iter 75/252 - loss 35.03818862
2019-03-17 23:30:28,253 epoch 1 - iter 100/252 - loss 29.57320743
2019-03-17 23:30:45,902 epoch 1 - iter 125/252 - loss 25.79143439
2019-03-17 23:31:03,494 epoch 1 - iter 150/252 - loss 23.05912499
2019-03-17 23:31:21,495 epoch 1 - iter 175/252 - loss 20.92689903
2019-03-17 23:31:39,219 epoch 1 - iter 200/252 - loss 19.28091297
2019-03-17 23:31:56,303 epoch 1 - iter 225/252 - loss 17.88000640
2019-03-17 23:32:14,494 epoch 1 - it

2019-03-17 23:43:42,181 EPOCH 7 done: loss 2.4415 - lr 0.1000 - bad epochs 0
2019-03-17 23:43:51,894 DEV  : loss 1.68751574 - f-score 0.9574 - acc 0.9183
2019-03-17 23:44:09,700 TEST : loss 1.94558537 - f-score 0.9573 - acc 0.9181
2019-03-17 23:44:25,233 ----------------------------------------------------------------------------------------------------
2019-03-17 23:44:25,778 epoch 8 - iter 0/252 - loss 2.90777588
2019-03-17 23:44:31,226 epoch 8 - iter 25/252 - loss 2.27331991
2019-03-17 23:44:35,478 epoch 8 - iter 50/252 - loss 2.40950742
2019-03-17 23:44:40,311 epoch 8 - iter 75/252 - loss 2.44182437
2019-03-17 23:44:47,138 epoch 8 - iter 100/252 - loss 2.38026772
2019-03-17 23:44:54,299 epoch 8 - iter 125/252 - loss 2.37121129
2019-03-17 23:45:01,141 epoch 8 - iter 150/252 - loss 2.35108398
2019-03-17 23:45:07,737 epoch 8 - iter 175/252 - loss 2.32164540
2019-03-17 23:45:14,413 epoch 8 - iter 200/252 - loss 2.30462948
2019-03-17 23:45:21,019 epoch 8 - iter 225/252 - loss 2.30583923

2019-03-17 23:56:15,293 epoch 14 - iter 250/252 - loss 1.61858657
2019-03-17 23:56:15,474 ----------------------------------------------------------------------------------------------------
2019-03-17 23:56:15,475 EPOCH 14 done: loss 1.6194 - lr 0.1000 - bad epochs 0
2019-03-17 23:56:25,115 DEV  : loss 1.45441425 - f-score 0.9628 - acc 0.9284
2019-03-17 23:56:45,738 TEST : loss 1.78657722 - f-score 0.9614 - acc 0.9258
2019-03-17 23:57:01,550 ----------------------------------------------------------------------------------------------------
2019-03-17 23:57:01,772 epoch 15 - iter 0/252 - loss 1.91809320
2019-03-17 23:57:07,243 epoch 15 - iter 25/252 - loss 1.61261233
2019-03-17 23:57:12,830 epoch 15 - iter 50/252 - loss 1.69123557
2019-03-17 23:57:18,271 epoch 15 - iter 75/252 - loss 1.60682987
2019-03-17 23:57:23,184 epoch 15 - iter 100/252 - loss 1.59830611
2019-03-17 23:57:27,743 epoch 15 - iter 125/252 - loss 1.59793631
2019-03-17 23:57:34,440 epoch 15 - iter 150/252 - loss 1.6002

2019-03-18 00:07:53,150 epoch 21 - iter 175/252 - loss 1.30064517
2019-03-18 00:07:59,990 epoch 21 - iter 200/252 - loss 1.29456116
2019-03-18 00:08:06,675 epoch 21 - iter 225/252 - loss 1.31048936
2019-03-18 00:08:13,426 epoch 21 - iter 250/252 - loss 1.30656933
2019-03-18 00:08:13,603 ----------------------------------------------------------------------------------------------------
2019-03-18 00:08:13,604 EPOCH 21 done: loss 1.3061 - lr 0.1000 - bad epochs 0
2019-03-18 00:08:23,101 DEV  : loss 1.42353547 - f-score 0.9651 - acc 0.9325
2019-03-18 00:08:44,910 TEST : loss 1.85697222 - f-score 0.9628 - acc 0.9284
2019-03-18 00:08:44,912 ----------------------------------------------------------------------------------------------------
2019-03-18 00:08:45,233 epoch 22 - iter 0/252 - loss 1.38127995
2019-03-18 00:08:51,918 epoch 22 - iter 25/252 - loss 1.24377674
2019-03-18 00:08:58,560 epoch 22 - iter 50/252 - loss 1.25182308
2019-03-18 00:09:05,304 epoch 22 - iter 75/252 - loss 1.2514

2019-03-18 00:19:39,438 epoch 28 - iter 100/252 - loss 0.98534920
2019-03-18 00:19:46,200 epoch 28 - iter 125/252 - loss 1.00326335
2019-03-18 00:19:52,896 epoch 28 - iter 150/252 - loss 1.03841952
2019-03-18 00:19:59,233 epoch 28 - iter 175/252 - loss 1.02182412
2019-03-18 00:20:05,212 epoch 28 - iter 200/252 - loss 1.01105713
2019-03-18 00:20:10,767 epoch 28 - iter 225/252 - loss 1.02168390
2019-03-18 00:20:16,395 epoch 28 - iter 250/252 - loss 1.02908807
2019-03-18 00:20:16,508 ----------------------------------------------------------------------------------------------------
2019-03-18 00:20:16,509 EPOCH 28 done: loss 1.0284 - lr 0.1000 - bad epochs 0
2019-03-18 00:20:24,566 DEV  : loss 1.43233895 - f-score 0.9654 - acc 0.9333
2019-03-18 00:20:42,543 TEST : loss 1.90831208 - f-score 0.9616 - acc 0.9262
2019-03-18 00:20:58,002 ----------------------------------------------------------------------------------------------------
2019-03-18 00:20:58,308 epoch 29 - iter 0/252 - loss 1.6

2019-03-18 00:31:25,408 epoch 35 - iter 25/252 - loss 1.11239253
2019-03-18 00:31:32,114 epoch 35 - iter 50/252 - loss 1.05585547
2019-03-18 00:31:38,839 epoch 35 - iter 75/252 - loss 1.00224012
2019-03-18 00:31:45,388 epoch 35 - iter 100/252 - loss 0.94685238
2019-03-18 00:31:51,843 epoch 35 - iter 125/252 - loss 0.91714160
2019-03-18 00:31:58,185 epoch 35 - iter 150/252 - loss 0.96495555
2019-03-18 00:32:04,468 epoch 35 - iter 175/252 - loss 0.95695243
2019-03-18 00:32:11,222 epoch 35 - iter 200/252 - loss 0.97198446
2019-03-18 00:32:17,885 epoch 35 - iter 225/252 - loss 0.96315103
2019-03-18 00:32:24,422 epoch 35 - iter 250/252 - loss 0.95320518
2019-03-18 00:32:24,556 ----------------------------------------------------------------------------------------------------
2019-03-18 00:32:24,565 EPOCH 35 done: loss 0.9530 - lr 0.1000 - bad epochs 0
2019-03-18 00:32:34,169 DEV  : loss 1.49393773 - f-score 0.9663 - acc 0.9348
2019-03-18 00:32:54,456 TEST : loss 2.03218269 - f-score 0.9624

2019-03-18 00:43:11,454 ----------------------------------------------------------------------------------------------------
2019-03-18 00:43:11,686 epoch 42 - iter 0/252 - loss 1.05445588
2019-03-18 00:43:16,905 epoch 42 - iter 25/252 - loss 0.89435651
2019-03-18 00:43:22,201 epoch 42 - iter 50/252 - loss 0.88072330
2019-03-18 00:43:27,811 epoch 42 - iter 75/252 - loss 0.83584705
2019-03-18 00:43:33,128 epoch 42 - iter 100/252 - loss 0.84543009
2019-03-18 00:43:38,620 epoch 42 - iter 125/252 - loss 0.86543511
2019-03-18 00:43:44,173 epoch 42 - iter 150/252 - loss 0.84524968
2019-03-18 00:43:50,594 epoch 42 - iter 175/252 - loss 0.83855304
2019-03-18 00:43:57,344 epoch 42 - iter 200/252 - loss 0.84644408
2019-03-18 00:44:03,969 epoch 42 - iter 225/252 - loss 0.83253302
2019-03-18 00:44:10,584 epoch 42 - iter 250/252 - loss 0.82305509
2019-03-18 00:44:10,745 ----------------------------------------------------------------------------------------------------
2019-03-18 00:44:10,746 EPOCH

2019-03-18 00:54:01,017 DEV  : loss 1.67239141 - f-score 0.9647 - acc 0.9319
2019-03-18 00:54:16,909 TEST : loss 2.18771577 - f-score 0.9630 - acc 0.9286
2019-03-18 00:54:16,911 ----------------------------------------------------------------------------------------------------
2019-03-18 00:54:17,160 epoch 49 - iter 0/252 - loss 0.67611146
2019-03-18 00:54:23,857 epoch 49 - iter 25/252 - loss 0.85158196
2019-03-18 00:54:30,433 epoch 49 - iter 50/252 - loss 0.74674031
2019-03-18 00:54:37,249 epoch 49 - iter 75/252 - loss 0.69522890
2019-03-18 00:54:43,739 epoch 49 - iter 100/252 - loss 0.68219233
2019-03-18 00:54:50,712 epoch 49 - iter 125/252 - loss 0.67266784
2019-03-18 00:54:57,602 epoch 49 - iter 150/252 - loss 0.67155901
2019-03-18 00:55:04,339 epoch 49 - iter 175/252 - loss 0.67334650
2019-03-18 00:55:11,033 epoch 49 - iter 200/252 - loss 0.67255216
2019-03-18 00:55:17,571 epoch 49 - iter 225/252 - loss 0.66766674
2019-03-18 00:55:24,483 epoch 49 - iter 250/252 - loss 0.67734847


2019-03-18 01:05:31,664 ----------------------------------------------------------------------------------------------------
2019-03-18 01:05:31,665 EPOCH 55 done: loss 0.6314 - lr 0.1000 - bad epochs 0
2019-03-18 01:05:41,536 DEV  : loss 1.75118661 - f-score 0.9654 - acc 0.9332
2019-03-18 01:06:03,206 TEST : loss 2.37548447 - f-score 0.9629 - acc 0.9285
2019-03-18 01:06:21,490 ----------------------------------------------------------------------------------------------------
2019-03-18 01:06:21,874 epoch 56 - iter 0/252 - loss 0.48036337
2019-03-18 01:06:27,340 epoch 56 - iter 25/252 - loss 0.59999600
2019-03-18 01:06:32,945 epoch 56 - iter 50/252 - loss 0.61787825
2019-03-18 01:06:38,303 epoch 56 - iter 75/252 - loss 0.59671608
2019-03-18 01:06:43,782 epoch 56 - iter 100/252 - loss 0.57741624
2019-03-18 01:06:50,525 epoch 56 - iter 125/252 - loss 0.61067082
2019-03-18 01:06:57,127 epoch 56 - iter 150/252 - loss 0.62778594
2019-03-18 01:07:03,714 epoch 56 - iter 175/252 - loss 0.6531

2019-03-18 01:16:56,695 epoch 62 - iter 175/252 - loss 0.53124483
2019-03-18 01:17:01,751 epoch 62 - iter 200/252 - loss 0.54173053
2019-03-18 01:17:05,974 epoch 62 - iter 225/252 - loss 0.52458798
2019-03-18 01:17:10,740 epoch 62 - iter 250/252 - loss 0.52728567
2019-03-18 01:17:10,885 ----------------------------------------------------------------------------------------------------
2019-03-18 01:17:10,886 EPOCH 62 done: loss 0.5267 - lr 0.0500 - bad epochs 0
2019-03-18 01:17:20,920 DEV  : loss 1.76516414 - f-score 0.9677 - acc 0.9375
2019-03-18 01:17:43,384 TEST : loss 2.42677307 - f-score 0.9642 - acc 0.9310
2019-03-18 01:18:00,018 ----------------------------------------------------------------------------------------------------
2019-03-18 01:18:00,249 epoch 63 - iter 0/252 - loss 0.10931206
2019-03-18 01:18:06,732 epoch 63 - iter 25/252 - loss 0.45053110
2019-03-18 01:18:13,492 epoch 63 - iter 50/252 - loss 0.42269150
2019-03-18 01:18:20,269 epoch 63 - iter 75/252 - loss 0.4262

2019-03-18 01:27:52,029 epoch 69 - iter 75/252 - loss 0.42771632
2019-03-18 01:27:58,773 epoch 69 - iter 100/252 - loss 0.44503409
2019-03-18 01:28:05,689 epoch 69 - iter 125/252 - loss 0.45002533
2019-03-18 01:28:12,395 epoch 69 - iter 150/252 - loss 0.46328723
2019-03-18 01:28:19,251 epoch 69 - iter 175/252 - loss 0.45479031
2019-03-18 01:28:26,048 epoch 69 - iter 200/252 - loss 0.48183334
2019-03-18 01:28:32,848 epoch 69 - iter 225/252 - loss 0.48467682
2019-03-18 01:28:39,573 epoch 69 - iter 250/252 - loss 0.48606820
2019-03-18 01:28:39,749 ----------------------------------------------------------------------------------------------------
2019-03-18 01:28:39,750 EPOCH 69 done: loss 0.4859 - lr 0.0250 - bad epochs 1
2019-03-18 01:28:49,456 DEV  : loss 1.77473772 - f-score 0.9686 - acc 0.9392
2019-03-18 01:29:11,313 TEST : loss 2.41981173 - f-score 0.9649 - acc 0.9322
2019-03-18 01:29:11,314 --------------------------------------------------------------------------------------------

2019-03-18 01:39:02,232 epoch 76 - iter 0/252 - loss 0.87012577
2019-03-18 01:39:08,932 epoch 76 - iter 25/252 - loss 0.41196173
2019-03-18 01:39:15,756 epoch 76 - iter 50/252 - loss 0.42539312
2019-03-18 01:39:22,122 epoch 76 - iter 75/252 - loss 0.44127733
2019-03-18 01:39:28,808 epoch 76 - iter 100/252 - loss 0.41969630
2019-03-18 01:39:34,751 epoch 76 - iter 125/252 - loss 0.40938221
2019-03-18 01:39:40,078 epoch 76 - iter 150/252 - loss 0.38961621
2019-03-18 01:39:45,644 epoch 76 - iter 175/252 - loss 0.38573451
2019-03-18 01:39:51,123 epoch 76 - iter 200/252 - loss 0.40088592
2019-03-18 01:39:56,687 epoch 76 - iter 225/252 - loss 0.40229823
2019-03-18 01:40:02,445 epoch 76 - iter 250/252 - loss 0.39813220
2019-03-18 01:40:02,591 ----------------------------------------------------------------------------------------------------
2019-03-18 01:40:02,592 EPOCH 76 done: loss 0.3983 - lr 0.0250 - bad epochs 2
2019-03-18 01:40:10,549 DEV  : loss 1.82789660 - f-score 0.9680 - acc 0.9380

2019-03-18 01:49:35,908 DEV  : loss 1.85016775 - f-score 0.9682 - acc 0.9384
2019-03-18 01:49:58,018 TEST : loss 2.54591465 - f-score 0.9640 - acc 0.9305
2019-03-18 01:50:13,084 ----------------------------------------------------------------------------------------------------
2019-03-18 01:50:13,685 epoch 83 - iter 0/252 - loss 0.45771861
2019-03-18 01:50:19,086 epoch 83 - iter 25/252 - loss 0.37230780
2019-03-18 01:50:24,596 epoch 83 - iter 50/252 - loss 0.39066860
2019-03-18 01:50:30,166 epoch 83 - iter 75/252 - loss 0.37833085
2019-03-18 01:50:35,474 epoch 83 - iter 100/252 - loss 0.36410244
2019-03-18 01:50:40,849 epoch 83 - iter 125/252 - loss 0.36399973
2019-03-18 01:50:47,382 epoch 83 - iter 150/252 - loss 0.37296017
2019-03-18 01:50:54,253 epoch 83 - iter 175/252 - loss 0.36790828
2019-03-18 01:51:00,932 epoch 83 - iter 200/252 - loss 0.37709492
2019-03-18 01:51:07,595 epoch 83 - iter 225/252 - loss 0.37545536
2019-03-18 01:51:14,168 epoch 83 - iter 250/252 - loss 0.37720644


2019-03-18 02:01:03,959 ----------------------------------------------------------------------------------------------------
2019-03-18 02:01:03,960 EPOCH 89 done: loss 0.3747 - lr 0.0125 - bad epochs 0
2019-03-18 02:01:13,846 DEV  : loss 1.88343143 - f-score 0.9687 - acc 0.9394
2019-03-18 02:01:36,262 TEST : loss 2.58502412 - f-score 0.9646 - acc 0.9316
2019-03-18 02:01:36,264 ----------------------------------------------------------------------------------------------------
2019-03-18 02:01:36,636 epoch 90 - iter 0/252 - loss 0.18564129
2019-03-18 02:01:43,387 epoch 90 - iter 25/252 - loss 0.65261563
2019-03-18 02:01:50,235 epoch 90 - iter 50/252 - loss 0.47972836
2019-03-18 02:01:56,856 epoch 90 - iter 75/252 - loss 0.43740006
2019-03-18 02:02:03,651 epoch 90 - iter 100/252 - loss 0.42427865
2019-03-18 02:02:10,408 epoch 90 - iter 125/252 - loss 0.41174400
2019-03-18 02:02:16,923 epoch 90 - iter 150/252 - loss 0.40348161
2019-03-18 02:02:23,430 epoch 90 - iter 175/252 - loss 0.3838

2019-03-18 02:11:44,913 epoch 96 - iter 175/252 - loss 0.36410582
2019-03-18 02:11:51,647 epoch 96 - iter 200/252 - loss 0.35694413
2019-03-18 02:11:57,995 epoch 96 - iter 225/252 - loss 0.38172091
2019-03-18 02:12:04,639 epoch 96 - iter 250/252 - loss 0.37444542
2019-03-18 02:12:04,804 ----------------------------------------------------------------------------------------------------
2019-03-18 02:12:04,805 EPOCH 96 done: loss 0.3741 - lr 0.0063 - bad epochs 0
2019-03-18 02:12:14,670 DEV  : loss 1.88458323 - f-score 0.9682 - acc 0.9383
2019-03-18 02:12:37,162 TEST : loss 2.62432718 - f-score 0.9640 - acc 0.9305
2019-03-18 02:12:37,164 ----------------------------------------------------------------------------------------------------
2019-03-18 02:12:37,421 epoch 97 - iter 0/252 - loss 0.27676380
2019-03-18 02:12:44,105 epoch 97 - iter 25/252 - loss 0.38975389
2019-03-18 02:12:50,527 epoch 97 - iter 50/252 - loss 0.36241199
2019-03-18 02:12:57,150 epoch 97 - iter 75/252 - loss 0.3368

2019-03-18 02:22:18,214 epoch 103 - iter 75/252 - loss 0.29775273
2019-03-18 02:22:24,983 epoch 103 - iter 100/252 - loss 0.31117548
2019-03-18 02:22:31,646 epoch 103 - iter 125/252 - loss 0.33452622
2019-03-18 02:22:38,358 epoch 103 - iter 150/252 - loss 0.34798793
2019-03-18 02:22:45,067 epoch 103 - iter 175/252 - loss 0.34291075
2019-03-18 02:22:51,651 epoch 103 - iter 200/252 - loss 0.34017011
2019-03-18 02:22:58,155 epoch 103 - iter 225/252 - loss 0.33411163
2019-03-18 02:23:04,636 epoch 103 - iter 250/252 - loss 0.33395518
2019-03-18 02:23:04,816 ----------------------------------------------------------------------------------------------------
2019-03-18 02:23:04,817 EPOCH 103 done: loss 0.3337 - lr 0.0063 - bad epochs 3
2019-03-18 02:23:14,745 DEV  : loss 1.88585496 - f-score 0.9680 - acc 0.9379
2019-03-18 02:23:33,486 TEST : loss 2.63816810 - f-score 0.9641 - acc 0.9307
Epoch   102: reducing learning rate of group 0 to 3.1250e-03.
2019-03-18 02:23:33,488 ---------------------

2019-03-18 02:32:47,437 TEST : loss 2.65898895 - f-score 0.9641 - acc 0.9308
2019-03-18 02:32:47,439 ----------------------------------------------------------------------------------------------------
2019-03-18 02:32:47,813 epoch 110 - iter 0/252 - loss 1.07988238
2019-03-18 02:32:54,407 epoch 110 - iter 25/252 - loss 0.38733920
2019-03-18 02:33:01,270 epoch 110 - iter 50/252 - loss 0.37071088
2019-03-18 02:33:08,216 epoch 110 - iter 75/252 - loss 0.39064711
2019-03-18 02:33:14,710 epoch 110 - iter 100/252 - loss 0.38503901
2019-03-18 02:33:21,418 epoch 110 - iter 125/252 - loss 0.37708403
2019-03-18 02:33:28,255 epoch 110 - iter 150/252 - loss 0.38127676
2019-03-18 02:33:34,831 epoch 110 - iter 175/252 - loss 0.37965028
2019-03-18 02:33:41,598 epoch 110 - iter 200/252 - loss 0.39601203
2019-03-18 02:33:46,563 epoch 110 - iter 225/252 - loss 0.39174918
2019-03-18 02:33:51,934 epoch 110 - iter 250/252 - loss 0.39652019
2019-03-18 02:33:52,151 ------------------------------------------

2019-03-18 02:42:54,008 epoch 116 - iter 225/252 - loss 0.37198618
2019-03-18 02:43:00,741 epoch 116 - iter 250/252 - loss 0.37387157
2019-03-18 02:43:00,892 ----------------------------------------------------------------------------------------------------
2019-03-18 02:43:00,893 EPOCH 116 done: loss 0.3746 - lr 0.0004 - bad epochs 0
2019-03-18 02:43:10,772 DEV  : loss 1.90232861 - f-score 0.9683 - acc 0.9386
2019-03-18 02:43:33,067 TEST : loss 2.66108942 - f-score 0.9643 - acc 0.9311
2019-03-18 02:43:33,069 ----------------------------------------------------------------------------------------------------
2019-03-18 02:43:33,328 epoch 117 - iter 0/252 - loss 0.55773926
2019-03-18 02:43:40,057 epoch 117 - iter 25/252 - loss 0.40707734
2019-03-18 02:43:46,612 epoch 117 - iter 50/252 - loss 0.41808533
2019-03-18 02:43:53,041 epoch 117 - iter 75/252 - loss 0.35383529
2019-03-18 02:43:59,719 epoch 117 - iter 100/252 - loss 0.38286741
2019-03-18 02:44:06,500 epoch 117 - iter 125/252 - lo

2019-03-18 02:53:26,913 epoch 123 - iter 100/252 - loss 0.35942106
2019-03-18 02:53:33,517 epoch 123 - iter 125/252 - loss 0.36980523
2019-03-18 02:53:40,228 epoch 123 - iter 150/252 - loss 0.37346624
2019-03-18 02:53:46,613 epoch 123 - iter 175/252 - loss 0.37139376
2019-03-18 02:53:53,313 epoch 123 - iter 200/252 - loss 0.36535145
2019-03-18 02:54:00,048 epoch 123 - iter 225/252 - loss 0.35931171
2019-03-18 02:54:06,845 epoch 123 - iter 250/252 - loss 0.35805020
2019-03-18 02:54:07,019 ----------------------------------------------------------------------------------------------------
2019-03-18 02:54:07,020 EPOCH 123 done: loss 0.3578 - lr 0.0002 - bad epochs 1
2019-03-18 02:54:17,562 DEV  : loss 1.90360594 - f-score 0.9683 - acc 0.9386
2019-03-18 02:54:36,297 TEST : loss 2.66191983 - f-score 0.9642 - acc 0.9310
2019-03-18 02:54:36,299 ----------------------------------------------------------------------------------------------------
2019-03-18 02:54:36,518 epoch 124 - iter 0/252 -

{'test_score': 0.9643,
 'dev_score_history': [0.9271,
  0.9388,
  0.9475,
  0.9518,
  0.9543,
  0.9566,
  0.9574,
  0.9603,
  0.9598,
  0.9585,
  0.9606,
  0.9613,
  0.9629,
  0.9628,
  0.9628,
  0.9636,
  0.9649,
  0.9648,
  0.9628,
  0.9641,
  0.9651,
  0.9654,
  0.9656,
  0.964,
  0.9669,
  0.9645,
  0.9661,
  0.9654,
  0.966,
  0.9655,
  0.965,
  0.9662,
  0.9654,
  0.9675,
  0.9663,
  0.9665,
  0.9659,
  0.9659,
  0.9654,
  0.9667,
  0.967,
  0.9647,
  0.9647,
  0.9676,
  0.9648,
  0.9658,
  0.9661,
  0.9647,
  0.9659,
  0.9643,
  0.9645,
  0.965,
  0.9657,
  0.966,
  0.9654,
  0.9666,
  0.9678,
  0.9662,
  0.9663,
  0.9672,
  0.968,
  0.9677,
  0.9676,
  0.9677,
  0.9674,
  0.9668,
  0.9674,
  0.9683,
  0.9686,
  0.9682,
  0.9682,
  0.9684,
  0.9676,
  0.968,
  0.9675,
  0.968,
  0.9685,
  0.9681,
  0.9684,
  0.9674,
  0.9682,
  0.9682,
  0.9683,
  0.9686,
  0.9681,
  0.9688,
  0.9688,
  0.968,
  0.9687,
  0.9688,
  0.9677,
  0.9677,
  0.968,
  0.968,
  0.9679,
  0.9682,
  0.9685