# Generating a Word Vector Model

In [1]:
# Notebook setup (IPython magics).
# Load the autoreload extension and switch it to mode 2, so imported modules
# are reloaded before each cell executes and edits to local .py files take
# effect without restarting the kernel.
%load_ext autoreload
%autoreload 2
# Render matplotlib figures inline in the notebook output
# (no plotting code is visible in this part of the notebook).
%matplotlib inline

In [2]:

import logging 
import multiprocessing
from datetime import datetime
import json

from gensim.models import Word2Vec
from gensim.test.utils import get_tmpfile
from gensim.models import KeyedVectors

from cltk.corpus.readers import get_corpus_reader 
from cltk.prosody.latin.string_utils import punctuation_for_spaces_dict
from cltk.stem.latin.j_v import JVReplacer
from cltk.tokenize.sentence import TokenizeSentence
from cltk.prosody.latin.scansion_constants import ScansionConstants
from cltk.tokenize.word import WordTokenizer


In [3]:
NAME = 'make_latin_web_vec'
LOG = logging.getLogger(NAME)
handler = logging.FileHandler('{}.log'.format(NAME)) 
handler.setLevel(logging.INFO)
formatter = logging.Formatter('%(name)s - %(levelname)s - %(message)s')
handler.setFormatter(formatter)
LOG.addHandler(handler)
logging.basicConfig(format='%(levelname)s : %(message)s', level=logging.INFO)

In [5]:
# Hyperparameters passed straight through to gensim's Word2Vec constructor.
# NOTE(review): 'size' and 'iter' are the keyword names this call uses; newer
# gensim releases are believed to have renamed them ('vector_size', 'epochs')
# -- confirm against the installed gensim version before upgrading.
keyword_params = {
    'size': 600,  # dimensionality of the word vectors
    'iter': 300,  # number of training epochs over the corpus
    'min_count': 3,  # Ignores all words with total frequency lower than this.
    'max_vocab_size': None,  # no cap on vocabulary size while scanning
    'ns_exponent': 0.75,  # the default, optimal for linguistic tasks; also try -0.5 for recommenders
    'alpha': 0.025,  # initial learning rate
    'min_alpha': 0.004,  # learning rate decays towards this value
    'sg': 1,  # skip gram
    'window': 10,  # number of surrounding words to consider
    # Leave one core free for the rest of the system, but never request fewer
    # than one worker: on a single-core machine cpu_count() - 1 would be 0.
    'workers': max(1, multiprocessing.cpu_count() - 1),
    'negative': 15,  # negative samples per positive example; 15 may be best
    'sample': 0.0001,  # downsampling threshold for frequent words (alternative noted: 0.00001)
}
# Record the exact configuration so the run can be matched to its log output.
LOG.info('Creating vector with parameters: %s', json.dumps(keyword_params))
# Builds the vocabulary and trains the model; with these settings this is a
# long-running cell (the captured log shows roughly 105-120s per epoch).
latin_lib_vec = Word2Vec(corpus_file='latin_library.preprocessed.cor', **keyword_params)

2019-03-06 00:07:44,150 : INFO : Creating vector with parameters: {"size": 600, "iter": 300, "min_count": 3, "max_vocab_size": null, "ns_exponent": 0.75, "alpha": 0.025, "min_alpha": 0.004, "sg": 1, "window": 10, "workers": 7, "negative": 15, "sample": 0.0001}
2019-03-06 00:07:44,152 : INFO : collecting all words and their counts
2019-03-06 00:07:44,153 : INFO : PROGRESS: at sentence #0, processed 0 words, keeping 0 word types
2019-03-06 00:07:44,231 : INFO : PROGRESS: at sentence #10000, processed 175859 words, keeping 23146 word types
2019-03-06 00:07:44,301 : INFO : PROGRESS: at sentence #20000, processed 342816 words, keeping 34831 word types
2019-03-06 00:07:44,387 : INFO : PROGRESS: at sentence #30000, processed 550570 words, keeping 44583 word types
2019-03-06 00:07:44,469 : INFO : PROGRESS: at sentence #40000, processed 753358 words, keeping 53519 word types
2019-03-06 00:07:44,553 : INFO : PROGRESS: at sentence #50000, processed 969282 words, keeping 60675 word types
2019-03-0

2019-03-06 00:09:48,717 : INFO : EPOCH 1 - PROGRESS: at 13.21% examples, 8194 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:09:48,719 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 00:09:49,241 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 00:09:49,488 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 00:09:50,521 : INFO : EPOCH 1 - PROGRESS: at 61.50% examples, 33855 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:09:50,522 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 00:09:50,697 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 00:09:52,089 : INFO : EPOCH 1 - PROGRESS: at 89.55% examples, 49970 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:09:52,090 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 00:09:53,298 : INFO : EPOCH 1 - PROGRESS: at 100.54% examples, 57331 words/s, in_qsize -1, out_qsize 1
20

2019-03-06 00:22:02,464 : INFO : EPOCH 7 - PROGRESS: at 89.55% examples, 51248 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:22:02,465 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 00:22:03,690 : INFO : EPOCH 7 - PROGRESS: at 100.54% examples, 58772 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:22:03,691 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 00:22:03,692 : INFO : EPOCH - 7 : training on 10306257 raw words (6933746 effective words) took 118.0s, 58771 effective words/s
2019-03-06 00:23:56,630 : INFO : EPOCH 8 - PROGRESS: at 15.03% examples, 8761 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:23:56,632 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 00:23:56,830 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 00:23:57,578 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 00:23:58,611 : INFO : EPOCH 8 - PROGRESS: at 59.12% exam

2019-03-06 00:35:24,798 : INFO : EPOCH 14 - PROGRESS: at 61.50% examples, 36482 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:35:24,799 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 00:35:25,099 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 00:35:25,861 : INFO : EPOCH 14 - PROGRESS: at 89.55% examples, 54039 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:35:25,861 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 00:35:27,398 : INFO : EPOCH 14 - PROGRESS: at 100.54% examples, 61765 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:35:27,399 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 00:35:27,399 : INFO : EPOCH - 14 : training on 10306257 raw words (6936678 effective words) took 112.3s, 61764 effective words/s
2019-03-06 00:37:17,101 : INFO : EPOCH 15 - PROGRESS: at 15.03% examples, 9026 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:37:17,103 : INFO : worker 

2019-03-06 00:48:25,240 : INFO : EPOCH 21 - PROGRESS: at 15.03% examples, 9299 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:48:25,241 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 00:48:25,333 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 00:48:25,724 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 00:48:26,706 : INFO : EPOCH 21 - PROGRESS: at 59.12% examples, 36713 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:48:26,707 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 00:48:26,925 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 00:48:27,963 : INFO : EPOCH 21 - PROGRESS: at 89.55% examples, 54903 words/s, in_qsize -1, out_qsize 1
2019-03-06 00:48:27,964 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 00:48:29,126 : INFO : EPOCH 21 - PROGRESS: at 100.54% examples, 62956 words/s, in_qsize -1, out_qsize 

2019-03-06 00:59:26,502 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 00:59:26,503 : INFO : EPOCH - 27 : training on 10306257 raw words (6934428 effective words) took 108.9s, 63675 effective words/s
2019-03-06 01:01:11,573 : INFO : EPOCH 28 - PROGRESS: at 15.03% examples, 9422 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:01:11,574 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 01:01:11,777 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 01:01:12,067 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 01:01:12,982 : INFO : EPOCH 28 - PROGRESS: at 59.12% examples, 37191 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:01:12,983 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 01:01:13,116 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 01:01:14,343 : INFO : EPOCH 28 - PROGRESS: at 89.55% examples, 55563 words/s

2019-03-06 01:12:06,062 : INFO : EPOCH 34 - PROGRESS: at 89.55% examples, 55934 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:12:06,063 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 01:12:07,523 : INFO : EPOCH 34 - PROGRESS: at 100.54% examples, 63947 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:12:07,524 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 01:12:07,525 : INFO : EPOCH - 34 : training on 10306257 raw words (6934890 effective words) took 108.4s, 63946 effective words/s
2019-03-06 01:13:51,767 : INFO : EPOCH 35 - PROGRESS: at 15.03% examples, 9492 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:13:51,768 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 01:13:52,423 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 01:13:52,432 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 01:13:53,542 : INFO : EPOCH 35 - PROGRESS: at 59.12%

2019-03-06 01:24:42,835 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 01:24:43,575 : INFO : EPOCH 41 - PROGRESS: at 89.55% examples, 56230 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:24:43,576 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 01:24:44,982 : INFO : EPOCH 41 - PROGRESS: at 100.54% examples, 64314 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:24:44,983 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 01:24:44,984 : INFO : EPOCH - 41 : training on 10306257 raw words (6935262 effective words) took 107.8s, 64313 effective words/s
2019-03-06 01:26:29,242 : INFO : EPOCH 42 - PROGRESS: at 15.03% examples, 9503 words/s, in_qsize -1, out_qsize 3
2019-03-06 01:26:29,243 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 01:26:29,244 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 01:26:29,402 : INFO : worker thread finished; awaiti

2019-03-06 01:37:16,242 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 01:37:16,511 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 01:37:17,457 : INFO : EPOCH 48 - PROGRESS: at 59.12% examples, 37641 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:37:17,458 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 01:37:17,512 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 01:37:18,543 : INFO : EPOCH 48 - PROGRESS: at 89.55% examples, 56370 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:37:18,544 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 01:37:19,867 : INFO : EPOCH 48 - PROGRESS: at 100.54% examples, 64524 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:37:19,868 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 01:37:19,869 : INFO : EPOCH - 48 : training on 10306257 raw words (6934794 effective words) took 107

2019-03-06 01:48:05,644 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 01:48:05,645 : INFO : EPOCH - 54 : training on 10306257 raw words (6935013 effective words) took 107.3s, 64606 effective words/s
2019-03-06 01:49:49,035 : INFO : EPOCH 55 - PROGRESS: at 15.03% examples, 9573 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:49:49,036 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 01:49:49,448 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 01:49:49,559 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 01:49:50,565 : INFO : EPOCH 55 - PROGRESS: at 59.12% examples, 37744 words/s, in_qsize -1, out_qsize 1
2019-03-06 01:49:50,566 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 01:49:50,973 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 01:49:51,877 : INFO : EPOCH 55 - PROGRESS: at 89.55% examples, 56400 words/s

2019-03-06 02:00:34,092 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 02:00:35,088 : INFO : EPOCH 61 - PROGRESS: at 89.55% examples, 56707 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:00:35,088 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 02:00:36,406 : INFO : EPOCH 61 - PROGRESS: at 100.54% examples, 64902 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:00:36,407 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 02:00:36,407 : INFO : EPOCH - 61 : training on 10306257 raw words (6934387 effective words) took 106.8s, 64901 effective words/s
2019-03-06 02:02:19,377 : INFO : EPOCH 62 - PROGRESS: at 15.03% examples, 9603 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:02:19,378 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 02:02:19,576 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 02:02:19,789 : INFO : worker thread finished; awaiti

2019-03-06 02:13:01,002 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 02:13:02,478 : INFO : EPOCH 68 - PROGRESS: at 59.12% examples, 37821 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:13:02,479 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 02:13:03,735 : INFO : EPOCH 68 - PROGRESS: at 73.36% examples, 46868 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:13:03,736 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 02:13:03,817 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 02:13:04,759 : INFO : EPOCH 68 - PROGRESS: at 100.54% examples, 64910 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:13:04,760 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 02:13:04,760 : INFO : EPOCH - 68 : training on 10306257 raw words (6935374 effective words) took 106.8s, 64909 effective words/s
2019-03-06 02:14:47,743 : INFO : EPOCH 69 - PROGRESS: at 15.03

2019-03-06 02:23:47,076 : INFO : EPOCH - 74 : training on 10306257 raw words (6935734 effective words) took 106.9s, 64855 effective words/s
2019-03-06 02:25:29,924 : INFO : EPOCH 75 - PROGRESS: at 15.03% examples, 9624 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:25:29,925 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 02:25:30,316 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 02:25:30,625 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 02:25:31,522 : INFO : EPOCH 75 - PROGRESS: at 59.12% examples, 37915 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:25:31,524 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 02:25:31,525 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 02:25:32,526 : INFO : EPOCH 75 - PROGRESS: at 89.55% examples, 56824 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:25:32,527 : INFO : worker thread finished; awaitin

2019-03-06 02:36:13,010 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 02:36:14,450 : INFO : EPOCH 81 - PROGRESS: at 100.54% examples, 64915 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:36:14,451 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 02:36:14,451 : INFO : EPOCH - 81 : training on 10306257 raw words (6934067 effective words) took 106.8s, 64914 effective words/s
2019-03-06 02:37:56,962 : INFO : EPOCH 82 - PROGRESS: at 15.03% examples, 9654 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:37:56,963 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 02:37:57,445 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 02:37:57,518 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 02:37:58,494 : INFO : EPOCH 82 - PROGRESS: at 59.12% examples, 38058 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:37:58,495 : INFO : worker thread finished; awaiti

2019-03-06 02:48:38,013 : INFO : EPOCH 88 - PROGRESS: at 59.12% examples, 38135 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:48:38,014 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 02:48:38,252 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 02:48:39,295 : INFO : EPOCH 88 - PROGRESS: at 89.55% examples, 56990 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:48:39,296 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 02:48:40,428 : INFO : EPOCH 88 - PROGRESS: at 100.54% examples, 65336 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:48:40,428 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 02:48:40,429 : INFO : EPOCH - 88 : training on 10306257 raw words (6934692 effective words) took 106.1s, 65335 effective words/s
2019-03-06 02:50:23,084 : INFO : EPOCH 89 - PROGRESS: at 13.21% examples, 9297 words/s, in_qsize -1, out_qsize 1
2019-03-06 02:50:23,086 : INFO : worker 

2019-03-06 03:01:02,139 : INFO : EPOCH 95 - PROGRESS: at 15.03% examples, 9648 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:01:02,141 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 03:01:02,451 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 03:01:02,468 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 03:01:03,544 : INFO : EPOCH 95 - PROGRESS: at 59.12% examples, 38059 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:01:03,545 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 03:01:03,603 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 03:01:04,613 : INFO : EPOCH 95 - PROGRESS: at 89.55% examples, 56995 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:01:04,614 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 03:01:05,841 : INFO : EPOCH 95 - PROGRESS: at 100.54% examples, 65286 words/s, in_qsize -1, out_qsize 

2019-03-06 03:11:42,132 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 03:11:43,435 : INFO : EPOCH 101 - PROGRESS: at 100.54% examples, 65366 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:11:43,436 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 03:11:43,437 : INFO : EPOCH - 101 : training on 10306257 raw words (6933757 effective words) took 106.1s, 65365 effective words/s
2019-03-06 03:13:25,877 : INFO : EPOCH 102 - PROGRESS: at 15.03% examples, 9655 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:13:25,879 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 03:13:26,387 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 03:13:26,390 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 03:13:27,524 : INFO : EPOCH 102 - PROGRESS: at 59.12% examples, 38036 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:13:27,525 : INFO : worker thread finished; aw

2019-03-06 03:24:05,642 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 03:24:06,799 : INFO : EPOCH 108 - PROGRESS: at 89.55% examples, 57098 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:24:06,800 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 03:24:07,984 : INFO : EPOCH 108 - PROGRESS: at 100.54% examples, 65431 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:24:07,985 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 03:24:07,985 : INFO : EPOCH - 108 : training on 10306257 raw words (6935734 effective words) took 106.0s, 65430 effective words/s
2019-03-06 03:25:50,401 : INFO : EPOCH 109 - PROGRESS: at 15.03% examples, 9660 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:25:50,402 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 03:25:50,623 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 03:25:50,649 : INFO : worker thread finished; aw

2019-03-06 03:36:27,649 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 03:36:27,821 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 03:36:28,880 : INFO : EPOCH 115 - PROGRESS: at 59.12% examples, 38211 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:36:28,881 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 03:36:29,142 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 03:36:30,006 : INFO : EPOCH 115 - PROGRESS: at 89.55% examples, 57189 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:36:30,007 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 03:36:31,170 : INFO : EPOCH 115 - PROGRESS: at 100.54% examples, 65556 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:36:31,170 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 03:36:31,171 : INFO : EPOCH - 115 : training on 10306257 raw words (6933947 effective words) took

2019-03-06 03:47:08,538 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 03:47:08,539 : INFO : EPOCH - 121 : training on 10306257 raw words (6935393 effective words) took 106.4s, 65209 effective words/s
2019-03-06 03:48:50,840 : INFO : EPOCH 122 - PROGRESS: at 15.03% examples, 9674 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:48:50,842 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 03:48:51,013 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 03:48:51,134 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 03:48:52,144 : INFO : EPOCH 122 - PROGRESS: at 59.12% examples, 38223 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:48:52,145 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 03:48:52,410 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 03:48:53,460 : INFO : EPOCH 122 - PROGRESS: at 89.55% examples, 57108 wor

2019-03-06 03:59:27,375 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 03:59:28,433 : INFO : EPOCH 128 - PROGRESS: at 89.55% examples, 57274 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:59:28,434 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 03:59:29,717 : INFO : EPOCH 128 - PROGRESS: at 100.54% examples, 65568 words/s, in_qsize -1, out_qsize 1
2019-03-06 03:59:29,718 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 03:59:29,719 : INFO : EPOCH - 128 : training on 10306257 raw words (6932800 effective words) took 105.7s, 65567 effective words/s
2019-03-06 04:01:11,943 : INFO : EPOCH 129 - PROGRESS: at 13.21% examples, 9338 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:01:11,944 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 04:01:12,074 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 04:01:12,092 : INFO : worker thread finished; aw

2019-03-06 04:11:47,055 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 04:11:47,863 : INFO : EPOCH 135 - PROGRESS: at 59.12% examples, 38556 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:11:47,864 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 04:11:48,276 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 04:11:49,490 : INFO : EPOCH 135 - PROGRESS: at 89.55% examples, 57428 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:11:49,491 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 04:11:50,622 : INFO : EPOCH 135 - PROGRESS: at 100.54% examples, 65836 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:11:50,622 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 04:11:50,623 : INFO : EPOCH - 135 : training on 10306257 raw words (6933404 effective words) took 105.3s, 65835 effective words/s
2019-03-06 04:13:32,303 : INFO : EPOCH 136 - PROGRESS: at 

2019-03-06 04:22:25,123 : INFO : EPOCH - 141 : training on 10306257 raw words (6934224 effective words) took 105.7s, 65578 effective words/s
2019-03-06 04:24:06,971 : INFO : EPOCH 142 - PROGRESS: at 17.08% examples, 10179 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:24:06,974 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 04:24:07,459 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 04:24:07,582 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 04:24:08,567 : INFO : EPOCH 142 - PROGRESS: at 59.12% examples, 38297 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:24:08,568 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 04:24:08,617 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 04:24:09,520 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 04:24:11,009 : INFO : EPOCH 142 - PROGRESS: at 100.54% examples, 65581 w

2019-03-06 04:34:44,449 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 04:34:45,635 : INFO : EPOCH 148 - PROGRESS: at 100.54% examples, 65751 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:34:45,636 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 04:34:45,636 : INFO : EPOCH - 148 : training on 10306257 raw words (6935124 effective words) took 105.5s, 65750 effective words/s
2019-03-06 04:36:27,599 : INFO : EPOCH 149 - PROGRESS: at 17.08% examples, 10169 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:36:27,600 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 04:36:27,701 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 04:36:27,814 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 04:36:29,169 : INFO : EPOCH 149 - PROGRESS: at 59.12% examples, 38264 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:36:29,170 : INFO : worker thread finished; a

2019-03-06 04:47:02,518 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 04:47:02,848 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 04:47:03,810 : INFO : EPOCH 155 - PROGRESS: at 89.55% examples, 57312 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:47:03,811 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 04:47:04,974 : INFO : EPOCH 155 - PROGRESS: at 100.54% examples, 65690 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:47:04,975 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 04:47:04,975 : INFO : EPOCH - 155 : training on 10306257 raw words (6936026 effective words) took 105.6s, 65689 effective words/s
2019-03-06 04:48:46,525 : INFO : EPOCH 156 - PROGRESS: at 15.03% examples, 9747 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:48:46,526 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 04:48:46,847 : INFO : worker thread finished; aw

2019-03-06 04:59:19,580 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 04:59:20,028 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 04:59:20,029 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 04:59:20,877 : INFO : EPOCH 162 - PROGRESS: at 59.12% examples, 38489 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:59:20,878 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 04:59:21,149 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 04:59:22,272 : INFO : EPOCH 162 - PROGRESS: at 89.55% examples, 57450 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:59:22,273 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 04:59:23,355 : INFO : EPOCH 162 - PROGRESS: at 100.54% examples, 65890 words/s, in_qsize -1, out_qsize 1
2019-03-06 04:59:23,355 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 04:59:

2019-03-06 05:09:57,323 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 05:09:57,323 : INFO : EPOCH - 168 : training on 10306257 raw words (6934722 effective words) took 105.6s, 65692 effective words/s
2019-03-06 05:11:38,877 : INFO : EPOCH 169 - PROGRESS: at 15.03% examples, 9747 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:11:38,878 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 05:11:38,960 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 05:11:39,007 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 05:11:40,344 : INFO : EPOCH 169 - PROGRESS: at 59.12% examples, 38441 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:11:40,345 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 05:11:40,452 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 05:11:41,503 : INFO : EPOCH 169 - PROGRESS: at 89.55% examples, 57517 wor

2019-03-06 05:22:12,878 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 05:22:14,214 : INFO : EPOCH 175 - PROGRESS: at 89.55% examples, 57393 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:22:14,215 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 05:22:15,498 : INFO : EPOCH 175 - PROGRESS: at 100.54% examples, 65705 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:22:15,499 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 05:22:15,499 : INFO : EPOCH - 175 : training on 10306257 raw words (6934975 effective words) took 105.5s, 65704 effective words/s
2019-03-06 05:23:57,147 : INFO : EPOCH 176 - PROGRESS: at 17.08% examples, 10194 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:23:57,148 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 05:23:57,521 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 05:23:57,606 : INFO : worker thread finished; a

2019-03-06 05:34:30,500 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 05:34:30,574 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 05:34:31,637 : INFO : EPOCH 182 - PROGRESS: at 59.12% examples, 38481 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:34:31,638 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 05:34:31,949 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 05:34:33,060 : INFO : EPOCH 182 - PROGRESS: at 89.55% examples, 57419 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:34:33,061 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 05:34:34,285 : INFO : EPOCH 182 - PROGRESS: at 100.54% examples, 65764 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:34:34,286 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 05:34:34,286 : INFO : EPOCH - 182 : training on 10306257 raw words (6933829 effective words) took

2019-03-06 05:45:08,037 : INFO : EPOCH - 188 : training on 10306257 raw words (6934547 effective words) took 105.5s, 65760 effective words/s
2019-03-06 05:46:49,812 : INFO : EPOCH 189 - PROGRESS: at 17.08% examples, 10187 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:46:49,814 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 05:46:50,042 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 05:46:50,269 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 05:46:51,309 : INFO : EPOCH 189 - PROGRESS: at 59.12% examples, 38358 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:46:51,310 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 05:46:51,440 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 05:46:52,531 : INFO : EPOCH 189 - PROGRESS: at 89.55% examples, 57354 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:46:52,532 : INFO : worker thread finished; aw

2019-03-06 05:57:26,700 : INFO : EPOCH 195 - PROGRESS: at 89.55% examples, 57288 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:57:26,701 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 05:57:27,836 : INFO : EPOCH 195 - PROGRESS: at 100.54% examples, 65673 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:57:27,837 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 05:57:27,838 : INFO : EPOCH - 195 : training on 10306257 raw words (6934196 effective words) took 105.6s, 65673 effective words/s
2019-03-06 05:59:09,625 : INFO : EPOCH 196 - PROGRESS: at 17.08% examples, 10183 words/s, in_qsize -1, out_qsize 1
2019-03-06 05:59:09,627 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 05:59:09,670 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 05:59:09,729 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 05:59:10,829 : INFO : EPOCH 196 - PROGRESS: at 

2019-03-06 06:09:43,862 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 06:09:44,710 : INFO : EPOCH 202 - PROGRESS: at 59.12% examples, 38560 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:09:44,711 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 06:09:45,114 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 06:09:46,095 : INFO : EPOCH 202 - PROGRESS: at 89.55% examples, 57561 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:09:46,096 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 06:09:47,439 : INFO : EPOCH 202 - PROGRESS: at 100.54% examples, 65856 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:09:47,439 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 06:09:47,441 : INFO : EPOCH - 202 : training on 10306257 raw words (6934662 effective words) took 105.3s, 65855 effective words/s
2019-03-06 06:11:29,027 : INFO : EPOCH 203 - PROGRESS: at 

2019-03-06 06:22:02,962 : INFO : EPOCH 209 - PROGRESS: at 15.03% examples, 9721 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:22:02,963 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 06:22:03,344 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 06:22:03,391 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 06:22:04,158 : INFO : EPOCH 209 - PROGRESS: at 59.12% examples, 38463 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:22:04,159 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 06:22:04,551 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 06:22:05,714 : INFO : EPOCH 209 - PROGRESS: at 89.55% examples, 57326 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:22:05,715 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 06:22:06,943 : INFO : EPOCH 209 - PROGRESS: at 100.54% examples, 65663 words/s, in_qsize -1, out_qs

2019-03-06 06:32:38,761 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 06:32:40,005 : INFO : EPOCH 215 - PROGRESS: at 100.54% examples, 65757 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:32:40,005 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 06:32:40,006 : INFO : EPOCH - 215 : training on 10306257 raw words (6936321 effective words) took 105.5s, 65756 effective words/s
2019-03-06 06:34:21,656 : INFO : EPOCH 216 - PROGRESS: at 17.08% examples, 10196 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:34:21,657 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 06:34:21,662 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 06:34:21,937 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 06:34:22,789 : INFO : EPOCH 216 - PROGRESS: at 59.12% examples, 38530 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:34:22,790 : INFO : worker thread finished; a

2019-03-06 06:44:55,585 : INFO : EPOCH 222 - PROGRESS: at 61.50% examples, 38896 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:44:55,586 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 06:44:55,660 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 06:44:56,957 : INFO : EPOCH 222 - PROGRESS: at 89.55% examples, 57417 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:44:56,957 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 06:44:58,222 : INFO : EPOCH 222 - PROGRESS: at 100.54% examples, 65745 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:44:58,222 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 06:44:58,223 : INFO : EPOCH - 222 : training on 10306257 raw words (6935153 effective words) took 105.5s, 65744 effective words/s
2019-03-06 06:46:39,938 : INFO : EPOCH 223 - PROGRESS: at 15.03% examples, 9724 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:46:39,939 : INFO : wo

2019-03-06 06:57:12,060 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 06:57:12,183 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 06:57:12,420 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 06:57:13,269 : INFO : EPOCH 229 - PROGRESS: at 59.12% examples, 38532 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:57:13,270 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 06:57:13,663 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 06:57:14,956 : INFO : EPOCH 229 - PROGRESS: at 89.55% examples, 57356 words/s, in_qsize -1, out_qsize 1
2019-03-06 06:57:14,956 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 06:57:15,937 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 06:57:15,938 : INFO : EPOCH - 229 : training on 10306257 raw words (6934896 effective words) took 105.3s, 65848 effective 

2019-03-06 07:07:48,148 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 07:07:48,149 : INFO : EPOCH - 235 : training on 10306257 raw words (6933896 effective words) took 105.2s, 65903 effective words/s
2019-03-06 07:09:29,578 : INFO : EPOCH 236 - PROGRESS: at 15.03% examples, 9753 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:09:29,580 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 07:09:29,610 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 07:09:29,739 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 07:09:30,622 : INFO : EPOCH 236 - PROGRESS: at 59.12% examples, 38644 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:09:30,622 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 07:09:30,984 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 07:09:31,946 : INFO : EPOCH 236 - PROGRESS: at 89.55% examples, 57730 wor

2019-03-06 07:20:02,193 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 07:20:03,412 : INFO : EPOCH 242 - PROGRESS: at 89.55% examples, 57496 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:20:03,413 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 07:20:04,591 : INFO : EPOCH 242 - PROGRESS: at 100.54% examples, 65882 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:20:04,591 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 07:20:04,593 : INFO : EPOCH - 242 : training on 10306257 raw words (6935122 effective words) took 105.3s, 65881 effective words/s
2019-03-06 07:21:45,673 : INFO : EPOCH 243 - PROGRESS: at 15.03% examples, 9794 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:21:45,675 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 07:21:45,911 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 07:21:45,980 : INFO : worker thread finished; aw

2019-03-06 07:32:18,605 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 07:32:18,806 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 07:32:19,673 : INFO : EPOCH 249 - PROGRESS: at 59.12% examples, 38352 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:32:19,674 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 07:32:19,937 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 07:32:20,868 : INFO : EPOCH 249 - PROGRESS: at 89.55% examples, 57364 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:32:20,869 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 07:32:22,048 : INFO : EPOCH 249 - PROGRESS: at 100.54% examples, 65730 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:32:22,049 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 07:32:22,049 : INFO : EPOCH - 249 : training on 10306257 raw words (6935244 effective words) took

2019-03-06 07:42:54,155 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 07:42:54,155 : INFO : EPOCH - 255 : training on 10306257 raw words (6933734 effective words) took 105.1s, 65968 effective words/s
2019-03-06 07:44:35,719 : INFO : EPOCH 256 - PROGRESS: at 15.03% examples, 9747 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:44:35,720 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 07:44:35,945 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 07:44:36,049 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 07:44:36,746 : INFO : EPOCH 256 - PROGRESS: at 59.12% examples, 38612 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:44:36,747 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 07:44:37,178 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 07:44:38,326 : INFO : EPOCH 256 - PROGRESS: at 89.55% examples, 57536 wor

2019-03-06 07:55:10,750 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 07:55:11,830 : INFO : EPOCH 262 - PROGRESS: at 89.55% examples, 57474 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:55:11,831 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 07:55:13,200 : INFO : EPOCH 262 - PROGRESS: at 100.54% examples, 65745 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:55:13,200 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 07:55:13,201 : INFO : EPOCH - 262 : training on 10306257 raw words (6936188 effective words) took 105.5s, 65744 effective words/s
2019-03-06 07:56:55,154 : INFO : EPOCH 263 - PROGRESS: at 17.08% examples, 10165 words/s, in_qsize -1, out_qsize 1
2019-03-06 07:56:55,155 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 07:56:55,162 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 07:56:55,310 : INFO : worker thread finished; a

2019-03-06 08:07:50,910 : INFO : EPOCH 269 - PROGRESS: at 59.12% examples, 32331 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:07:50,911 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 08:07:51,285 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 08:07:52,481 : INFO : EPOCH 269 - PROGRESS: at 89.55% examples, 48291 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:07:52,482 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 08:07:53,646 : INFO : EPOCH 269 - PROGRESS: at 100.54% examples, 55446 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:07:53,646 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 08:07:53,647 : INFO : EPOCH - 269 : training on 10306257 raw words (6934883 effective words) took 125.1s, 55445 effective words/s
2019-03-06 08:09:38,729 : INFO : EPOCH 270 - PROGRESS: at 17.08% examples, 9865 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:09:38,730 : INFO : wo

2019-03-06 08:22:08,131 : INFO : EPOCH 276 - PROGRESS: at 17.08% examples, 7534 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:22:08,132 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 08:22:08,214 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 08:22:08,685 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 08:22:09,482 : INFO : EPOCH 276 - PROGRESS: at 59.12% examples, 28512 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:22:09,483 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 08:22:09,616 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 08:22:10,909 : INFO : EPOCH 276 - PROGRESS: at 89.55% examples, 42703 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:22:10,910 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 08:22:12,100 : INFO : EPOCH 276 - PROGRESS: at 100.54% examples, 49072 words/s, in_qsize -1, out_qs

2019-03-06 08:33:10,764 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 08:33:12,350 : INFO : EPOCH 282 - PROGRESS: at 100.54% examples, 60666 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:33:12,351 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 08:33:12,351 : INFO : EPOCH - 282 : training on 10306257 raw words (6934239 effective words) took 114.3s, 60665 effective words/s
2019-03-06 08:36:11,063 : INFO : EPOCH 283 - PROGRESS: at 15.03% examples, 5536 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:36:11,065 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 08:36:11,403 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 08:36:11,783 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 08:36:14,008 : INFO : EPOCH 283 - PROGRESS: at 59.12% examples, 21793 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:36:14,010 : INFO : worker thread finished; aw

2019-03-06 08:50:00,847 : INFO : EPOCH 289 - PROGRESS: at 59.12% examples, 28949 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:50:00,849 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 08:50:01,068 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 08:50:03,252 : INFO : EPOCH 289 - PROGRESS: at 89.55% examples, 43046 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:50:03,253 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 08:50:05,111 : INFO : EPOCH 289 - PROGRESS: at 100.54% examples, 49230 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:50:05,112 : INFO : worker thread finished; awaiting finish of 0 more threads
2019-03-06 08:50:05,113 : INFO : EPOCH - 289 : training on 10306257 raw words (6933387 effective words) took 140.8s, 49230 effective words/s
2019-03-06 08:52:04,869 : INFO : EPOCH 290 - PROGRESS: at 15.03% examples, 8269 words/s, in_qsize -1, out_qsize 1
2019-03-06 08:52:04,871 : INFO : wo

2019-03-06 09:02:48,954 : INFO : EPOCH 296 - PROGRESS: at 17.08% examples, 10053 words/s, in_qsize -1, out_qsize 1
2019-03-06 09:02:48,955 : INFO : worker thread finished; awaiting finish of 6 more threads
2019-03-06 09:02:48,996 : INFO : worker thread finished; awaiting finish of 5 more threads
2019-03-06 09:02:49,104 : INFO : worker thread finished; awaiting finish of 4 more threads
2019-03-06 09:02:50,300 : INFO : EPOCH 296 - PROGRESS: at 59.12% examples, 37918 words/s, in_qsize -1, out_qsize 1
2019-03-06 09:02:50,301 : INFO : worker thread finished; awaiting finish of 3 more threads
2019-03-06 09:02:50,720 : INFO : worker thread finished; awaiting finish of 2 more threads
2019-03-06 09:02:51,577 : INFO : EPOCH 296 - PROGRESS: at 89.55% examples, 56679 words/s, in_qsize -1, out_qsize 1
2019-03-06 09:02:51,578 : INFO : worker thread finished; awaiting finish of 1 more threads
2019-03-06 09:02:52,780 : INFO : EPOCH 296 - PROGRESS: at 100.54% examples, 64947 words/s, in_qsize -1, out_q

In [6]:
# Persist the full trained Word2Vec object under a date-stamped file name.
# `datetime` is the class brought in by `from datetime import datetime`, so the
# timestamp is `datetime.now()`; the previous `datetime.datetime.now()` raises
# AttributeError on a fresh kernel (it presumably relied on a stray
# `import datetime` from a since-removed cell).
LOG.info('Saving word2vec for latin library corpus')
latin_lib_vec.save('latin_library.{}.vec'.format(datetime.now().strftime('%Y.%m.%d')))

2019-03-06 09:16:25,834 : INFO : Saving word2vec for latin library corpus
2019-03-06 09:16:25,835 : INFO : saving Word2Vec object under latin_library.2019.03.06.vec, separately None
2019-03-06 09:16:25,836 : INFO : storing np array 'vectors' to latin_library.2019.03.06.vec.wv.vectors.npy
2019-03-06 09:16:26,774 : INFO : not storing attribute vectors_norm
2019-03-06 09:16:26,775 : INFO : storing np array 'syn1neg' to latin_library.2019.03.06.vec.trainables.syn1neg.npy
2019-03-06 09:16:27,726 : INFO : not storing attribute cum_table
2019-03-06 09:16:27,984 : INFO : saved latin_library.2019.03.06.vec


In [7]:
# Record the training hyper-parameters next to the model, in a date-stamped JSON file.
# Uses `datetime.now()` because `datetime` is the class imported at the top of the
# notebook; `datetime.datetime.now()` fails with AttributeError after Restart & Run All.
with open('latin_library.vec.{}.params'.format(datetime.now().strftime('%Y.%m.%d')), 'wt') as writer:
    json.dump(keyword_params, writer)

### Persist the word vectors to disk
The saved vectors should be loadable across platforms and languages.

In [8]:
# Save only the word vectors (no training state) under a date-stamped name;
# `the_filename` is reused further down to reload them.
# Uses `datetime.now()` because `datetime` is the class imported at the top of the
# notebook; `datetime.datetime.now()` fails with AttributeError on a fresh kernel.
# NOTE(review): `.save()` writes gensim's own format (with the array in a separate
# .npy file, as the log shows); if loading from other languages is required,
# `save_word2vec_format` may be the better export -- confirm.
word_vectors = latin_lib_vec.wv
the_filename = 'latin_library.{}.kv'.format(datetime.now().strftime('%Y.%m.%d'))
word_vectors.save(the_filename)

2019-03-06 09:16:35,921 : INFO : saving Word2VecKeyedVectors object under latin_library.2019.03.06.kv, separately None
2019-03-06 09:16:35,922 : INFO : storing np array 'vectors' to latin_library.2019.03.06.kv.vectors.npy
2019-03-06 09:16:36,902 : INFO : not storing attribute vectors_norm
2019-03-06 09:16:37,133 : INFO : saved latin_library.2019.03.06.kv


## Some QA

In [9]:
# Ten nearest neighbours of 'puella' by cosine similarity (defaults spelled out).
latin_lib_vec.wv.most_similar(positive=['puella'], topn=10)

2019-03-06 09:16:42,632 : INFO : precomputing L2-norms of word weight vectors


[('instabatur', 0.31701159477233887),
 ('scitula', 0.3043367266654968),
 ('sauio', 0.296586275100708),
 ('repugnasset', 0.2914842367172241),
 ('praepollet', 0.288862943649292),
 ('tractor', 0.28605037927627563),
 ('maturando', 0.2769477963447571),
 ('extruderetur', 0.27676403522491455),
 ('miserandas', 0.2750115394592285),
 ('uetula', 0.2738913595676422)]

In [10]:
# Ten nearest neighbours of the adverb 'uiolenter' (default count made explicit).
latin_lib_vec.wv.similar_by_word(word='uiolenter', topn=10)

[('occupant', 0.3278190493583679),
 ('aggrauantes', 0.3118888735771179),
 ('effracta', 0.28086984157562256),
 ('effringunt', 0.2808580994606018),
 ('occupauimus', 0.27877819538116455),
 ('interfatus', 0.2770298421382904),
 ('effringitur', 0.2761697769165039),
 ('nudabat', 0.27535030245780945),
 ('subuertens', 0.2740432620048523),
 ('geminatae', 0.27362722158432007)]

In [11]:
# Ten nearest neighbours of 'uir', queried on the in-memory model.
latin_lib_vec.wv.similar_by_word(word='uir', topn=10)

[('homo', 0.41128575801849365),
 ('eius', 0.4087766408920288),
 ('qui', 0.4087045192718506),
 ('me', 0.3989563584327698),
 ('filius', 0.39075589179992676),
 ('et', 0.38757461309432983),
 ('quasi', 0.38720792531967163),
 ('quis', 0.38023948669433594),
 ('ille', 0.37594127655029297),
 ('erat', 0.37241026759147644)]

In [12]:
# Reload the keyed vectors written earlier to `the_filename`, to check that the
# saved file round-trips. mmap='r' asks gensim to memory-map the separately
# stored vectors array read-only (the load log reports "with mmap=r").
latin_word_vectors = KeyedVectors.load(the_filename, mmap='r')

2019-03-06 09:16:46,433 : INFO : loading Word2VecKeyedVectors object from latin_library.2019.03.06.kv
2019-03-06 09:16:46,713 : INFO : loading vectors from latin_library.2019.03.06.kv.vectors.npy with mmap=r
2019-03-06 09:16:46,722 : INFO : setting ignored attribute vectors_norm to None
2019-03-06 09:16:46,723 : INFO : loaded latin_library.2019.03.06.kv


In [13]:
# Round-trip check: the reloaded vectors should return the same ten neighbours
# for 'uir' as the in-memory model does.
latin_word_vectors.most_similar(positive=['uir'], topn=10)

2019-03-06 09:16:46,889 : INFO : precomputing L2-norms of word weight vectors


[('homo', 0.41128575801849365),
 ('eius', 0.4087766408920288),
 ('qui', 0.4087045192718506),
 ('me', 0.3989563584327698),
 ('filius', 0.39075589179992676),
 ('et', 0.38757461309432983),
 ('quasi', 0.38720792531967163),
 ('quis', 0.38023948669433594),
 ('ille', 0.37594127655029297),
 ('erat', 0.37241026759147644)]

In [14]:
# Ten nearest neighbours of the verb form 'cano'.
latin_lib_vec.wv.most_similar(positive=['cano'], topn=10)

[('nes', 0.3691553473472595),
 ('nem', 0.3362516164779663),
 ('aurario', 0.2990747392177582),
 ('exorbitare', 0.2923274636268616),
 ('gramaticam', 0.2880067825317383),
 ('spumabant', 0.28595393896102905),
 ('arceo', 0.28334152698516846),
 ('dempto', 0.2765955626964569),
 ('derisi', 0.2744697630405426),
 ('compellentibus', 0.26956403255462646)]

In [15]:
# Ten nearest neighbours of the inflected form 'hominis'.
latin_lib_vec.wv.most_similar(positive=['hominis'], topn=10)

[('fili', 0.41234782338142395),
 ('nullificame', 0.39074838161468506),
 ('deueneris', 0.35705214738845825),
 ('eius', 0.34812599420547485),
 ('prophetantibus', 0.3334704339504242),
 ('enim', 0.33328378200531006),
 ('monstruosam', 0.33029109239578247),
 ('quia', 0.32797425985336304),
 ('homo', 0.3257666826248169),
 ('me', 0.32543182373046875)]

In [16]:
# Ten nearest neighbours of the adjective form 'pigrum'.
latin_lib_vec.wv.most_similar(positive=['pigrum'], topn=10)

[('pinguescant', 0.3039183020591736),
 ('meanti', 0.282198429107666),
 ('remigantibus', 0.2680237889289856),
 ('conligari', 0.26064327359199524),
 ('homuncionem', 0.25794699788093567),
 ('mancum', 0.25267118215560913),
 ('neglegentem', 0.25006312131881714),
 ('pigros', 0.24705643951892853),
 ('metuent', 0.24419176578521729),
 ('elementum', 0.24003754556179047)]

In [17]:
# Ten nearest neighbours of 'homo' (default count made explicit).
latin_lib_vec.wv.most_similar(positive=['homo'], topn=10)

[('quia', 0.41234609484672546),
 ('uir', 0.41128572821617126),
 ('ergo', 0.3883773982524872),
 ('non', 0.38568592071533203),
 ('qui', 0.3810696005821228),
 ('est', 0.3801639676094055),
 ('enim', 0.37904277443885803),
 ('ille', 0.3717462718486786),
 ('sic', 0.3698633313179016),
 ('omnis', 0.3671305179595947)]

In [18]:
# Ten nearest neighbours of 'mentula' (default count made explicit).
latin_lib_vec.wv.most_similar(positive=['mentula'], topn=10)

[('arrigis', 0.3291878402233124),
 ('sesquipedalis', 0.29460304975509644),
 ('meiere', 0.2688262462615967),
 ('commendasti', 0.2528712749481201),
 ('cerussata', 0.2522173821926117),
 ('mulgeat', 0.24947533011436462),
 ('numerantem', 0.24851492047309875),
 ('uellis', 0.24850168824195862),
 ('cunnus', 0.2467784434556961),
 ('olfacere', 0.24590563774108887)]

In [19]:
# Ten nearest neighbours of the infinitive 'scandere'.
latin_lib_vec.wv.most_similar(positive=['scandere'], topn=10)

[('frangentia', 0.2777160406112671),
 ('pulsantis', 0.2761341333389282),
 ('lapsantibus', 0.25163206458091736),
 ('intrate', 0.24283654987812042),
 ('racio', 0.24051621556282043),
 ('submissus', 0.23489117622375488),
 ('euellas', 0.23214466869831085),
 ('incestare', 0.23007065057754517),
 ('deficiam', 0.22999346256256104),
 ('constancia', 0.2263008952140808)]

In [20]:
# Ten nearest neighbours of the infinitive 'praelucere'.
latin_lib_vec.wv.most_similar(positive=['praelucere'], topn=10)

[('tenderemus', 0.4717866778373718),
 ('praeuisum', 0.3457968533039093),
 ('effecero', 0.311782568693161),
 ('remistheo', 0.2971537709236145),
 ('mansisses', 0.284287691116333),
 ('uibret', 0.27515909075737),
 ('lenius', 0.2725391387939453),
 ('caeciliano', 0.2704721689224243),
 ('messalae', 0.26987600326538086),
 ('aedituus', 0.26893386244773865)]

In [21]:
# Repeats the earlier 'puella' neighbour query through `similar_by_word`;
# the output matches the earlier cell's.
latin_lib_vec.wv.similar_by_word(word='puella', topn=10)

[('instabatur', 0.31701159477233887),
 ('scitula', 0.3043367266654968),
 ('sauio', 0.296586275100708),
 ('repugnasset', 0.2914842367172241),
 ('praepollet', 0.288862943649292),
 ('tractor', 0.28605037927627563),
 ('maturando', 0.2769477963447571),
 ('extruderetur', 0.27676403522491455),
 ('miserandas', 0.2750115394592285),
 ('uetula', 0.2738913595676422)]

In [22]:
# Repeats the earlier 'mentula' neighbour query through `similar_by_word`;
# the output matches the earlier cell's.
latin_lib_vec.wv.similar_by_word(word='mentula', topn=10)

[('arrigis', 0.3291878402233124),
 ('sesquipedalis', 0.29460304975509644),
 ('meiere', 0.2688262462615967),
 ('commendasti', 0.2528712749481201),
 ('cerussata', 0.2522173821926117),
 ('mulgeat', 0.24947533011436462),
 ('numerantem', 0.24851492047309875),
 ('uellis', 0.24850168824195862),
 ('cunnus', 0.2467784434556961),
 ('olfacere', 0.24590563774108887)]

In [24]:
# Ten nearest neighbours of 'ciuis' (default count made explicit).
latin_lib_vec.wv.similar_by_word(word='ciuis', topn=10)

[('bacchium', 0.34864407777786255),
 ('ouch', 0.2970449924468994),
 ('romanus', 0.29618778824806213),
 ('aequaeuus', 0.29487138986587524),
 ('eiciebant', 0.28827977180480957),
 ('auteur', 0.2760046720504761),
 ('coaceruatam', 0.2718203663825989),
 ('indemnati', 0.26956579089164734),
 ('excultos', 0.2652883529663086),
 ('praeficiebant', 0.26509445905685425)]