In [1]:
import numpy as np

from nltk.tokenize import sent_tokenize, regexp_tokenize, word_tokenize
from nltk.corpus import stopwords
from common import *
from glob import iglob

from nltk.tokenize import RegexpTokenizer
from gensim.models import Word2Vec

from joblib import Parallel, delayed
import gensim, logging
import multiprocessing
import json
from gzip import GzipFile

import tensorflow as tf
from tensorflow.contrib.tensorboard.plugins import projector

DATA_FOLDER = '../data/'
cpu_count = multiprocessing.cpu_count()
logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.INFO)

In [2]:
class Sentences(object):
    def __init__(self, folder):
        self.folder = folder
 
    def __iter__(self):
        for i, fn in enumerate(glob(join(self.folder, '*.gz'))):
            logging.info("%s: " % i + fn)
            with GzipFile(fn, 'r') as myzip:
                text = myzip.read()
            docs = json.loads(text)
            for doc in docs.values():
                for sentence in doc:
                    yield sentence

# Train

In [4]:
dim = 300

In [7]:
model = Word2Vec(Sentences(join(DATA_FOLDER, 'documents/')), size=dim, 
                 sg=1, min_count=5, window=3, workers=cpu_count)

2017-07-20 19:25:01,040 : INFO : collecting all words and their counts
2017-07-20 19:25:01,290 : INFO : PROGRESS: at sentence #0, processed 0 words, keeping 0 word types
2017-07-20 19:25:01,314 : INFO : PROGRESS: at sentence #10000, processed 82018 words, keeping 9389 word types
2017-07-20 19:25:01,339 : INFO : PROGRESS: at sentence #20000, processed 177881 words, keeping 14813 word types
2017-07-20 19:25:01,467 : INFO : PROGRESS: at sentence #30000, processed 265117 words, keeping 18502 word types
2017-07-20 19:25:03,067 : INFO : PROGRESS: at sentence #40000, processed 344670 words, keeping 21567 word types
2017-07-20 19:25:03,098 : INFO : PROGRESS: at sentence #50000, processed 442225 words, keeping 26393 word types
2017-07-20 19:25:03,130 : INFO : PROGRESS: at sentence #60000, processed 542691 words, keeping 30469 word types
2017-07-20 19:25:03,162 : INFO : PROGRESS: at sentence #70000, processed 639353 words, keeping 33615 word types
2017-07-20 19:25:03,194 : INFO : PROGRESS: at se

2017-07-20 19:25:10,982 : INFO : PROGRESS: at sentence #720000, processed 6770142 words, keeping 138871 word types
2017-07-20 19:25:11,016 : INFO : PROGRESS: at sentence #730000, processed 6869565 words, keeping 140363 word types
2017-07-20 19:25:11,047 : INFO : PROGRESS: at sentence #740000, processed 6964701 words, keeping 141672 word types
2017-07-20 19:25:11,078 : INFO : PROGRESS: at sentence #750000, processed 7059966 words, keeping 142958 word types
2017-07-20 19:25:11,114 : INFO : PROGRESS: at sentence #760000, processed 7172587 words, keeping 144393 word types
2017-07-20 19:25:11,146 : INFO : PROGRESS: at sentence #770000, processed 7267458 words, keeping 145572 word types
2017-07-20 19:25:12,677 : INFO : PROGRESS: at sentence #780000, processed 7378029 words, keeping 146593 word types
2017-07-20 19:25:12,712 : INFO : PROGRESS: at sentence #790000, processed 7496255 words, keeping 147768 word types
2017-07-20 19:25:12,744 : INFO : PROGRESS: at sentence #800000, processed 759470

2017-07-20 19:25:20,507 : INFO : PROGRESS: at sentence #1430000, processed 13936608 words, keeping 214616 word types
2017-07-20 19:25:20,542 : INFO : PROGRESS: at sentence #1440000, processed 14054915 words, keeping 215350 word types
2017-07-20 19:25:20,579 : INFO : PROGRESS: at sentence #1450000, processed 14163569 words, keeping 216273 word types
2017-07-20 19:25:22,137 : INFO : PROGRESS: at sentence #1460000, processed 14270746 words, keeping 217371 word types
2017-07-20 19:25:22,174 : INFO : PROGRESS: at sentence #1470000, processed 14375868 words, keeping 218554 word types
2017-07-20 19:25:22,211 : INFO : PROGRESS: at sentence #1480000, processed 14479793 words, keeping 219628 word types
2017-07-20 19:25:22,249 : INFO : PROGRESS: at sentence #1490000, processed 14588391 words, keeping 220475 word types
2017-07-20 19:25:22,286 : INFO : PROGRESS: at sentence #1500000, processed 14687364 words, keeping 221307 word types
2017-07-20 19:25:22,324 : INFO : PROGRESS: at sentence #1510000,

2017-07-20 19:25:31,152 : INFO : PROGRESS: at sentence #2140000, processed 21178436 words, keeping 274768 word types
2017-07-20 19:25:31,189 : INFO : PROGRESS: at sentence #2150000, processed 21274186 words, keeping 275601 word types
2017-07-20 19:25:31,222 : INFO : PROGRESS: at sentence #2160000, processed 21371018 words, keeping 276229 word types
2017-07-20 19:25:31,256 : INFO : PROGRESS: at sentence #2170000, processed 21465995 words, keeping 277139 word types
2017-07-20 19:25:31,292 : INFO : PROGRESS: at sentence #2180000, processed 21565766 words, keeping 278097 word types
2017-07-20 19:25:31,325 : INFO : PROGRESS: at sentence #2190000, processed 21658938 words, keeping 278768 word types
2017-07-20 19:25:31,360 : INFO : PROGRESS: at sentence #2200000, processed 21755793 words, keeping 279424 word types
2017-07-20 19:25:31,394 : INFO : PROGRESS: at sentence #2210000, processed 21850656 words, keeping 280205 word types
2017-07-20 19:25:31,427 : INFO : PROGRESS: at sentence #2220000,

2017-07-20 19:25:40,217 : INFO : PROGRESS: at sentence #2850000, processed 28214165 words, keeping 328841 word types
2017-07-20 19:25:40,255 : INFO : PROGRESS: at sentence #2860000, processed 28310542 words, keeping 329683 word types
2017-07-20 19:25:40,290 : INFO : PROGRESS: at sentence #2870000, processed 28411544 words, keeping 330327 word types
2017-07-20 19:25:40,577 : INFO : PROGRESS: at sentence #2880000, processed 28523939 words, keeping 331114 word types
2017-07-20 19:25:40,611 : INFO : PROGRESS: at sentence #2890000, processed 28613183 words, keeping 331523 word types
2017-07-20 19:25:40,642 : INFO : PROGRESS: at sentence #2900000, processed 28700915 words, keeping 331977 word types
2017-07-20 19:25:42,187 : INFO : PROGRESS: at sentence #2910000, processed 28785727 words, keeping 332490 word types
2017-07-20 19:25:42,222 : INFO : PROGRESS: at sentence #2920000, processed 28885291 words, keeping 332999 word types
2017-07-20 19:25:42,259 : INFO : PROGRESS: at sentence #2930000,

2017-07-20 19:25:50,157 : INFO : PROGRESS: at sentence #3560000, processed 35108322 words, keeping 371867 word types
2017-07-20 19:25:50,193 : INFO : PROGRESS: at sentence #3570000, processed 35199910 words, keeping 372496 word types
2017-07-20 19:25:50,232 : INFO : PROGRESS: at sentence #3580000, processed 35292815 words, keeping 373291 word types
2017-07-20 19:25:50,270 : INFO : PROGRESS: at sentence #3590000, processed 35399919 words, keeping 374011 word types
2017-07-20 19:25:50,305 : INFO : PROGRESS: at sentence #3600000, processed 35496108 words, keeping 374856 word types
2017-07-20 19:25:50,341 : INFO : PROGRESS: at sentence #3610000, processed 35586182 words, keeping 375464 word types
2017-07-20 19:25:50,617 : INFO : PROGRESS: at sentence #3620000, processed 35680427 words, keeping 375895 word types
2017-07-20 19:25:50,648 : INFO : PROGRESS: at sentence #3630000, processed 35762363 words, keeping 376336 word types
2017-07-20 19:25:50,681 : INFO : PROGRESS: at sentence #3640000,

2017-07-20 19:26:00,227 : INFO : PROGRESS: at sentence #4270000, processed 42076429 words, keeping 414260 word types
2017-07-20 19:26:00,262 : INFO : PROGRESS: at sentence #4280000, processed 42166387 words, keeping 414809 word types
2017-07-20 19:26:00,297 : INFO : PROGRESS: at sentence #4290000, processed 42264401 words, keeping 415373 word types
2017-07-20 19:26:00,335 : INFO : PROGRESS: at sentence #4300000, processed 42367789 words, keeping 416185 word types
2017-07-20 19:26:00,368 : INFO : PROGRESS: at sentence #4310000, processed 42462369 words, keeping 416746 word types
2017-07-20 19:26:00,403 : INFO : PROGRESS: at sentence #4320000, processed 42559298 words, keeping 417335 word types
2017-07-20 19:26:00,440 : INFO : PROGRESS: at sentence #4330000, processed 42659338 words, keeping 417786 word types
2017-07-20 19:26:00,475 : INFO : PROGRESS: at sentence #4340000, processed 42751449 words, keeping 418392 word types
2017-07-20 19:26:00,511 : INFO : PROGRESS: at sentence #4350000,

2017-07-20 19:26:10,502 : INFO : PROGRESS: at sentence #4980000, processed 49198664 words, keeping 455179 word types
2017-07-20 19:26:10,540 : INFO : PROGRESS: at sentence #4990000, processed 49301291 words, keeping 455673 word types
2017-07-20 19:26:10,584 : INFO : PROGRESS: at sentence #5000000, processed 49409575 words, keeping 456236 word types
2017-07-20 19:26:10,628 : INFO : PROGRESS: at sentence #5010000, processed 49519117 words, keeping 456639 word types
2017-07-20 19:26:10,667 : INFO : PROGRESS: at sentence #5020000, processed 49617574 words, keeping 457095 word types
2017-07-20 19:26:10,707 : INFO : PROGRESS: at sentence #5030000, processed 49716810 words, keeping 457566 word types
2017-07-20 19:26:10,744 : INFO : PROGRESS: at sentence #5040000, processed 49814367 words, keeping 457940 word types
2017-07-20 19:26:10,784 : INFO : PROGRESS: at sentence #5050000, processed 49912278 words, keeping 458484 word types
2017-07-20 19:26:10,824 : INFO : PROGRESS: at sentence #5060000,

2017-07-20 19:26:19,857 : INFO : PROGRESS: at sentence #5690000, processed 56305199 words, keeping 492114 word types
2017-07-20 19:26:19,893 : INFO : PROGRESS: at sentence #5700000, processed 56400350 words, keeping 492501 word types
2017-07-20 19:26:19,934 : INFO : PROGRESS: at sentence #5710000, processed 56516340 words, keeping 493392 word types
2017-07-20 19:26:19,972 : INFO : PROGRESS: at sentence #5720000, processed 56615220 words, keeping 494008 word types
2017-07-20 19:26:20,010 : INFO : PROGRESS: at sentence #5730000, processed 56712159 words, keeping 494472 word types
2017-07-20 19:26:20,045 : INFO : PROGRESS: at sentence #5740000, processed 56810635 words, keeping 494788 word types
2017-07-20 19:26:20,084 : INFO : PROGRESS: at sentence #5750000, processed 56921452 words, keeping 495488 word types
2017-07-20 19:26:20,120 : INFO : PROGRESS: at sentence #5760000, processed 57018809 words, keeping 495991 word types
2017-07-20 19:26:20,400 : INFO : PROGRESS: at sentence #5770000,

2017-07-20 19:26:29,521 : INFO : PROGRESS: at sentence #6400000, processed 63297228 words, keeping 528477 word types
2017-07-20 19:26:29,557 : INFO : PROGRESS: at sentence #6410000, processed 63391322 words, keeping 528897 word types
2017-07-20 19:26:29,598 : INFO : PROGRESS: at sentence #6420000, processed 63496312 words, keeping 529416 word types
2017-07-20 19:26:29,636 : INFO : PROGRESS: at sentence #6430000, processed 63595954 words, keeping 529912 word types
2017-07-20 19:26:29,670 : INFO : PROGRESS: at sentence #6440000, processed 63693988 words, keeping 530411 word types
2017-07-20 19:26:29,709 : INFO : PROGRESS: at sentence #6450000, processed 63789715 words, keeping 530802 word types
2017-07-20 19:26:29,745 : INFO : PROGRESS: at sentence #6460000, processed 63883774 words, keeping 531121 word types
2017-07-20 19:26:29,914 : INFO : PROGRESS: at sentence #6470000, processed 63988956 words, keeping 531405 word types
2017-07-20 19:26:31,427 : INFO : PROGRESS: at sentence #6480000,

2017-07-20 19:26:39,494 : INFO : PROGRESS: at sentence #7110000, processed 70291599 words, keeping 562464 word types
2017-07-20 19:26:39,536 : INFO : PROGRESS: at sentence #7120000, processed 70394514 words, keeping 563216 word types
2017-07-20 19:26:39,572 : INFO : PROGRESS: at sentence #7130000, processed 70491399 words, keeping 563690 word types
2017-07-20 19:26:39,617 : INFO : PROGRESS: at sentence #7140000, processed 70604548 words, keeping 564294 word types
2017-07-20 19:26:39,654 : INFO : PROGRESS: at sentence #7150000, processed 70698881 words, keeping 564731 word types
2017-07-20 19:26:39,691 : INFO : PROGRESS: at sentence #7160000, processed 70789873 words, keeping 565268 word types
2017-07-20 19:26:39,727 : INFO : PROGRESS: at sentence #7170000, processed 70879928 words, keeping 565800 word types
2017-07-20 19:26:41,389 : INFO : PROGRESS: at sentence #7180000, processed 70981803 words, keeping 566208 word types
2017-07-20 19:26:41,426 : INFO : PROGRESS: at sentence #7190000,

2017-07-20 19:26:49,876 : INFO : PROGRESS: at sentence #7820000, processed 77227461 words, keeping 594260 word types
2017-07-20 19:26:49,913 : INFO : PROGRESS: at sentence #7830000, processed 77320340 words, keeping 594572 word types
2017-07-20 19:26:49,952 : INFO : PROGRESS: at sentence #7840000, processed 77418316 words, keeping 594920 word types
2017-07-20 19:26:49,990 : INFO : PROGRESS: at sentence #7850000, processed 77517288 words, keeping 595226 word types
2017-07-20 19:26:50,030 : INFO : PROGRESS: at sentence #7860000, processed 77623501 words, keeping 595648 word types
2017-07-20 19:26:50,068 : INFO : PROGRESS: at sentence #7870000, processed 77714679 words, keeping 596094 word types
2017-07-20 19:26:50,105 : INFO : PROGRESS: at sentence #7880000, processed 77804193 words, keeping 596495 word types
2017-07-20 19:26:50,147 : INFO : PROGRESS: at sentence #7890000, processed 77906859 words, keeping 597240 word types
2017-07-20 19:26:50,184 : INFO : PROGRESS: at sentence #7900000,

2017-07-20 19:26:59,015 : INFO : PROGRESS: at sentence #8530000, processed 84186396 words, keeping 625050 word types
2017-07-20 19:26:59,060 : INFO : PROGRESS: at sentence #8540000, processed 84288262 words, keeping 625577 word types
2017-07-20 19:27:00,792 : INFO : PROGRESS: at sentence #8550000, processed 84390339 words, keeping 626097 word types
2017-07-20 19:27:00,829 : INFO : PROGRESS: at sentence #8560000, processed 84483999 words, keeping 626445 word types
2017-07-20 19:27:00,872 : INFO : PROGRESS: at sentence #8570000, processed 84582640 words, keeping 626855 word types
2017-07-20 19:27:00,910 : INFO : PROGRESS: at sentence #8580000, processed 84680708 words, keeping 627174 word types
2017-07-20 19:27:00,950 : INFO : PROGRESS: at sentence #8590000, processed 84780127 words, keeping 627730 word types
2017-07-20 19:27:00,988 : INFO : PROGRESS: at sentence #8600000, processed 84881455 words, keeping 628130 word types
2017-07-20 19:27:01,028 : INFO : PROGRESS: at sentence #8610000,

2017-07-20 19:27:10,252 : INFO : PROGRESS: at sentence #9240000, processed 91120256 words, keeping 655280 word types
2017-07-20 19:27:10,290 : INFO : PROGRESS: at sentence #9250000, processed 91216685 words, keeping 655641 word types
2017-07-20 19:27:10,331 : INFO : PROGRESS: at sentence #9260000, processed 91316287 words, keeping 656105 word types
2017-07-20 19:27:10,373 : INFO : PROGRESS: at sentence #9270000, processed 91417536 words, keeping 656651 word types
2017-07-20 19:27:10,411 : INFO : PROGRESS: at sentence #9280000, processed 91513596 words, keeping 656999 word types
2017-07-20 19:27:10,450 : INFO : PROGRESS: at sentence #9290000, processed 91621272 words, keeping 657480 word types
2017-07-20 19:27:10,492 : INFO : PROGRESS: at sentence #9300000, processed 91722131 words, keeping 658008 word types
2017-07-20 19:27:10,534 : INFO : PROGRESS: at sentence #9310000, processed 91819992 words, keeping 658344 word types
2017-07-20 19:27:10,573 : INFO : PROGRESS: at sentence #9320000,

2017-07-20 19:27:19,059 : INFO : PROGRESS: at sentence #9950000, processed 98036854 words, keeping 682033 word types
2017-07-20 19:27:19,100 : INFO : PROGRESS: at sentence #9960000, processed 98136185 words, keeping 682622 word types
2017-07-20 19:27:19,273 : INFO : PROGRESS: at sentence #9970000, processed 98227002 words, keeping 682954 word types
2017-07-20 19:27:19,590 : INFO : PROGRESS: at sentence #9980000, processed 98306362 words, keeping 683140 word types
2017-07-20 19:27:19,623 : INFO : PROGRESS: at sentence #9990000, processed 98386248 words, keeping 683510 word types
2017-07-20 19:27:19,660 : INFO : PROGRESS: at sentence #10000000, processed 98467792 words, keeping 683915 word types
2017-07-20 19:27:19,884 : INFO : PROGRESS: at sentence #10010000, processed 98552414 words, keeping 684245 word types
2017-07-20 19:27:19,917 : INFO : PROGRESS: at sentence #10020000, processed 98633218 words, keeping 684496 word types
2017-07-20 19:27:19,953 : INFO : PROGRESS: at sentence #10030

2017-07-20 19:27:29,741 : INFO : PROGRESS: at sentence #10650000, processed 104904189 words, keeping 708689 word types
2017-07-20 19:27:29,786 : INFO : PROGRESS: at sentence #10660000, processed 105021854 words, keeping 709245 word types
2017-07-20 19:27:29,832 : INFO : PROGRESS: at sentence #10670000, processed 105143071 words, keeping 709631 word types
2017-07-20 19:27:29,876 : INFO : PROGRESS: at sentence #10680000, processed 105252772 words, keeping 709946 word types
2017-07-20 19:27:29,916 : INFO : PROGRESS: at sentence #10690000, processed 105349835 words, keeping 710376 word types
2017-07-20 19:27:29,954 : INFO : PROGRESS: at sentence #10700000, processed 105447056 words, keeping 710658 word types
2017-07-20 19:27:30,256 : INFO : PROGRESS: at sentence #10710000, processed 105538221 words, keeping 710881 word types
2017-07-20 19:27:30,293 : INFO : PROGRESS: at sentence #10720000, processed 105618622 words, keeping 711146 word types
2017-07-20 19:27:30,336 : INFO : PROGRESS: at se

2017-07-20 19:27:39,190 : INFO : PROGRESS: at sentence #11340000, processed 111811642 words, keeping 736053 word types
2017-07-20 19:27:39,231 : INFO : PROGRESS: at sentence #11350000, processed 111919518 words, keeping 736476 word types
2017-07-20 19:27:40,762 : INFO : PROGRESS: at sentence #11360000, processed 112019344 words, keeping 736809 word types
2017-07-20 19:27:40,802 : INFO : PROGRESS: at sentence #11370000, processed 112125440 words, keeping 737218 word types
2017-07-20 19:27:40,841 : INFO : PROGRESS: at sentence #11380000, processed 112222966 words, keeping 737559 word types
2017-07-20 19:27:40,885 : INFO : PROGRESS: at sentence #11390000, processed 112324612 words, keeping 737928 word types
2017-07-20 19:27:40,925 : INFO : PROGRESS: at sentence #11400000, processed 112429389 words, keeping 738271 word types
2017-07-20 19:27:40,962 : INFO : PROGRESS: at sentence #11410000, processed 112525698 words, keeping 738569 word types
2017-07-20 19:27:40,999 : INFO : PROGRESS: at se

2017-07-20 19:27:48,864 : INFO : PROGRESS: at sentence #12030000, processed 118696745 words, keeping 761161 word types
2017-07-20 19:27:48,905 : INFO : PROGRESS: at sentence #12040000, processed 118792106 words, keeping 761998 word types
2017-07-20 19:27:49,320 : INFO : PROGRESS: at sentence #12050000, processed 118889350 words, keeping 762379 word types
2017-07-20 19:27:49,356 : INFO : PROGRESS: at sentence #12060000, processed 118977699 words, keeping 762699 word types
2017-07-20 19:27:49,597 : INFO : PROGRESS: at sentence #12070000, processed 119059331 words, keeping 762942 word types
2017-07-20 19:27:49,629 : INFO : PROGRESS: at sentence #12080000, processed 119135994 words, keeping 763221 word types
2017-07-20 19:27:49,665 : INFO : PROGRESS: at sentence #12090000, processed 119224873 words, keeping 763474 word types
2017-07-20 19:27:51,173 : INFO : PROGRESS: at sentence #12100000, processed 119309830 words, keeping 763733 word types
2017-07-20 19:27:51,219 : INFO : PROGRESS: at se

2017-07-20 19:27:58,424 : INFO : PROGRESS: at sentence #12720000, processed 125252588 words, keeping 784975 word types
2017-07-20 19:27:58,461 : INFO : PROGRESS: at sentence #12730000, processed 125345562 words, keeping 785504 word types
2017-07-20 19:27:58,503 : INFO : PROGRESS: at sentence #12740000, processed 125448813 words, keeping 785870 word types
2017-07-20 19:27:58,767 : INFO : PROGRESS: at sentence #12750000, processed 125526676 words, keeping 786110 word types
2017-07-20 19:27:58,802 : INFO : PROGRESS: at sentence #12760000, processed 125607155 words, keeping 786347 word types
2017-07-20 19:28:00,181 : INFO : PROGRESS: at sentence #12770000, processed 125685596 words, keeping 786593 word types
2017-07-20 19:28:00,217 : INFO : PROGRESS: at sentence #12780000, processed 125780944 words, keeping 786912 word types
2017-07-20 19:28:00,257 : INFO : PROGRESS: at sentence #12790000, processed 125873866 words, keeping 787637 word types
2017-07-20 19:28:00,295 : INFO : PROGRESS: at se

2017-07-20 19:28:08,231 : INFO : PROGRESS: at sentence #13410000, processed 131943187 words, keeping 810637 word types
2017-07-20 19:28:08,271 : INFO : PROGRESS: at sentence #13420000, processed 132038101 words, keeping 810987 word types
2017-07-20 19:28:08,313 : INFO : PROGRESS: at sentence #13430000, processed 132149102 words, keeping 811256 word types
2017-07-20 19:28:08,356 : INFO : PROGRESS: at sentence #13440000, processed 132253017 words, keeping 811630 word types
2017-07-20 19:28:08,396 : INFO : PROGRESS: at sentence #13450000, processed 132349558 words, keeping 812138 word types
2017-07-20 19:28:08,683 : INFO : PROGRESS: at sentence #13460000, processed 132453239 words, keeping 812882 word types
2017-07-20 19:28:08,720 : INFO : PROGRESS: at sentence #13470000, processed 132537587 words, keeping 813156 word types
2017-07-20 19:28:08,759 : INFO : PROGRESS: at sentence #13480000, processed 132628760 words, keeping 813456 word types
2017-07-20 19:28:08,992 : INFO : PROGRESS: at se

2017-07-20 19:28:17,332 : INFO : PROGRESS: at sentence #14100000, processed 138581268 words, keeping 834011 word types
2017-07-20 19:28:17,365 : INFO : PROGRESS: at sentence #14110000, processed 138659644 words, keeping 834259 word types
2017-07-20 19:28:18,894 : INFO : PROGRESS: at sentence #14120000, processed 138749004 words, keeping 834505 word types
2017-07-20 19:28:18,931 : INFO : PROGRESS: at sentence #14130000, processed 138843453 words, keeping 834961 word types
2017-07-20 19:28:18,973 : INFO : PROGRESS: at sentence #14140000, processed 138946898 words, keeping 835367 word types
2017-07-20 19:28:19,013 : INFO : PROGRESS: at sentence #14150000, processed 139046120 words, keeping 835724 word types
2017-07-20 19:28:19,052 : INFO : PROGRESS: at sentence #14160000, processed 139139098 words, keeping 836081 word types
2017-07-20 19:28:19,091 : INFO : PROGRESS: at sentence #14170000, processed 139235255 words, keeping 836446 word types
2017-07-20 19:28:19,132 : INFO : PROGRESS: at se

2017-07-20 19:28:26,996 : INFO : PROGRESS: at sentence #14790000, processed 145132096 words, keeping 857058 word types
2017-07-20 19:28:27,039 : INFO : PROGRESS: at sentence #14800000, processed 145241886 words, keeping 857404 word types
2017-07-20 19:28:27,078 : INFO : PROGRESS: at sentence #14810000, processed 145340847 words, keeping 857834 word types
2017-07-20 19:28:27,118 : INFO : PROGRESS: at sentence #14820000, processed 145438171 words, keeping 858098 word types
2017-07-20 19:28:27,161 : INFO : PROGRESS: at sentence #14830000, processed 145545623 words, keeping 858697 word types
2017-07-20 19:28:28,746 : INFO : PROGRESS: at sentence #14840000, processed 145645244 words, keeping 858936 word types
2017-07-20 19:28:28,794 : INFO : PROGRESS: at sentence #14850000, processed 145770170 words, keeping 859254 word types
2017-07-20 19:28:28,834 : INFO : PROGRESS: at sentence #14860000, processed 145868511 words, keeping 859544 word types
2017-07-20 19:28:28,875 : INFO : PROGRESS: at se

2017-07-20 19:28:36,480 : INFO : PROGRESS: at sentence #15480000, processed 152018265 words, keeping 879871 word types
2017-07-20 19:28:38,015 : INFO : PROGRESS: at sentence #15490000, processed 152097072 words, keeping 880034 word types
2017-07-20 19:28:38,052 : INFO : PROGRESS: at sentence #15500000, processed 152193811 words, keeping 880381 word types
2017-07-20 19:28:38,093 : INFO : PROGRESS: at sentence #15510000, processed 152286726 words, keeping 880717 word types
2017-07-20 19:28:38,131 : INFO : PROGRESS: at sentence #15520000, processed 152380452 words, keeping 881078 word types
2017-07-20 19:28:38,171 : INFO : PROGRESS: at sentence #15530000, processed 152479893 words, keeping 881357 word types
2017-07-20 19:28:38,218 : INFO : PROGRESS: at sentence #15540000, processed 152601571 words, keeping 881715 word types
2017-07-20 19:28:38,256 : INFO : PROGRESS: at sentence #15550000, processed 152702428 words, keeping 882050 word types
2017-07-20 19:28:38,297 : INFO : PROGRESS: at se

2017-07-20 19:28:47,256 : INFO : PROGRESS: at sentence #16170000, processed 158791452 words, keeping 902786 word types
2017-07-20 19:28:47,296 : INFO : PROGRESS: at sentence #16180000, processed 158886278 words, keeping 903268 word types
2017-07-20 19:28:47,340 : INFO : PROGRESS: at sentence #16190000, processed 158983653 words, keeping 903784 word types
2017-07-20 19:28:47,382 : INFO : PROGRESS: at sentence #16200000, processed 159078916 words, keeping 904032 word types
2017-07-20 19:28:47,424 : INFO : PROGRESS: at sentence #16210000, processed 159184766 words, keeping 904719 word types
2017-07-20 19:28:47,465 : INFO : PROGRESS: at sentence #16220000, processed 159286284 words, keeping 905051 word types
2017-07-20 19:28:47,502 : INFO : PROGRESS: at sentence #16230000, processed 159375632 words, keeping 905298 word types
2017-07-20 19:28:47,549 : INFO : PROGRESS: at sentence #16240000, processed 159491557 words, keeping 905749 word types
2017-07-20 19:28:47,589 : INFO : PROGRESS: at se

2017-07-20 19:28:56,462 : INFO : PROGRESS: at sentence #16860000, processed 165768505 words, keeping 926336 word types
2017-07-20 19:28:56,516 : INFO : PROGRESS: at sentence #16870000, processed 165908500 words, keeping 926587 word types
2017-07-20 19:28:56,554 : INFO : PROGRESS: at sentence #16880000, processed 165999500 words, keeping 926771 word types
2017-07-20 19:28:56,597 : INFO : PROGRESS: at sentence #16890000, processed 166101689 words, keeping 927042 word types
2017-07-20 19:28:56,637 : INFO : PROGRESS: at sentence #16900000, processed 166194956 words, keeping 927433 word types
2017-07-20 19:28:58,216 : INFO : PROGRESS: at sentence #16910000, processed 166291833 words, keeping 927705 word types
2017-07-20 19:28:58,253 : INFO : PROGRESS: at sentence #16920000, processed 166384697 words, keeping 928024 word types
2017-07-20 19:28:58,298 : INFO : PROGRESS: at sentence #16930000, processed 166488555 words, keeping 928421 word types
2017-07-20 19:28:58,341 : INFO : PROGRESS: at se

2017-07-20 19:29:07,198 : INFO : PROGRESS: at sentence #17550000, processed 172641201 words, keeping 948260 word types
2017-07-20 19:29:07,242 : INFO : PROGRESS: at sentence #17560000, processed 172739397 words, keeping 948630 word types
2017-07-20 19:29:07,281 : INFO : PROGRESS: at sentence #17570000, processed 172838093 words, keeping 948882 word types
2017-07-20 19:29:07,324 : INFO : PROGRESS: at sentence #17580000, processed 172937118 words, keeping 949331 word types
2017-07-20 19:29:07,364 : INFO : PROGRESS: at sentence #17590000, processed 173028624 words, keeping 949706 word types
2017-07-20 19:29:07,405 : INFO : PROGRESS: at sentence #17600000, processed 173127839 words, keeping 949909 word types
2017-07-20 19:29:07,449 : INFO : PROGRESS: at sentence #17610000, processed 173234053 words, keeping 950301 word types
2017-07-20 19:29:07,496 : INFO : PROGRESS: at sentence #17620000, processed 173343432 words, keeping 950574 word types
2017-07-20 19:29:07,541 : INFO : PROGRESS: at se

2017-07-20 19:29:15,901 : INFO : PROGRESS: at sentence #18240000, processed 179410435 words, keeping 972312 word types
2017-07-20 19:29:16,197 : INFO : PROGRESS: at sentence #18250000, processed 179504973 words, keeping 972519 word types
2017-07-20 19:29:16,234 : INFO : PROGRESS: at sentence #18260000, processed 179586587 words, keeping 972696 word types
2017-07-20 19:29:17,674 : INFO : PROGRESS: at sentence #18270000, processed 179667116 words, keeping 972879 word types
2017-07-20 19:29:17,714 : INFO : PROGRESS: at sentence #18280000, processed 179770820 words, keeping 973242 word types
2017-07-20 19:29:17,758 : INFO : PROGRESS: at sentence #18290000, processed 179869628 words, keeping 973435 word types
2017-07-20 19:29:17,800 : INFO : PROGRESS: at sentence #18300000, processed 179968888 words, keeping 973634 word types
2017-07-20 19:29:17,840 : INFO : PROGRESS: at sentence #18310000, processed 180062775 words, keeping 974299 word types
2017-07-20 19:29:17,883 : INFO : PROGRESS: at se

2017-07-20 19:29:26,965 : INFO : PROGRESS: at sentence #18930000, processed 186261647 words, keeping 994131 word types
2017-07-20 19:29:27,004 : INFO : PROGRESS: at sentence #18940000, processed 186358417 words, keeping 994397 word types
2017-07-20 19:29:27,047 : INFO : PROGRESS: at sentence #18950000, processed 186455559 words, keeping 994660 word types
2017-07-20 19:29:27,089 : INFO : PROGRESS: at sentence #18960000, processed 186554953 words, keeping 995177 word types
2017-07-20 19:29:27,132 : INFO : PROGRESS: at sentence #18970000, processed 186656784 words, keeping 995545 word types
2017-07-20 19:29:27,174 : INFO : PROGRESS: at sentence #18980000, processed 186758913 words, keeping 995870 word types
2017-07-20 19:29:27,213 : INFO : PROGRESS: at sentence #18990000, processed 186845528 words, keeping 996200 word types
2017-07-20 19:29:27,253 : INFO : PROGRESS: at sentence #19000000, processed 186943590 words, keeping 996453 word types
2017-07-20 19:29:27,296 : INFO : PROGRESS: at se

2017-07-20 19:29:35,784 : INFO : PROGRESS: at sentence #19620000, processed 193010509 words, keeping 1014537 word types
2017-07-20 19:29:35,823 : INFO : PROGRESS: at sentence #19630000, processed 193106194 words, keeping 1014859 word types
2017-07-20 19:29:35,863 : INFO : PROGRESS: at sentence #19640000, processed 193201049 words, keeping 1015154 word types
2017-07-20 19:29:36,968 : INFO : PROGRESS: at sentence #19650000, processed 193300277 words, keeping 1015407 word types
2017-07-20 19:29:37,012 : INFO : PROGRESS: at sentence #19660000, processed 193406142 words, keeping 1015611 word types
2017-07-20 19:29:37,053 : INFO : PROGRESS: at sentence #19670000, processed 193507398 words, keeping 1015810 word types
2017-07-20 19:29:37,093 : INFO : PROGRESS: at sentence #19680000, processed 193605947 words, keeping 1016013 word types
2017-07-20 19:29:37,136 : INFO : PROGRESS: at sentence #19690000, processed 193711948 words, keeping 1016248 word types
2017-07-20 19:29:37,177 : INFO : PROGRES

2017-07-20 19:29:46,359 : INFO : PROGRESS: at sentence #20310000, processed 200014088 words, keeping 1035694 word types
2017-07-20 19:29:46,406 : INFO : PROGRESS: at sentence #20320000, processed 200126947 words, keeping 1035937 word types
2017-07-20 19:29:46,449 : INFO : PROGRESS: at sentence #20330000, processed 200228820 words, keeping 1036409 word types
2017-07-20 19:29:46,490 : INFO : PROGRESS: at sentence #20340000, processed 200325495 words, keeping 1036650 word types
2017-07-20 19:29:46,530 : INFO : PROGRESS: at sentence #20350000, processed 200422923 words, keeping 1037051 word types
2017-07-20 19:29:46,572 : INFO : PROGRESS: at sentence #20360000, processed 200513452 words, keeping 1037343 word types
2017-07-20 19:29:46,614 : INFO : PROGRESS: at sentence #20370000, processed 200626077 words, keeping 1037631 word types
2017-07-20 19:29:48,373 : INFO : PROGRESS: at sentence #20380000, processed 200735718 words, keeping 1037836 word types
2017-07-20 19:29:48,415 : INFO : PROGRES

2017-07-20 19:29:55,773 : INFO : PROGRESS: at sentence #21000000, processed 206918963 words, keeping 1056719 word types
2017-07-20 19:29:57,339 : INFO : PROGRESS: at sentence #21010000, processed 207010381 words, keeping 1057009 word types
2017-07-20 19:29:57,381 : INFO : PROGRESS: at sentence #21020000, processed 207104103 words, keeping 1057208 word types
2017-07-20 19:29:57,422 : INFO : PROGRESS: at sentence #21030000, processed 207205197 words, keeping 1057353 word types
2017-07-20 19:29:57,465 : INFO : PROGRESS: at sentence #21040000, processed 207308912 words, keeping 1057602 word types
2017-07-20 19:29:57,508 : INFO : PROGRESS: at sentence #21050000, processed 207410439 words, keeping 1057988 word types
2017-07-20 19:29:57,550 : INFO : PROGRESS: at sentence #21060000, processed 207511824 words, keeping 1058176 word types
2017-07-20 19:29:57,594 : INFO : PROGRESS: at sentence #21070000, processed 207619923 words, keeping 1058434 word types
2017-07-20 19:29:57,640 : INFO : PROGRES

2017-07-20 19:30:06,846 : INFO : PROGRESS: at sentence #21690000, processed 213923681 words, keeping 1076660 word types
2017-07-20 19:30:06,893 : INFO : PROGRESS: at sentence #21700000, processed 214030056 words, keeping 1076940 word types
2017-07-20 19:30:06,939 : INFO : PROGRESS: at sentence #21710000, processed 214130605 words, keeping 1077204 word types
2017-07-20 19:30:06,986 : INFO : PROGRESS: at sentence #21720000, processed 214234965 words, keeping 1077519 word types
2017-07-20 19:30:07,030 : INFO : PROGRESS: at sentence #21730000, processed 214329802 words, keeping 1077973 word types
2017-07-20 19:30:07,075 : INFO : PROGRESS: at sentence #21740000, processed 214431223 words, keeping 1078182 word types
2017-07-20 19:30:07,119 : INFO : PROGRESS: at sentence #21750000, processed 214530691 words, keeping 1078437 word types
2017-07-20 19:30:07,165 : INFO : PROGRESS: at sentence #21760000, processed 214634456 words, keeping 1078800 word types
2017-07-20 19:30:07,213 : INFO : PROGRES

2017-07-20 19:30:16,651 : INFO : PROGRESS: at sentence #22380000, processed 220679764 words, keeping 1097502 word types
2017-07-20 19:30:16,692 : INFO : PROGRESS: at sentence #22390000, processed 220778752 words, keeping 1097755 word types
2017-07-20 19:30:16,738 : INFO : PROGRESS: at sentence #22400000, processed 220877239 words, keeping 1098006 word types
2017-07-20 19:30:16,785 : INFO : PROGRESS: at sentence #22410000, processed 220978072 words, keeping 1098409 word types
2017-07-20 19:30:16,829 : INFO : PROGRESS: at sentence #22420000, processed 221076085 words, keeping 1098750 word types
2017-07-20 19:30:16,869 : INFO : PROGRESS: at sentence #22430000, processed 221172770 words, keeping 1099020 word types
2017-07-20 19:30:16,913 : INFO : PROGRESS: at sentence #22440000, processed 221265489 words, keeping 1099324 word types
2017-07-20 19:30:16,955 : INFO : PROGRESS: at sentence #22450000, processed 221361664 words, keeping 1099595 word types
2017-07-20 19:30:17,235 : INFO : PROGRES

2017-07-20 19:30:26,871 : INFO : PROGRESS: at sentence #23070000, processed 227390537 words, keeping 1116614 word types
2017-07-20 19:30:26,914 : INFO : PROGRESS: at sentence #23080000, processed 227496324 words, keeping 1116847 word types
2017-07-20 19:30:26,960 : INFO : PROGRESS: at sentence #23090000, processed 227596023 words, keeping 1117091 word types
2017-07-20 19:30:27,003 : INFO : PROGRESS: at sentence #23100000, processed 227691984 words, keeping 1117347 word types
2017-07-20 19:30:27,046 : INFO : PROGRESS: at sentence #23110000, processed 227793458 words, keeping 1117688 word types
2017-07-20 19:30:27,087 : INFO : PROGRESS: at sentence #23120000, processed 227889579 words, keeping 1117974 word types
2017-07-20 19:30:27,132 : INFO : PROGRESS: at sentence #23130000, processed 227992032 words, keeping 1118239 word types
2017-07-20 19:30:27,177 : INFO : PROGRESS: at sentence #23140000, processed 228099082 words, keeping 1118557 word types
2017-07-20 19:30:27,222 : INFO : PROGRES

2017-07-20 19:30:35,807 : INFO : PROGRESS: at sentence #23760000, processed 234136148 words, keeping 1135018 word types
2017-07-20 19:30:35,845 : INFO : PROGRESS: at sentence #23770000, processed 234217388 words, keeping 1135183 word types
2017-07-20 19:30:37,470 : INFO : PROGRESS: at sentence #23780000, processed 234303710 words, keeping 1135364 word types
2017-07-20 19:30:37,511 : INFO : PROGRESS: at sentence #23790000, processed 234406768 words, keeping 1135633 word types
2017-07-20 19:30:37,552 : INFO : PROGRESS: at sentence #23800000, processed 234501770 words, keeping 1135832 word types
2017-07-20 19:30:37,596 : INFO : PROGRESS: at sentence #23810000, processed 234597669 words, keeping 1136209 word types
2017-07-20 19:30:37,641 : INFO : PROGRESS: at sentence #23820000, processed 234703688 words, keeping 1136741 word types
2017-07-20 19:30:37,684 : INFO : PROGRESS: at sentence #23830000, processed 234798343 words, keeping 1137024 word types
2017-07-20 19:30:37,728 : INFO : PROGRES

2017-07-20 19:30:46,265 : INFO : PROGRESS: at sentence #24450000, processed 240787834 words, keeping 1154389 word types
2017-07-20 19:30:46,309 : INFO : PROGRESS: at sentence #24460000, processed 240886807 words, keeping 1154691 word types
2017-07-20 19:30:46,352 : INFO : PROGRESS: at sentence #24470000, processed 240993249 words, keeping 1155069 word types
2017-07-20 19:30:46,395 : INFO : PROGRESS: at sentence #24480000, processed 241085295 words, keeping 1155388 word types
2017-07-20 19:30:46,440 : INFO : PROGRESS: at sentence #24490000, processed 241186603 words, keeping 1155716 word types
2017-07-20 19:30:46,480 : INFO : PROGRESS: at sentence #24500000, processed 241270499 words, keeping 1156198 word types
2017-07-20 19:30:46,526 : INFO : PROGRESS: at sentence #24510000, processed 241383175 words, keeping 1156402 word types
2017-07-20 19:30:46,570 : INFO : PROGRESS: at sentence #24520000, processed 241477594 words, keeping 1156793 word types
2017-07-20 19:30:46,611 : INFO : PROGRES

2017-07-20 19:30:56,403 : INFO : PROGRESS: at sentence #25140000, processed 247670161 words, keeping 1175317 word types
2017-07-20 19:30:56,449 : INFO : PROGRESS: at sentence #25150000, processed 247776443 words, keeping 1175704 word types
2017-07-20 19:30:56,496 : INFO : PROGRESS: at sentence #25160000, processed 247889224 words, keeping 1175967 word types
2017-07-20 19:30:56,542 : INFO : PROGRESS: at sentence #25170000, processed 247996773 words, keeping 1176223 word types
2017-07-20 19:30:56,586 : INFO : PROGRESS: at sentence #25180000, processed 248089995 words, keeping 1176515 word types
2017-07-20 19:30:56,631 : INFO : PROGRESS: at sentence #25190000, processed 248183053 words, keeping 1176806 word types
2017-07-20 19:30:56,676 : INFO : PROGRESS: at sentence #25200000, processed 248284477 words, keeping 1177108 word types
2017-07-20 19:30:56,719 : INFO : PROGRESS: at sentence #25210000, processed 248387627 words, keeping 1177355 word types
2017-07-20 19:30:56,765 : INFO : PROGRES

2017-07-20 19:31:05,766 : INFO : PROGRESS: at sentence #25830000, processed 254498411 words, keeping 1193867 word types
2017-07-20 19:31:06,105 : INFO : PROGRESS: at sentence #25840000, processed 254580634 words, keeping 1193985 word types
2017-07-20 19:31:06,143 : INFO : PROGRESS: at sentence #25850000, processed 254665550 words, keeping 1194157 word types
2017-07-20 19:31:06,286 : INFO : PROGRESS: at sentence #25860000, processed 254754258 words, keeping 1194285 word types
2017-07-20 19:31:06,325 : INFO : PROGRESS: at sentence #25870000, processed 254835101 words, keeping 1194389 word types
2017-07-20 19:31:07,913 : INFO : PROGRESS: at sentence #25880000, processed 254941968 words, keeping 1194495 word types
2017-07-20 19:31:07,957 : INFO : PROGRESS: at sentence #25890000, processed 255032340 words, keeping 1194932 word types
2017-07-20 19:31:08,002 : INFO : PROGRESS: at sentence #25900000, processed 255126092 words, keeping 1195170 word types
2017-07-20 19:31:08,041 : INFO : PROGRES

2017-07-20 19:31:16,572 : INFO : PROGRESS: at sentence #26520000, processed 261325888 words, keeping 1212989 word types
2017-07-20 19:31:16,616 : INFO : PROGRESS: at sentence #26530000, processed 261430756 words, keeping 1213223 word types
2017-07-20 19:31:16,663 : INFO : PROGRESS: at sentence #26540000, processed 261538561 words, keeping 1213392 word types
2017-07-20 19:31:16,710 : INFO : PROGRESS: at sentence #26550000, processed 261632808 words, keeping 1213696 word types
2017-07-20 19:31:16,761 : INFO : PROGRESS: at sentence #26560000, processed 261744973 words, keeping 1213979 word types
2017-07-20 19:31:16,809 : INFO : PROGRESS: at sentence #26570000, processed 261849898 words, keeping 1214269 word types
2017-07-20 19:31:16,854 : INFO : PROGRESS: at sentence #26580000, processed 261943000 words, keeping 1214687 word types
2017-07-20 19:31:16,900 : INFO : PROGRESS: at sentence #26590000, processed 262039703 words, keeping 1214968 word types
2017-07-20 19:31:17,190 : INFO : PROGRES

2017-07-20 19:31:26,433 : INFO : PROGRESS: at sentence #27210000, processed 268237533 words, keeping 1230647 word types
2017-07-20 19:31:26,478 : INFO : PROGRESS: at sentence #27220000, processed 268333331 words, keeping 1230813 word types
2017-07-20 19:31:26,524 : INFO : PROGRESS: at sentence #27230000, processed 268428810 words, keeping 1230999 word types
2017-07-20 19:31:28,093 : INFO : PROGRESS: at sentence #27240000, processed 268519851 words, keeping 1231253 word types
2017-07-20 19:31:28,132 : INFO : PROGRESS: at sentence #27250000, processed 268608101 words, keeping 1231525 word types
2017-07-20 19:31:28,177 : INFO : PROGRESS: at sentence #27260000, processed 268704225 words, keeping 1232041 word types
2017-07-20 19:31:28,224 : INFO : PROGRESS: at sentence #27270000, processed 268802998 words, keeping 1232296 word types
2017-07-20 19:31:28,270 : INFO : PROGRESS: at sentence #27280000, processed 268912476 words, keeping 1232535 word types
2017-07-20 19:31:28,317 : INFO : PROGRES

2017-07-20 19:31:37,303 : INFO : PROGRESS: at sentence #27900000, processed 274811962 words, keeping 1247302 word types
2017-07-20 19:31:37,347 : INFO : PROGRESS: at sentence #27910000, processed 274912584 words, keeping 1247531 word types
2017-07-20 19:31:37,395 : INFO : PROGRESS: at sentence #27920000, processed 275017455 words, keeping 1247760 word types
2017-07-20 19:31:37,444 : INFO : PROGRESS: at sentence #27930000, processed 275126562 words, keeping 1248028 word types
2017-07-20 19:31:37,488 : INFO : PROGRESS: at sentence #27940000, processed 275219650 words, keeping 1248275 word types
2017-07-20 19:31:37,532 : INFO : PROGRESS: at sentence #27950000, processed 275314186 words, keeping 1248531 word types
2017-07-20 19:31:37,578 : INFO : PROGRESS: at sentence #27960000, processed 275413134 words, keeping 1248778 word types
2017-07-20 19:31:37,625 : INFO : PROGRESS: at sentence #27970000, processed 275515987 words, keeping 1249036 word types
2017-07-20 19:31:37,673 : INFO : PROGRES

2017-07-20 19:31:47,050 : INFO : PROGRESS: at sentence #28590000, processed 281749044 words, keeping 1265614 word types
2017-07-20 19:31:47,099 : INFO : PROGRESS: at sentence #28600000, processed 281856699 words, keeping 1265796 word types
2017-07-20 19:31:47,143 : INFO : PROGRESS: at sentence #28610000, processed 281962063 words, keeping 1266101 word types
2017-07-20 19:31:47,185 : INFO : PROGRESS: at sentence #28620000, processed 282054681 words, keeping 1266402 word types
2017-07-20 19:31:47,231 : INFO : PROGRESS: at sentence #28630000, processed 282153285 words, keeping 1266738 word types
2017-07-20 19:31:47,275 : INFO : PROGRESS: at sentence #28640000, processed 282245181 words, keeping 1266929 word types
2017-07-20 19:31:47,320 : INFO : PROGRESS: at sentence #28650000, processed 282344104 words, keeping 1267203 word types
2017-07-20 19:31:47,366 : INFO : PROGRESS: at sentence #28660000, processed 282452703 words, keeping 1267397 word types
2017-07-20 19:31:47,662 : INFO : PROGRES

2017-07-20 19:31:56,998 : INFO : PROGRESS: at sentence #29280000, processed 288664035 words, keeping 1282625 word types
2017-07-20 19:31:57,045 : INFO : PROGRESS: at sentence #29290000, processed 288767393 words, keeping 1282899 word types
2017-07-20 19:31:57,091 : INFO : PROGRESS: at sentence #29300000, processed 288878257 words, keeping 1283205 word types
2017-07-20 19:31:57,136 : INFO : PROGRESS: at sentence #29310000, processed 288978529 words, keeping 1283460 word types
2017-07-20 19:31:57,186 : INFO : PROGRESS: at sentence #29320000, processed 289079528 words, keeping 1283680 word types
2017-07-20 19:31:57,481 : INFO : PROGRESS: at sentence #29330000, processed 289181641 words, keeping 1283882 word types
2017-07-20 19:31:57,523 : INFO : PROGRESS: at sentence #29340000, processed 289267314 words, keeping 1284035 word types
2017-07-20 19:31:59,218 : INFO : PROGRESS: at sentence #29350000, processed 289362981 words, keeping 1284168 word types
2017-07-20 19:31:59,260 : INFO : PROGRES

2017-07-20 19:32:06,802 : INFO : PROGRESS: at sentence #29970000, processed 295516223 words, keeping 1299721 word types
2017-07-20 19:32:08,545 : INFO : PROGRESS: at sentence #29980000, processed 295608488 words, keeping 1300039 word types
2017-07-20 19:32:08,586 : INFO : PROGRESS: at sentence #29990000, processed 295703165 words, keeping 1300226 word types
2017-07-20 19:32:08,630 : INFO : PROGRESS: at sentence #30000000, processed 295801071 words, keeping 1300416 word types
2017-07-20 19:32:08,677 : INFO : PROGRESS: at sentence #30010000, processed 295897264 words, keeping 1300698 word types
2017-07-20 19:32:08,723 : INFO : PROGRESS: at sentence #30020000, processed 295996812 words, keeping 1301015 word types
2017-07-20 19:32:08,770 : INFO : PROGRESS: at sentence #30030000, processed 296100474 words, keeping 1302003 word types
2017-07-20 19:32:08,814 : INFO : PROGRESS: at sentence #30040000, processed 296190888 words, keeping 1302768 word types
2017-07-20 19:32:08,866 : INFO : PROGRES

2017-07-20 19:32:18,337 : INFO : PROGRESS: at sentence #30660000, processed 302502842 words, keeping 1318803 word types
2017-07-20 19:32:18,382 : INFO : PROGRESS: at sentence #30670000, processed 302598446 words, keeping 1319051 word types
2017-07-20 19:32:18,427 : INFO : PROGRESS: at sentence #30680000, processed 302695908 words, keeping 1319257 word types
2017-07-20 19:32:18,475 : INFO : PROGRESS: at sentence #30690000, processed 302806894 words, keeping 1319435 word types
2017-07-20 19:32:18,519 : INFO : PROGRESS: at sentence #30700000, processed 302902197 words, keeping 1319591 word types
2017-07-20 19:32:18,563 : INFO : PROGRESS: at sentence #30710000, processed 302997490 words, keeping 1319817 word types
2017-07-20 19:32:18,608 : INFO : PROGRESS: at sentence #30720000, processed 303094571 words, keeping 1320049 word types
2017-07-20 19:32:18,655 : INFO : PROGRESS: at sentence #30730000, processed 303194083 words, keeping 1320508 word types
2017-07-20 19:32:18,702 : INFO : PROGRES

2017-07-20 19:32:27,198 : INFO : PROGRESS: at sentence #31350000, processed 309206923 words, keeping 1335437 word types
2017-07-20 19:32:27,492 : INFO : PROGRESS: at sentence #31360000, processed 309304240 words, keeping 1335697 word types
2017-07-20 19:32:27,533 : INFO : PROGRESS: at sentence #31370000, processed 309378497 words, keeping 1335807 word types
2017-07-20 19:32:27,576 : INFO : PROGRESS: at sentence #31380000, processed 309466675 words, keeping 1335958 word types
2017-07-20 19:32:29,134 : INFO : PROGRESS: at sentence #31390000, processed 309546448 words, keeping 1336119 word types
2017-07-20 19:32:29,181 : INFO : PROGRESS: at sentence #31400000, processed 309650058 words, keeping 1336442 word types
2017-07-20 19:32:29,232 : INFO : PROGRESS: at sentence #31410000, processed 309751781 words, keeping 1336636 word types
2017-07-20 19:32:29,277 : INFO : PROGRESS: at sentence #31420000, processed 309848840 words, keeping 1336859 word types
2017-07-20 19:32:29,322 : INFO : PROGRES

2017-07-20 19:32:37,205 : INFO : PROGRESS: at sentence #32040000, processed 315944044 words, keeping 1351590 word types
2017-07-20 19:32:37,492 : INFO : PROGRESS: at sentence #32050000, processed 316034551 words, keeping 1351842 word types
2017-07-20 19:32:37,532 : INFO : PROGRESS: at sentence #32060000, processed 316120708 words, keeping 1351997 word types
2017-07-20 19:32:37,876 : INFO : PROGRESS: at sentence #32070000, processed 316206524 words, keeping 1352101 word types
2017-07-20 19:32:37,915 : INFO : PROGRESS: at sentence #32080000, processed 316289266 words, keeping 1352228 word types
2017-07-20 19:32:37,958 : INFO : PROGRESS: at sentence #32090000, processed 316374792 words, keeping 1352382 word types
2017-07-20 19:32:39,436 : INFO : PROGRESS: at sentence #32100000, processed 316466659 words, keeping 1352613 word types
2017-07-20 19:32:39,477 : INFO : PROGRESS: at sentence #32110000, processed 316559824 words, keeping 1352751 word types
2017-07-20 19:32:39,525 : INFO : PROGRES

2017-07-20 19:32:48,876 : INFO : PROGRESS: at sentence #32730000, processed 322607109 words, keeping 1367048 word types
2017-07-20 19:32:48,925 : INFO : PROGRESS: at sentence #32740000, processed 322725895 words, keeping 1367295 word types
2017-07-20 19:32:48,972 : INFO : PROGRESS: at sentence #32750000, processed 322825034 words, keeping 1367474 word types
2017-07-20 19:32:49,019 : INFO : PROGRESS: at sentence #32760000, processed 322930461 words, keeping 1367627 word types
2017-07-20 19:32:49,065 : INFO : PROGRESS: at sentence #32770000, processed 323023817 words, keeping 1367858 word types
2017-07-20 19:32:49,112 : INFO : PROGRESS: at sentence #32780000, processed 323129376 words, keeping 1368067 word types
2017-07-20 19:32:49,155 : INFO : PROGRESS: at sentence #32790000, processed 323226784 words, keeping 1368373 word types
2017-07-20 19:32:49,206 : INFO : PROGRESS: at sentence #32800000, processed 323341780 words, keeping 1368701 word types
2017-07-20 19:32:49,253 : INFO : PROGRES

2017-07-20 19:32:57,629 : INFO : PROGRESS: at sentence #33420000, processed 329415932 words, keeping 1383749 word types
2017-07-20 19:32:59,275 : INFO : PROGRESS: at sentence #33430000, processed 329511035 words, keeping 1383958 word types
2017-07-20 19:32:59,318 : INFO : PROGRESS: at sentence #33440000, processed 329607723 words, keeping 1384141 word types
2017-07-20 19:32:59,366 : INFO : PROGRESS: at sentence #33450000, processed 329704963 words, keeping 1384397 word types
2017-07-20 19:32:59,410 : INFO : PROGRESS: at sentence #33460000, processed 329802515 words, keeping 1384651 word types
2017-07-20 19:32:59,458 : INFO : PROGRESS: at sentence #33470000, processed 329903174 words, keeping 1385021 word types
2017-07-20 19:32:59,505 : INFO : PROGRESS: at sentence #33480000, processed 329998271 words, keeping 1385322 word types
2017-07-20 19:32:59,553 : INFO : PROGRESS: at sentence #33490000, processed 330100889 words, keeping 1385609 word types
2017-07-20 19:32:59,598 : INFO : PROGRES

2017-07-20 19:33:09,055 : INFO : PROGRESS: at sentence #34110000, processed 336274689 words, keeping 1401349 word types
2017-07-20 19:33:09,103 : INFO : PROGRESS: at sentence #34120000, processed 336384021 words, keeping 1401561 word types
2017-07-20 19:33:09,149 : INFO : PROGRESS: at sentence #34130000, processed 336481662 words, keeping 1401764 word types
2017-07-20 19:33:09,197 : INFO : PROGRESS: at sentence #34140000, processed 336582500 words, keeping 1401993 word types
2017-07-20 19:33:09,246 : INFO : PROGRESS: at sentence #34150000, processed 336690640 words, keeping 1402202 word types
2017-07-20 19:33:09,294 : INFO : PROGRESS: at sentence #34160000, processed 336785991 words, keeping 1402399 word types
2017-07-20 19:33:09,346 : INFO : PROGRESS: at sentence #34170000, processed 336899043 words, keeping 1402611 word types
2017-07-20 19:33:09,400 : INFO : PROGRESS: at sentence #34180000, processed 337030198 words, keeping 1402926 word types
2017-07-20 19:33:09,449 : INFO : PROGRES

2017-07-20 19:33:19,541 : INFO : PROGRESS: at sentence #34800000, processed 343224903 words, keeping 1417712 word types
2017-07-20 19:33:19,582 : INFO : PROGRESS: at sentence #34810000, processed 343312738 words, keeping 1417862 word types
2017-07-20 19:33:19,627 : INFO : PROGRESS: at sentence #34820000, processed 343405878 words, keeping 1418111 word types
2017-07-20 19:33:19,675 : INFO : PROGRESS: at sentence #34830000, processed 343505641 words, keeping 1418322 word types
2017-07-20 19:33:19,722 : INFO : PROGRESS: at sentence #34840000, processed 343608538 words, keeping 1418492 word types
2017-07-20 19:33:19,769 : INFO : PROGRESS: at sentence #34850000, processed 343707420 words, keeping 1418723 word types
2017-07-20 19:33:19,815 : INFO : PROGRESS: at sentence #34860000, processed 343808447 words, keeping 1418917 word types
2017-07-20 19:33:19,863 : INFO : PROGRESS: at sentence #34870000, processed 343906028 words, keeping 1419111 word types
2017-07-20 19:33:19,909 : INFO : PROGRES

2017-07-20 19:33:28,704 : INFO : PROGRESS: at sentence #35490000, processed 350087150 words, keeping 1433859 word types
2017-07-20 19:33:28,747 : INFO : PROGRESS: at sentence #35500000, processed 350164048 words, keeping 1434018 word types
2017-07-20 19:33:28,998 : INFO : PROGRESS: at sentence #35510000, processed 350249310 words, keeping 1434172 word types
2017-07-20 19:33:29,037 : INFO : PROGRESS: at sentence #35520000, processed 350322179 words, keeping 1434303 word types
2017-07-20 19:33:29,077 : INFO : PROGRESS: at sentence #35530000, processed 350403564 words, keeping 1434463 word types
2017-07-20 19:33:30,122 : INFO : PROGRESS: at sentence #35540000, processed 350501523 words, keeping 1434571 word types
2017-07-20 19:33:30,169 : INFO : PROGRESS: at sentence #35550000, processed 350607819 words, keeping 1434666 word types
2017-07-20 19:33:30,215 : INFO : PROGRESS: at sentence #35560000, processed 350712444 words, keeping 1434789 word types
2017-07-20 19:33:30,260 : INFO : PROGRES

2017-07-20 19:33:39,641 : INFO : PROGRESS: at sentence #36180000, processed 357028809 words, keeping 1450244 word types
2017-07-20 19:33:39,692 : INFO : PROGRESS: at sentence #36190000, processed 357137482 words, keeping 1450578 word types
2017-07-20 19:33:39,740 : INFO : PROGRESS: at sentence #36200000, processed 357244326 words, keeping 1450841 word types
2017-07-20 19:33:39,788 : INFO : PROGRESS: at sentence #36210000, processed 357339707 words, keeping 1451085 word types
2017-07-20 19:33:39,834 : INFO : PROGRESS: at sentence #36220000, processed 357434501 words, keeping 1451442 word types
2017-07-20 19:33:39,883 : INFO : PROGRESS: at sentence #36230000, processed 357537206 words, keeping 1451653 word types
2017-07-20 19:33:39,930 : INFO : PROGRESS: at sentence #36240000, processed 357631389 words, keeping 1451880 word types
2017-07-20 19:33:41,673 : INFO : PROGRESS: at sentence #36250000, processed 357735299 words, keeping 1452152 word types
2017-07-20 19:33:41,718 : INFO : PROGRES

2017-07-20 19:33:49,234 : INFO : PROGRESS: at sentence #36870000, processed 363673503 words, keeping 1465775 word types
2017-07-20 19:33:50,696 : INFO : PROGRESS: at sentence #36880000, processed 363778714 words, keeping 1465987 word types
2017-07-20 19:33:50,740 : INFO : PROGRESS: at sentence #36890000, processed 363882112 words, keeping 1466252 word types
2017-07-20 19:33:50,786 : INFO : PROGRESS: at sentence #36900000, processed 363977293 words, keeping 1466421 word types
2017-07-20 19:33:50,834 : INFO : PROGRESS: at sentence #36910000, processed 364074731 words, keeping 1466612 word types
2017-07-20 19:33:50,882 : INFO : PROGRESS: at sentence #36920000, processed 364178267 words, keeping 1466768 word types
2017-07-20 19:33:50,932 : INFO : PROGRESS: at sentence #36930000, processed 364288901 words, keeping 1466973 word types
2017-07-20 19:33:50,978 : INFO : PROGRESS: at sentence #36940000, processed 364385976 words, keeping 1467218 word types
2017-07-20 19:33:51,025 : INFO : PROGRES

2017-07-20 19:34:00,484 : INFO : PROGRESS: at sentence #37560000, processed 370473658 words, keeping 1480554 word types
2017-07-20 19:34:00,528 : INFO : PROGRESS: at sentence #37570000, processed 370571483 words, keeping 1480704 word types
2017-07-20 19:34:00,577 : INFO : PROGRESS: at sentence #37580000, processed 370668764 words, keeping 1480861 word types
2017-07-20 19:34:00,622 : INFO : PROGRESS: at sentence #37590000, processed 370766020 words, keeping 1481076 word types
2017-07-20 19:34:00,668 : INFO : PROGRESS: at sentence #37600000, processed 370867373 words, keeping 1481224 word types
2017-07-20 19:34:00,714 : INFO : PROGRESS: at sentence #37610000, processed 370965649 words, keeping 1481400 word types
2017-07-20 19:34:00,765 : INFO : PROGRESS: at sentence #37620000, processed 371074717 words, keeping 1481572 word types
2017-07-20 19:34:00,811 : INFO : PROGRESS: at sentence #37630000, processed 371175206 words, keeping 1481713 word types
2017-07-20 19:34:00,857 : INFO : PROGRES

2017-07-20 19:34:09,621 : INFO : PROGRESS: at sentence #38250000, processed 377116422 words, keeping 1495475 word types
2017-07-20 19:34:09,667 : INFO : PROGRESS: at sentence #38260000, processed 377197384 words, keeping 1495557 word types
2017-07-20 19:34:09,902 : INFO : PROGRESS: at sentence #38270000, processed 377277659 words, keeping 1495725 word types
2017-07-20 19:34:09,945 : INFO : PROGRESS: at sentence #38280000, processed 377362659 words, keeping 1495882 word types
2017-07-20 19:34:10,183 : INFO : PROGRESS: at sentence #38290000, processed 377442850 words, keeping 1496007 word types
2017-07-20 19:34:10,227 : INFO : PROGRESS: at sentence #38300000, processed 377529147 words, keeping 1496146 word types
2017-07-20 19:34:10,269 : INFO : PROGRESS: at sentence #38310000, processed 377610647 words, keeping 1496302 word types
2017-07-20 19:34:10,410 : INFO : PROGRESS: at sentence #38320000, processed 377692551 words, keeping 1496406 word types
2017-07-20 19:34:10,731 : INFO : PROGRES

2017-07-20 19:34:20,059 : INFO : PROGRESS: at sentence #38940000, processed 383764039 words, keeping 1510037 word types
2017-07-20 19:34:20,109 : INFO : PROGRESS: at sentence #38950000, processed 383866530 words, keeping 1510228 word types
2017-07-20 19:34:20,162 : INFO : PROGRESS: at sentence #38960000, processed 383986791 words, keeping 1510380 word types
2017-07-20 19:34:20,209 : INFO : PROGRESS: at sentence #38970000, processed 384081949 words, keeping 1510654 word types
2017-07-20 19:34:20,253 : INFO : PROGRESS: at sentence #38980000, processed 384172713 words, keeping 1510961 word types
2017-07-20 19:34:20,299 : INFO : PROGRESS: at sentence #38990000, processed 384269338 words, keeping 1511122 word types
2017-07-20 19:34:20,346 : INFO : PROGRESS: at sentence #39000000, processed 384366406 words, keeping 1511388 word types
2017-07-20 19:34:21,453 : INFO : PROGRESS: at sentence #39010000, processed 384472014 words, keeping 1511503 word types
2017-07-20 19:34:21,499 : INFO : PROGRES

2017-07-20 19:34:30,789 : INFO : PROGRESS: at sentence #39630000, processed 390385525 words, keeping 1523017 word types
2017-07-20 19:34:30,836 : INFO : PROGRESS: at sentence #39640000, processed 390481739 words, keeping 1523167 word types
2017-07-20 19:34:30,884 : INFO : PROGRESS: at sentence #39650000, processed 390588087 words, keeping 1523396 word types
2017-07-20 19:34:30,928 : INFO : PROGRESS: at sentence #39660000, processed 390675225 words, keeping 1523723 word types
2017-07-20 19:34:30,974 : INFO : PROGRESS: at sentence #39670000, processed 390767610 words, keeping 1523959 word types
2017-07-20 19:34:31,018 : INFO : PROGRESS: at sentence #39680000, processed 390865391 words, keeping 1524121 word types
2017-07-20 19:34:31,070 : INFO : PROGRESS: at sentence #39690000, processed 390978820 words, keeping 1524312 word types
2017-07-20 19:34:31,114 : INFO : PROGRESS: at sentence #39700000, processed 391075334 words, keeping 1524660 word types
2017-07-20 19:34:31,164 : INFO : PROGRES

2017-07-20 19:34:40,798 : INFO : PROGRESS: at sentence #40320000, processed 397181119 words, keeping 1538223 word types
2017-07-20 19:34:40,848 : INFO : PROGRESS: at sentence #40330000, processed 397287955 words, keeping 1538437 word types
2017-07-20 19:34:40,894 : INFO : PROGRESS: at sentence #40340000, processed 397386149 words, keeping 1538673 word types
2017-07-20 19:34:40,943 : INFO : PROGRESS: at sentence #40350000, processed 397493933 words, keeping 1538879 word types
2017-07-20 19:34:40,988 : INFO : PROGRESS: at sentence #40360000, processed 397581499 words, keeping 1539072 word types
2017-07-20 19:34:41,037 : INFO : PROGRESS: at sentence #40370000, processed 397683048 words, keeping 1539321 word types
2017-07-20 19:34:41,084 : INFO : PROGRESS: at sentence #40380000, processed 397785052 words, keeping 1539545 word types
2017-07-20 19:34:41,131 : INFO : PROGRESS: at sentence #40390000, processed 397888008 words, keeping 1539695 word types
2017-07-20 19:34:41,179 : INFO : PROGRES

2017-07-20 19:34:50,709 : INFO : PROGRESS: at sentence #41010000, processed 403734949 words, keeping 1550893 word types
2017-07-20 19:34:50,753 : INFO : PROGRESS: at sentence #41020000, processed 403830946 words, keeping 1551131 word types
2017-07-20 19:34:50,803 : INFO : PROGRESS: at sentence #41030000, processed 403934950 words, keeping 1551446 word types
2017-07-20 19:34:50,853 : INFO : PROGRESS: at sentence #41040000, processed 404041368 words, keeping 1551772 word types
2017-07-20 19:34:50,898 : INFO : PROGRESS: at sentence #41050000, processed 404132799 words, keeping 1551997 word types
2017-07-20 19:34:50,947 : INFO : PROGRESS: at sentence #41060000, processed 404240330 words, keeping 1552180 word types
2017-07-20 19:34:50,994 : INFO : PROGRESS: at sentence #41070000, processed 404336651 words, keeping 1552353 word types
2017-07-20 19:34:51,039 : INFO : PROGRESS: at sentence #41080000, processed 404420902 words, keeping 1552641 word types
2017-07-20 19:34:51,089 : INFO : PROGRES

2017-07-20 19:35:00,562 : INFO : PROGRESS: at sentence #41700000, processed 410622639 words, keeping 1567175 word types
2017-07-20 19:35:00,603 : INFO : PROGRESS: at sentence #41710000, processed 410712402 words, keeping 1567341 word types
2017-07-20 19:35:02,043 : INFO : PROGRESS: at sentence #41720000, processed 410815856 words, keeping 1567574 word types
2017-07-20 19:35:02,086 : INFO : PROGRESS: at sentence #41730000, processed 410908804 words, keeping 1567788 word types
2017-07-20 19:35:02,136 : INFO : PROGRESS: at sentence #41740000, processed 411007879 words, keeping 1567982 word types
2017-07-20 19:35:02,184 : INFO : PROGRESS: at sentence #41750000, processed 411106470 words, keeping 1568251 word types
2017-07-20 19:35:02,234 : INFO : PROGRESS: at sentence #41760000, processed 411212846 words, keeping 1568426 word types
2017-07-20 19:35:02,287 : INFO : PROGRESS: at sentence #41770000, processed 411340592 words, keeping 1568657 word types
2017-07-20 19:35:02,336 : INFO : PROGRES

2017-07-20 19:35:11,588 : INFO : PROGRESS: at sentence #42390000, processed 417560544 words, keeping 1583824 word types
2017-07-20 19:35:11,639 : INFO : PROGRESS: at sentence #42400000, processed 417667424 words, keeping 1584005 word types
2017-07-20 19:35:11,689 : INFO : PROGRESS: at sentence #42410000, processed 417769915 words, keeping 1584197 word types
2017-07-20 19:35:11,739 : INFO : PROGRESS: at sentence #42420000, processed 417877345 words, keeping 1585877 word types
2017-07-20 19:35:11,793 : INFO : PROGRESS: at sentence #42430000, processed 418003689 words, keeping 1586047 word types
2017-07-20 19:35:11,839 : INFO : PROGRESS: at sentence #42440000, processed 418100837 words, keeping 1586354 word types
2017-07-20 19:35:11,885 : INFO : PROGRESS: at sentence #42450000, processed 418191492 words, keeping 1586554 word types
2017-07-20 19:35:12,307 : INFO : PROGRESS: at sentence #42460000, processed 418276509 words, keeping 1586665 word types
2017-07-20 19:35:12,349 : INFO : PROGRES

2017-07-20 19:35:22,034 : INFO : PROGRESS: at sentence #43080000, processed 424279022 words, keeping 1599915 word types
2017-07-20 19:35:22,083 : INFO : PROGRESS: at sentence #43090000, processed 424378203 words, keeping 1600095 word types
2017-07-20 19:35:22,130 : INFO : PROGRESS: at sentence #43100000, processed 424476693 words, keeping 1600245 word types
2017-07-20 19:35:22,177 : INFO : PROGRESS: at sentence #43110000, processed 424568729 words, keeping 1600429 word types
2017-07-20 19:35:22,224 : INFO : PROGRESS: at sentence #43120000, processed 424662146 words, keeping 1600633 word types
2017-07-20 19:35:22,271 : INFO : PROGRESS: at sentence #43130000, processed 424757036 words, keeping 1600840 word types
2017-07-20 19:35:22,320 : INFO : PROGRESS: at sentence #43140000, processed 424854625 words, keeping 1601094 word types
2017-07-20 19:35:22,367 : INFO : PROGRESS: at sentence #43150000, processed 424953712 words, keeping 1601418 word types
2017-07-20 19:35:22,418 : INFO : PROGRES

2017-07-20 19:35:32,541 : INFO : PROGRESS: at sentence #43770000, processed 431151242 words, keeping 1614050 word types
2017-07-20 19:35:32,587 : INFO : PROGRESS: at sentence #43780000, processed 431250278 words, keeping 1614203 word types
2017-07-20 19:35:32,633 : INFO : PROGRESS: at sentence #43790000, processed 431343427 words, keeping 1614435 word types
2017-07-20 19:35:32,687 : INFO : PROGRESS: at sentence #43800000, processed 431460524 words, keeping 1617047 word types
2017-07-20 19:35:32,734 : INFO : PROGRESS: at sentence #43810000, processed 431562024 words, keeping 1617424 word types
2017-07-20 19:35:32,785 : INFO : PROGRESS: at sentence #43820000, processed 431663497 words, keeping 1617593 word types
2017-07-20 19:35:32,833 : INFO : PROGRESS: at sentence #43830000, processed 431761114 words, keeping 1617784 word types
2017-07-20 19:35:32,882 : INFO : PROGRESS: at sentence #43840000, processed 431859678 words, keeping 1618005 word types
2017-07-20 19:35:32,930 : INFO : PROGRES

2017-07-20 19:35:42,630 : INFO : PROGRESS: at sentence #44460000, processed 438015483 words, keeping 1630864 word types
2017-07-20 19:35:42,680 : INFO : PROGRESS: at sentence #44470000, processed 438119467 words, keeping 1631078 word types
2017-07-20 19:35:42,730 : INFO : PROGRESS: at sentence #44480000, processed 438223855 words, keeping 1631268 word types
2017-07-20 19:35:42,780 : INFO : PROGRESS: at sentence #44490000, processed 438327748 words, keeping 1631502 word types
2017-07-20 19:35:42,827 : INFO : PROGRESS: at sentence #44500000, processed 438432563 words, keeping 1631703 word types
2017-07-20 19:35:44,570 : INFO : PROGRESS: at sentence #44510000, processed 438526717 words, keeping 1631924 word types
2017-07-20 19:35:44,618 : INFO : PROGRESS: at sentence #44520000, processed 438621088 words, keeping 1632093 word types
2017-07-20 19:35:44,666 : INFO : PROGRESS: at sentence #44530000, processed 438715217 words, keeping 1632325 word types
2017-07-20 19:35:44,712 : INFO : PROGRES

2017-07-20 19:35:52,851 : INFO : PROGRESS: at sentence #45150000, processed 444882459 words, keeping 1644501 word types
2017-07-20 19:35:52,897 : INFO : PROGRESS: at sentence #45160000, processed 444981617 words, keeping 1644772 word types
2017-07-20 19:35:53,166 : INFO : PROGRESS: at sentence #45170000, processed 445060744 words, keeping 1644919 word types
2017-07-20 19:35:53,209 : INFO : PROGRESS: at sentence #45180000, processed 445144904 words, keeping 1645039 word types
2017-07-20 19:35:53,546 : INFO : PROGRESS: at sentence #45190000, processed 445228663 words, keeping 1645143 word types
2017-07-20 19:35:53,591 : INFO : PROGRESS: at sentence #45200000, processed 445316164 words, keeping 1645258 word types
2017-07-20 19:35:53,633 : INFO : PROGRESS: at sentence #45210000, processed 445392886 words, keeping 1645419 word types
2017-07-20 19:35:55,156 : INFO : PROGRESS: at sentence #45220000, processed 445479571 words, keeping 1645705 word types
2017-07-20 19:35:55,202 : INFO : PROGRES

2017-07-20 19:36:03,399 : INFO : PROGRESS: at sentence #45840000, processed 451687007 words, keeping 1658354 word types
2017-07-20 19:36:03,447 : INFO : PROGRESS: at sentence #45850000, processed 451775683 words, keeping 1658862 word types
2017-07-20 19:36:03,493 : INFO : PROGRESS: at sentence #45860000, processed 451871681 words, keeping 1659112 word types
2017-07-20 19:36:05,040 : INFO : PROGRESS: at sentence #45870000, processed 451974068 words, keeping 1659258 word types
2017-07-20 19:36:05,091 : INFO : PROGRESS: at sentence #45880000, processed 452078118 words, keeping 1659403 word types
2017-07-20 19:36:05,141 : INFO : PROGRESS: at sentence #45890000, processed 452180818 words, keeping 1659629 word types
2017-07-20 19:36:05,191 : INFO : PROGRESS: at sentence #45900000, processed 452286427 words, keeping 1659783 word types
2017-07-20 19:36:05,242 : INFO : PROGRESS: at sentence #45910000, processed 452390041 words, keeping 1660045 word types
2017-07-20 19:36:05,288 : INFO : PROGRES

2017-07-20 19:36:14,538 : INFO : PROGRESS: at sentence #46530000, processed 458628041 words, keeping 1673851 word types
2017-07-20 19:36:14,589 : INFO : PROGRESS: at sentence #46540000, processed 458732237 words, keeping 1674039 word types
2017-07-20 19:36:14,637 : INFO : PROGRESS: at sentence #46550000, processed 458830879 words, keeping 1674174 word types
2017-07-20 19:36:14,686 : INFO : PROGRESS: at sentence #46560000, processed 458930036 words, keeping 1674390 word types
2017-07-20 19:36:14,738 : INFO : PROGRESS: at sentence #46570000, processed 459029906 words, keeping 1674615 word types
2017-07-20 19:36:14,787 : INFO : PROGRESS: at sentence #46580000, processed 459130621 words, keeping 1674751 word types
2017-07-20 19:36:14,836 : INFO : PROGRESS: at sentence #46590000, processed 459222847 words, keeping 1675055 word types
2017-07-20 19:36:14,884 : INFO : PROGRESS: at sentence #46600000, processed 459323666 words, keeping 1675254 word types
2017-07-20 19:36:16,496 : INFO : PROGRES

2017-07-20 19:36:24,328 : INFO : PROGRESS: at sentence #47220000, processed 465397286 words, keeping 1688683 word types
2017-07-20 19:36:25,976 : INFO : PROGRESS: at sentence #47230000, processed 465489595 words, keeping 1688822 word types
2017-07-20 19:36:26,022 : INFO : PROGRESS: at sentence #47240000, processed 465588904 words, keeping 1689054 word types
2017-07-20 19:36:26,076 : INFO : PROGRESS: at sentence #47250000, processed 465689261 words, keeping 1689189 word types
2017-07-20 19:36:26,133 : INFO : PROGRESS: at sentence #47260000, processed 465824543 words, keeping 1689410 word types
2017-07-20 19:36:26,180 : INFO : PROGRESS: at sentence #47270000, processed 465923870 words, keeping 1689546 word types
2017-07-20 19:36:26,229 : INFO : PROGRESS: at sentence #47280000, processed 466017313 words, keeping 1689726 word types
2017-07-20 19:36:26,278 : INFO : PROGRESS: at sentence #47290000, processed 466118616 words, keeping 1689862 word types
2017-07-20 19:36:26,328 : INFO : PROGRES

2017-07-20 19:36:35,534 : INFO : PROGRESS: at sentence #47910000, processed 472196967 words, keeping 1702808 word types
2017-07-20 19:36:35,586 : INFO : PROGRESS: at sentence #47920000, processed 472296893 words, keeping 1703041 word types
2017-07-20 19:36:35,635 : INFO : PROGRESS: at sentence #47930000, processed 472395680 words, keeping 1703263 word types
2017-07-20 19:36:35,684 : INFO : PROGRESS: at sentence #47940000, processed 472493493 words, keeping 1703448 word types
2017-07-20 19:36:35,730 : INFO : PROGRESS: at sentence #47950000, processed 472586761 words, keeping 1703673 word types
2017-07-20 19:36:35,778 : INFO : PROGRESS: at sentence #47960000, processed 472682843 words, keeping 1703896 word types
2017-07-20 19:36:35,830 : INFO : PROGRESS: at sentence #47970000, processed 472785341 words, keeping 1704200 word types
2017-07-20 19:36:35,881 : INFO : PROGRESS: at sentence #47980000, processed 472886124 words, keeping 1704376 word types
2017-07-20 19:36:35,930 : INFO : PROGRES

2017-07-20 19:36:45,808 : INFO : PROGRESS: at sentence #48600000, processed 478987033 words, keeping 1716917 word types
2017-07-20 19:36:45,856 : INFO : PROGRESS: at sentence #48610000, processed 479089547 words, keeping 1717218 word types
2017-07-20 19:36:45,907 : INFO : PROGRESS: at sentence #48620000, processed 479184240 words, keeping 1717388 word types
2017-07-20 19:36:45,956 : INFO : PROGRESS: at sentence #48630000, processed 479283049 words, keeping 1717571 word types
2017-07-20 19:36:46,004 : INFO : PROGRESS: at sentence #48640000, processed 479378981 words, keeping 1717764 word types
2017-07-20 19:36:46,053 : INFO : PROGRESS: at sentence #48650000, processed 479476354 words, keeping 1717958 word types
2017-07-20 19:36:46,102 : INFO : PROGRESS: at sentence #48660000, processed 479572955 words, keeping 1718149 word types
2017-07-20 19:36:47,278 : INFO : PROGRESS: at sentence #48670000, processed 479672755 words, keeping 1718283 word types
2017-07-20 19:36:47,329 : INFO : PROGRES

2017-07-20 19:36:56,980 : INFO : PROGRESS: at sentence #49290000, processed 485924422 words, keeping 1729509 word types
2017-07-20 19:36:57,030 : INFO : PROGRESS: at sentence #49300000, processed 486025622 words, keeping 1729727 word types
2017-07-20 19:36:57,083 : INFO : PROGRESS: at sentence #49310000, processed 486138132 words, keeping 1729844 word types
2017-07-20 19:36:57,131 : INFO : PROGRESS: at sentence #49320000, processed 486240021 words, keeping 1730507 word types
2017-07-20 19:36:57,181 : INFO : PROGRESS: at sentence #49330000, processed 486339900 words, keeping 1730830 word types
2017-07-20 19:36:57,231 : INFO : PROGRESS: at sentence #49340000, processed 486438162 words, keeping 1731031 word types
2017-07-20 19:36:57,280 : INFO : PROGRESS: at sentence #49350000, processed 486540866 words, keeping 1731352 word types
2017-07-20 19:36:57,323 : INFO : PROGRESS: at sentence #49360000, processed 486614932 words, keeping 1731752 word types
2017-07-20 19:36:57,370 : INFO : PROGRES

2017-07-20 19:37:06,700 : INFO : PROGRESS: at sentence #49980000, processed 492800461 words, keeping 1744478 word types
2017-07-20 19:37:06,749 : INFO : PROGRESS: at sentence #49990000, processed 492897560 words, keeping 1744647 word types
2017-07-20 19:37:08,402 : INFO : PROGRESS: at sentence #50000000, processed 492999466 words, keeping 1744884 word types
2017-07-20 19:37:08,457 : INFO : PROGRESS: at sentence #50010000, processed 493115827 words, keeping 1745036 word types
2017-07-20 19:37:08,507 : INFO : PROGRESS: at sentence #50020000, processed 493215603 words, keeping 1745191 word types
2017-07-20 19:37:08,557 : INFO : PROGRESS: at sentence #50030000, processed 493318945 words, keeping 1745401 word types
2017-07-20 19:37:08,607 : INFO : PROGRESS: at sentence #50040000, processed 493417085 words, keeping 1745551 word types
2017-07-20 19:37:08,658 : INFO : PROGRESS: at sentence #50050000, processed 493523951 words, keeping 1746345 word types
2017-07-20 19:37:08,707 : INFO : PROGRES

2017-07-20 19:37:17,432 : INFO : PROGRESS: at sentence #50670000, processed 499638279 words, keeping 1757809 word types
2017-07-20 19:37:17,483 : INFO : PROGRESS: at sentence #50680000, processed 499735736 words, keeping 1758016 word types
2017-07-20 19:37:17,538 : INFO : PROGRESS: at sentence #50690000, processed 499859724 words, keeping 1758120 word types
2017-07-20 19:37:17,588 : INFO : PROGRESS: at sentence #50700000, processed 499961518 words, keeping 1758362 word types
2017-07-20 19:37:18,042 : INFO : PROGRESS: at sentence #50710000, processed 500068581 words, keeping 1758525 word types
2017-07-20 19:37:18,088 : INFO : PROGRESS: at sentence #50720000, processed 500154887 words, keeping 1758648 word types
2017-07-20 19:37:18,133 : INFO : PROGRESS: at sentence #50730000, processed 500237091 words, keeping 1758761 word types
2017-07-20 19:37:18,393 : INFO : PROGRESS: at sentence #50740000, processed 500325798 words, keeping 1758874 word types
2017-07-20 19:37:18,434 : INFO : PROGRES

2017-07-20 19:37:28,014 : INFO : PROGRESS: at sentence #51360000, processed 506371695 words, keeping 1771108 word types
2017-07-20 19:37:28,063 : INFO : PROGRESS: at sentence #51370000, processed 506467872 words, keeping 1771412 word types
2017-07-20 19:37:28,115 : INFO : PROGRESS: at sentence #51380000, processed 506571079 words, keeping 1771793 word types
2017-07-20 19:37:28,163 : INFO : PROGRESS: at sentence #51390000, processed 506665359 words, keeping 1772023 word types
2017-07-20 19:37:28,213 : INFO : PROGRESS: at sentence #51400000, processed 506763910 words, keeping 1772190 word types
2017-07-20 19:37:28,262 : INFO : PROGRESS: at sentence #51410000, processed 506855373 words, keeping 1772462 word types
2017-07-20 19:37:30,010 : INFO : PROGRESS: at sentence #51420000, processed 506951508 words, keeping 1772720 word types
2017-07-20 19:37:30,057 : INFO : PROGRESS: at sentence #51430000, processed 507046754 words, keeping 1772877 word types
2017-07-20 19:37:30,115 : INFO : PROGRES

2017-07-20 19:37:38,601 : INFO : PROGRESS: at sentence #52050000, processed 513134326 words, keeping 1785394 word types
2017-07-20 19:37:38,650 : INFO : PROGRESS: at sentence #52060000, processed 513229324 words, keeping 1785605 word types
2017-07-20 19:37:38,701 : INFO : PROGRESS: at sentence #52070000, processed 513330433 words, keeping 1785856 word types
2017-07-20 19:37:38,752 : INFO : PROGRESS: at sentence #52080000, processed 513441149 words, keeping 1786093 word types
2017-07-20 19:37:38,803 : INFO : PROGRESS: at sentence #52090000, processed 513537043 words, keeping 1786293 word types
2017-07-20 19:37:38,852 : INFO : PROGRESS: at sentence #52100000, processed 513636847 words, keeping 1786415 word types
2017-07-20 19:37:40,454 : INFO : PROGRESS: at sentence #52110000, processed 513733964 words, keeping 1786580 word types
2017-07-20 19:37:40,501 : INFO : PROGRESS: at sentence #52120000, processed 513818363 words, keeping 1786702 word types
2017-07-20 19:37:40,547 : INFO : PROGRES

2017-07-20 19:37:49,521 : INFO : PROGRESS: at sentence #52740000, processed 519779372 words, keeping 1798135 word types
2017-07-20 19:37:49,570 : INFO : PROGRESS: at sentence #52750000, processed 519872783 words, keeping 1798370 word types
2017-07-20 19:37:49,622 : INFO : PROGRESS: at sentence #52760000, processed 519980474 words, keeping 1798546 word types
2017-07-20 19:37:49,672 : INFO : PROGRESS: at sentence #52770000, processed 520075051 words, keeping 1798710 word types
2017-07-20 19:37:49,726 : INFO : PROGRESS: at sentence #52780000, processed 520185183 words, keeping 1798895 word types
2017-07-20 19:37:49,781 : INFO : PROGRESS: at sentence #52790000, processed 520298079 words, keeping 1799155 word types
2017-07-20 19:37:49,835 : INFO : PROGRESS: at sentence #52800000, processed 520410828 words, keeping 1799395 word types
2017-07-20 19:37:49,885 : INFO : PROGRESS: at sentence #52810000, processed 520508923 words, keeping 1799569 word types
2017-07-20 19:37:49,933 : INFO : PROGRES

2017-07-20 19:37:58,568 : INFO : PROGRESS: at sentence #53430000, processed 526281228 words, keeping 1809463 word types
2017-07-20 19:37:58,929 : INFO : PROGRESS: at sentence #53440000, processed 526366167 words, keeping 1809566 word types
2017-07-20 19:37:58,974 : INFO : PROGRESS: at sentence #53450000, processed 526460153 words, keeping 1809794 word types
2017-07-20 19:37:59,020 : INFO : PROGRESS: at sentence #53460000, processed 526546341 words, keeping 1809877 word types
2017-07-20 19:37:59,267 : INFO : PROGRESS: at sentence #53470000, processed 526629541 words, keeping 1809988 word types
2017-07-20 19:37:59,309 : INFO : PROGRESS: at sentence #53480000, processed 526708337 words, keeping 1810084 word types
2017-07-20 19:37:59,354 : INFO : PROGRESS: at sentence #53490000, processed 526789163 words, keeping 1810178 word types
2017-07-20 19:37:59,625 : INFO : PROGRESS: at sentence #53500000, processed 526877867 words, keeping 1810304 word types
2017-07-20 19:37:59,672 : INFO : PROGRES

2017-07-20 19:38:09,852 : INFO : PROGRESS: at sentence #54120000, processed 532929026 words, keeping 1821143 word types
2017-07-20 19:38:09,904 : INFO : PROGRESS: at sentence #54130000, processed 533030434 words, keeping 1821417 word types
2017-07-20 19:38:09,964 : INFO : PROGRESS: at sentence #54140000, processed 533150944 words, keeping 1821573 word types
2017-07-20 19:38:10,013 : INFO : PROGRESS: at sentence #54150000, processed 533248873 words, keeping 1821806 word types
2017-07-20 19:38:10,063 : INFO : PROGRESS: at sentence #54160000, processed 533348922 words, keeping 1821927 word types
2017-07-20 19:38:10,114 : INFO : PROGRESS: at sentence #54170000, processed 533447272 words, keeping 1822217 word types
2017-07-20 19:38:10,167 : INFO : PROGRESS: at sentence #54180000, processed 533545614 words, keeping 1822507 word types
2017-07-20 19:38:10,219 : INFO : PROGRESS: at sentence #54190000, processed 533645890 words, keeping 1822672 word types
2017-07-20 19:38:10,271 : INFO : PROGRES

2017-07-20 19:38:19,706 : INFO : PROGRESS: at sentence #54810000, processed 539483002 words, keeping 1833058 word types
2017-07-20 19:38:19,759 : INFO : PROGRESS: at sentence #54820000, processed 539586499 words, keeping 1833240 word types
2017-07-20 19:38:19,807 : INFO : PROGRESS: at sentence #54830000, processed 539686814 words, keeping 1833456 word types
2017-07-20 19:38:19,861 : INFO : PROGRESS: at sentence #54840000, processed 539785877 words, keeping 1833623 word types
2017-07-20 19:38:19,921 : INFO : PROGRESS: at sentence #54850000, processed 539921108 words, keeping 1833772 word types
2017-07-20 19:38:19,971 : INFO : PROGRESS: at sentence #54860000, processed 540021728 words, keeping 1833939 word types
2017-07-20 19:38:21,551 : INFO : PROGRESS: at sentence #54870000, processed 540138163 words, keeping 1834145 word types
2017-07-20 19:38:21,598 : INFO : PROGRESS: at sentence #54880000, processed 540234216 words, keeping 1834263 word types
2017-07-20 19:38:21,649 : INFO : PROGRES

2017-07-20 19:38:30,210 : INFO : PROGRESS: at sentence #55500000, processed 546382334 words, keeping 1845161 word types
2017-07-20 19:38:30,267 : INFO : PROGRESS: at sentence #55510000, processed 546482042 words, keeping 1845352 word types
2017-07-20 19:38:30,317 : INFO : PROGRESS: at sentence #55520000, processed 546586287 words, keeping 1845546 word types
2017-07-20 19:38:30,369 : INFO : PROGRESS: at sentence #55530000, processed 546689400 words, keeping 1845673 word types
2017-07-20 19:38:31,325 : INFO : PROGRESS: at sentence #55540000, processed 546784419 words, keeping 1845883 word types
2017-07-20 19:38:31,374 : INFO : PROGRESS: at sentence #55550000, processed 546889563 words, keeping 1846070 word types
2017-07-20 19:38:31,427 : INFO : PROGRESS: at sentence #55560000, processed 546995695 words, keeping 1846220 word types
2017-07-20 19:38:31,480 : INFO : PROGRESS: at sentence #55570000, processed 547105382 words, keeping 1846357 word types
2017-07-20 19:38:31,532 : INFO : PROGRES

2017-07-20 19:38:41,739 : INFO : PROGRESS: at sentence #56190000, processed 553223426 words, keeping 1858723 word types
2017-07-20 19:38:41,790 : INFO : PROGRESS: at sentence #56200000, processed 553322456 words, keeping 1858892 word types
2017-07-20 19:38:41,843 : INFO : PROGRESS: at sentence #56210000, processed 553425583 words, keeping 1859048 word types
2017-07-20 19:38:41,895 : INFO : PROGRESS: at sentence #56220000, processed 553523614 words, keeping 1859275 word types
2017-07-20 19:38:41,947 : INFO : PROGRESS: at sentence #56230000, processed 553631414 words, keeping 1859492 word types
2017-07-20 19:38:42,000 : INFO : PROGRESS: at sentence #56240000, processed 553732003 words, keeping 1859676 word types
2017-07-20 19:38:42,047 : INFO : PROGRESS: at sentence #56250000, processed 553824698 words, keeping 1859841 word types
2017-07-20 19:38:42,102 : INFO : PROGRESS: at sentence #56260000, processed 553935906 words, keeping 1860035 word types
2017-07-20 19:38:42,153 : INFO : PROGRES

2017-07-20 19:38:52,052 : INFO : PROGRESS: at sentence #56880000, processed 560030214 words, keeping 1869831 word types
2017-07-20 19:38:52,108 : INFO : PROGRESS: at sentence #56890000, processed 560135707 words, keeping 1870058 word types
2017-07-20 19:38:52,161 : INFO : PROGRESS: at sentence #56900000, processed 560234606 words, keeping 1870284 word types
2017-07-20 19:38:52,217 : INFO : PROGRESS: at sentence #56910000, processed 560334100 words, keeping 1870441 word types
2017-07-20 19:38:52,269 : INFO : PROGRESS: at sentence #56920000, processed 560427884 words, keeping 1870564 word types
2017-07-20 19:38:52,321 : INFO : PROGRESS: at sentence #56930000, processed 560540423 words, keeping 1870805 word types
2017-07-20 19:38:52,372 : INFO : PROGRESS: at sentence #56940000, processed 560637718 words, keeping 1871002 word types
2017-07-20 19:38:52,424 : INFO : PROGRESS: at sentence #56950000, processed 560737483 words, keeping 1871150 word types
2017-07-20 19:38:53,989 : INFO : PROGRES

2017-07-20 19:39:02,312 : INFO : PROGRESS: at sentence #57570000, processed 566960776 words, keeping 1882566 word types
2017-07-20 19:39:02,361 : INFO : PROGRESS: at sentence #57580000, processed 567050642 words, keeping 1882657 word types
2017-07-20 19:39:02,407 : INFO : PROGRESS: at sentence #57590000, processed 567131909 words, keeping 1882763 word types
2017-07-20 19:39:03,965 : INFO : PROGRESS: at sentence #57600000, processed 567242546 words, keeping 1882953 word types
2017-07-20 19:39:04,014 : INFO : PROGRESS: at sentence #57610000, processed 567345442 words, keeping 1883128 word types
2017-07-20 19:39:04,068 : INFO : PROGRESS: at sentence #57620000, processed 567447229 words, keeping 1883426 word types
2017-07-20 19:39:04,119 : INFO : PROGRESS: at sentence #57630000, processed 567543615 words, keeping 1883627 word types
2017-07-20 19:39:04,168 : INFO : PROGRESS: at sentence #57640000, processed 567644402 words, keeping 1883804 word types
2017-07-20 19:39:04,221 : INFO : PROGRES

2017-07-20 19:39:13,765 : INFO : PROGRESS: at sentence #58260000, processed 573794891 words, keeping 1894395 word types
2017-07-20 19:39:13,815 : INFO : PROGRESS: at sentence #58270000, processed 573890399 words, keeping 1894581 word types
2017-07-20 19:39:13,869 : INFO : PROGRESS: at sentence #58280000, processed 573995921 words, keeping 1894735 word types
2017-07-20 19:39:13,924 : INFO : PROGRESS: at sentence #58290000, processed 574114183 words, keeping 1894872 word types
2017-07-20 19:39:13,974 : INFO : PROGRESS: at sentence #58300000, processed 574203330 words, keeping 1895031 word types
2017-07-20 19:39:14,027 : INFO : PROGRESS: at sentence #58310000, processed 574302673 words, keeping 1895154 word types
2017-07-20 19:39:14,079 : INFO : PROGRESS: at sentence #58320000, processed 574401359 words, keeping 1895347 word types
2017-07-20 19:39:14,131 : INFO : PROGRESS: at sentence #58330000, processed 574494770 words, keeping 1895521 word types
2017-07-20 19:39:14,184 : INFO : PROGRES

2017-07-20 19:39:24,598 : INFO : PROGRESS: at sentence #58950000, processed 580736578 words, keeping 1907932 word types
2017-07-20 19:39:24,649 : INFO : PROGRESS: at sentence #58960000, processed 580828685 words, keeping 1908103 word types
2017-07-20 19:39:24,704 : INFO : PROGRESS: at sentence #58970000, processed 580927776 words, keeping 1908251 word types
2017-07-20 19:39:24,760 : INFO : PROGRESS: at sentence #58980000, processed 581037328 words, keeping 1908421 word types
2017-07-20 19:39:24,811 : INFO : PROGRESS: at sentence #58990000, processed 581135088 words, keeping 1908610 word types
2017-07-20 19:39:24,867 : INFO : PROGRESS: at sentence #59000000, processed 581254423 words, keeping 1908900 word types
2017-07-20 19:39:24,920 : INFO : PROGRESS: at sentence #59010000, processed 581360098 words, keeping 1909061 word types
2017-07-20 19:39:24,973 : INFO : PROGRESS: at sentence #59020000, processed 581457313 words, keeping 1909233 word types
2017-07-20 19:39:25,023 : INFO : PROGRES

2017-07-20 19:39:35,114 : INFO : PROGRESS: at sentence #59640000, processed 587595987 words, keeping 1920482 word types
2017-07-20 19:39:35,169 : INFO : PROGRESS: at sentence #59650000, processed 587698976 words, keeping 1920680 word types
2017-07-20 19:39:35,230 : INFO : PROGRESS: at sentence #59660000, processed 587798525 words, keeping 1920826 word types
2017-07-20 19:39:35,289 : INFO : PROGRESS: at sentence #59670000, processed 587905669 words, keeping 1921005 word types
2017-07-20 19:39:35,339 : INFO : PROGRESS: at sentence #59680000, processed 588003333 words, keeping 1921342 word types
2017-07-20 19:39:35,395 : INFO : PROGRESS: at sentence #59690000, processed 588116643 words, keeping 1921431 word types
2017-07-20 19:39:35,448 : INFO : PROGRESS: at sentence #59700000, processed 588214724 words, keeping 1921617 word types
2017-07-20 19:39:35,499 : INFO : PROGRESS: at sentence #59710000, processed 588319039 words, keeping 1921818 word types
2017-07-20 19:39:35,934 : INFO : PROGRES

2017-07-20 19:39:46,350 : INFO : PROGRESS: at sentence #60330000, processed 594314947 words, keeping 1932003 word types
2017-07-20 19:39:46,403 : INFO : PROGRESS: at sentence #60340000, processed 594415344 words, keeping 1932127 word types
2017-07-20 19:39:46,463 : INFO : PROGRESS: at sentence #60350000, processed 594537681 words, keeping 1932229 word types
2017-07-20 19:39:46,515 : INFO : PROGRESS: at sentence #60360000, processed 594636483 words, keeping 1932480 word types
2017-07-20 19:39:46,566 : INFO : PROGRESS: at sentence #60370000, processed 594728962 words, keeping 1932630 word types
2017-07-20 19:39:46,615 : INFO : PROGRESS: at sentence #60380000, processed 594833776 words, keeping 1932839 word types
2017-07-20 19:39:46,670 : INFO : PROGRESS: at sentence #60390000, processed 594937699 words, keeping 1933003 word types
2017-07-20 19:39:46,721 : INFO : PROGRESS: at sentence #60400000, processed 595034940 words, keeping 1933187 word types
2017-07-20 19:39:46,774 : INFO : PROGRES

2017-07-20 19:39:57,023 : INFO : PROGRESS: at sentence #61020000, processed 601136276 words, keeping 1944691 word types
2017-07-20 19:39:57,078 : INFO : PROGRESS: at sentence #61030000, processed 601248736 words, keeping 1945513 word types
2017-07-20 19:39:57,130 : INFO : PROGRESS: at sentence #61040000, processed 601344199 words, keeping 1945764 word types
2017-07-20 19:39:57,181 : INFO : PROGRESS: at sentence #61050000, processed 601447270 words, keeping 1945935 word types
2017-07-20 19:39:57,235 : INFO : PROGRESS: at sentence #61060000, processed 601553945 words, keeping 1946084 word types
2017-07-20 19:39:57,287 : INFO : PROGRESS: at sentence #61070000, processed 601655413 words, keeping 1946299 word types
2017-07-20 19:39:57,339 : INFO : PROGRESS: at sentence #61080000, processed 601752741 words, keeping 1946478 word types
2017-07-20 19:39:57,396 : INFO : PROGRESS: at sentence #61090000, processed 601864022 words, keeping 1946617 word types
2017-07-20 19:39:57,447 : INFO : PROGRES

2017-07-20 19:40:07,259 : INFO : PROGRESS: at sentence #61710000, processed 608069609 words, keeping 1957826 word types
2017-07-20 19:40:07,315 : INFO : PROGRESS: at sentence #61720000, processed 608175345 words, keeping 1958172 word types
2017-07-20 19:40:07,368 : INFO : PROGRESS: at sentence #61730000, processed 608278170 words, keeping 1958351 word types
2017-07-20 19:40:07,421 : INFO : PROGRESS: at sentence #61740000, processed 608378814 words, keeping 1958515 word types
2017-07-20 19:40:07,473 : INFO : PROGRESS: at sentence #61750000, processed 608478369 words, keeping 1958709 word types
2017-07-20 19:40:07,524 : INFO : PROGRESS: at sentence #61760000, processed 608577606 words, keeping 1959046 word types
2017-07-20 19:40:09,027 : INFO : PROGRESS: at sentence #61770000, processed 608673127 words, keeping 1959335 word types
2017-07-20 19:40:09,079 : INFO : PROGRESS: at sentence #61780000, processed 608770949 words, keeping 1959511 word types
2017-07-20 19:40:09,131 : INFO : PROGRES

2017-07-20 19:40:19,060 : INFO : PROGRESS: at sentence #62400000, processed 614975449 words, keeping 1970514 word types
2017-07-20 19:40:19,115 : INFO : PROGRESS: at sentence #62410000, processed 615074558 words, keeping 1970634 word types
2017-07-20 19:40:19,172 : INFO : PROGRESS: at sentence #62420000, processed 615198054 words, keeping 1970861 word types
2017-07-20 19:40:19,226 : INFO : PROGRESS: at sentence #62430000, processed 615314196 words, keeping 1971009 word types
2017-07-20 19:40:19,282 : INFO : PROGRESS: at sentence #62440000, processed 615415368 words, keeping 1971191 word types
2017-07-20 19:40:19,333 : INFO : PROGRESS: at sentence #62450000, processed 615511054 words, keeping 1971368 word types
2017-07-20 19:40:19,384 : INFO : PROGRESS: at sentence #62460000, processed 615615792 words, keeping 1971511 word types
2017-07-20 19:40:19,440 : INFO : PROGRESS: at sentence #62470000, processed 615721812 words, keeping 1971706 word types
2017-07-20 19:40:19,493 : INFO : PROGRES

2017-07-20 19:40:28,231 : INFO : PROGRESS: at sentence #63090000, processed 621741291 words, keeping 1982733 word types
2017-07-20 19:40:29,947 : INFO : PROGRESS: at sentence #63100000, processed 621838846 words, keeping 1982881 word types
2017-07-20 19:40:29,998 : INFO : PROGRESS: at sentence #63110000, processed 621939205 words, keeping 1983027 word types
2017-07-20 19:40:30,053 : INFO : PROGRESS: at sentence #63120000, processed 622034535 words, keeping 1983168 word types
2017-07-20 19:40:30,105 : INFO : PROGRESS: at sentence #63130000, processed 622137282 words, keeping 1983317 word types
2017-07-20 19:40:30,161 : INFO : PROGRESS: at sentence #63140000, processed 622246548 words, keeping 1983530 word types
2017-07-20 19:40:30,213 : INFO : PROGRESS: at sentence #63150000, processed 622347027 words, keeping 1983637 word types
2017-07-20 19:40:30,267 : INFO : PROGRESS: at sentence #63160000, processed 622448183 words, keeping 1983885 word types
2017-07-20 19:40:30,320 : INFO : PROGRES

2017-07-20 19:40:40,445 : INFO : PROGRESS: at sentence #63780000, processed 628638433 words, keeping 1994810 word types
2017-07-20 19:40:40,497 : INFO : PROGRESS: at sentence #63790000, processed 628735827 words, keeping 1995015 word types
2017-07-20 19:40:40,552 : INFO : PROGRESS: at sentence #63800000, processed 628844475 words, keeping 1995172 word types
2017-07-20 19:40:40,601 : INFO : PROGRESS: at sentence #63810000, processed 628942299 words, keeping 1995382 word types
2017-07-20 19:40:40,655 : INFO : PROGRESS: at sentence #63820000, processed 629038765 words, keeping 1995574 word types
2017-07-20 19:40:40,709 : INFO : PROGRESS: at sentence #63830000, processed 629138916 words, keeping 1995925 word types
2017-07-20 19:40:40,759 : INFO : PROGRESS: at sentence #63840000, processed 629242863 words, keeping 1996088 word types
2017-07-20 19:40:40,811 : INFO : PROGRESS: at sentence #63850000, processed 629342346 words, keeping 1996181 word types
2017-07-20 19:40:40,861 : INFO : PROGRES

2017-07-20 19:40:50,463 : INFO : PROGRESS: at sentence #64470000, processed 635269795 words, keeping 2005555 word types
2017-07-20 19:40:50,516 : INFO : PROGRESS: at sentence #64480000, processed 635367007 words, keeping 2005704 word types
2017-07-20 19:40:50,569 : INFO : PROGRESS: at sentence #64490000, processed 635465070 words, keeping 2005862 word types
2017-07-20 19:40:50,624 : INFO : PROGRESS: at sentence #64500000, processed 635572404 words, keeping 2005947 word types
2017-07-20 19:40:50,676 : INFO : PROGRESS: at sentence #64510000, processed 635672002 words, keeping 2006064 word types
2017-07-20 19:40:50,726 : INFO : PROGRESS: at sentence #64520000, processed 635762052 words, keeping 2006304 word types
2017-07-20 19:40:50,779 : INFO : PROGRESS: at sentence #64530000, processed 635861046 words, keeping 2006760 word types
2017-07-20 19:40:51,084 : INFO : PROGRESS: at sentence #64540000, processed 635949489 words, keeping 2006934 word types
2017-07-20 19:40:51,136 : INFO : PROGRES

2017-07-20 19:41:02,185 : INFO : PROGRESS: at sentence #65160000, processed 642151887 words, keeping 2016484 word types
2017-07-20 19:41:02,234 : INFO : PROGRESS: at sentence #65170000, processed 642240945 words, keeping 2016585 word types
2017-07-20 19:41:02,285 : INFO : PROGRESS: at sentence #65180000, processed 642332609 words, keeping 2016788 word types
2017-07-20 19:41:02,335 : INFO : PROGRESS: at sentence #65190000, processed 642425242 words, keeping 2016941 word types
2017-07-20 19:41:02,391 : INFO : PROGRESS: at sentence #65200000, processed 642522670 words, keeping 2017143 word types
2017-07-20 19:41:02,443 : INFO : PROGRESS: at sentence #65210000, processed 642621688 words, keeping 2017313 word types
2017-07-20 19:41:02,494 : INFO : PROGRESS: at sentence #65220000, processed 642721976 words, keeping 2017669 word types
2017-07-20 19:41:02,546 : INFO : PROGRESS: at sentence #65230000, processed 642819185 words, keeping 2017814 word types
2017-07-20 19:41:02,602 : INFO : PROGRES

2017-07-20 19:41:11,797 : INFO : PROGRESS: at sentence #65850000, processed 648781391 words, keeping 2027515 word types
2017-07-20 19:41:11,847 : INFO : PROGRESS: at sentence #65860000, processed 648878131 words, keeping 2027650 word types
2017-07-20 19:41:11,901 : INFO : PROGRESS: at sentence #65870000, processed 648978389 words, keeping 2027809 word types
2017-07-20 19:41:11,957 : INFO : PROGRESS: at sentence #65880000, processed 649085469 words, keeping 2027906 word types
2017-07-20 19:41:12,013 : INFO : PROGRESS: at sentence #65890000, processed 649192407 words, keeping 2028120 word types
2017-07-20 19:41:12,068 : INFO : PROGRESS: at sentence #65900000, processed 649286956 words, keeping 2028244 word types
2017-07-20 19:41:12,119 : INFO : PROGRESS: at sentence #65910000, processed 649381961 words, keeping 2028397 word types
2017-07-20 19:41:12,579 : INFO : PROGRESS: at sentence #65920000, processed 649474514 words, keeping 2028549 word types
2017-07-20 19:41:12,629 : INFO : PROGRES

2017-07-20 19:41:22,090 : INFO : PROGRESS: at sentence #66540000, processed 655474405 words, keeping 2038168 word types
2017-07-20 19:41:22,145 : INFO : PROGRESS: at sentence #66550000, processed 655572093 words, keeping 2038332 word types
2017-07-20 19:41:22,198 : INFO : PROGRESS: at sentence #66560000, processed 655668128 words, keeping 2038479 word types
2017-07-20 19:41:22,257 : INFO : PROGRESS: at sentence #66570000, processed 655778430 words, keeping 2038593 word types
2017-07-20 19:41:22,710 : INFO : PROGRESS: at sentence #66580000, processed 655873012 words, keeping 2038761 word types
2017-07-20 19:41:22,755 : INFO : PROGRESS: at sentence #66590000, processed 655956546 words, keeping 2038859 word types
2017-07-20 19:41:22,806 : INFO : PROGRESS: at sentence #66600000, processed 656044775 words, keeping 2038958 word types
2017-07-20 19:41:24,358 : INFO : PROGRESS: at sentence #66610000, processed 656160026 words, keeping 2039059 word types
2017-07-20 19:41:24,407 : INFO : PROGRES

2017-07-20 19:41:33,647 : INFO : PROGRESS: at sentence #67230000, processed 662211415 words, keeping 2050140 word types
2017-07-20 19:41:33,697 : INFO : PROGRESS: at sentence #67240000, processed 662309574 words, keeping 2050479 word types
2017-07-20 19:41:33,754 : INFO : PROGRESS: at sentence #67250000, processed 662416447 words, keeping 2050660 word types
2017-07-20 19:41:33,803 : INFO : PROGRESS: at sentence #67260000, processed 662507515 words, keeping 2050848 word types
2017-07-20 19:41:33,861 : INFO : PROGRESS: at sentence #67270000, processed 662626533 words, keeping 2051105 word types
2017-07-20 19:41:33,913 : INFO : PROGRESS: at sentence #67280000, processed 662721804 words, keeping 2051291 word types
2017-07-20 19:41:33,966 : INFO : PROGRESS: at sentence #67290000, processed 662825689 words, keeping 2051492 word types
2017-07-20 19:41:34,019 : INFO : PROGRESS: at sentence #67300000, processed 662916549 words, keeping 2051613 word types
2017-07-20 19:41:34,069 : INFO : PROGRES

2017-07-20 19:41:44,032 : INFO : PROGRESS: at sentence #67920000, processed 669099035 words, keeping 2062303 word types
2017-07-20 19:41:44,082 : INFO : PROGRESS: at sentence #67930000, processed 669195462 words, keeping 2062428 word types
2017-07-20 19:41:44,137 : INFO : PROGRESS: at sentence #67940000, processed 669298141 words, keeping 2062510 word types
2017-07-20 19:41:44,192 : INFO : PROGRESS: at sentence #67950000, processed 669404601 words, keeping 2062732 word types
2017-07-20 19:41:44,243 : INFO : PROGRESS: at sentence #67960000, processed 669504787 words, keeping 2062903 word types
2017-07-20 19:41:44,297 : INFO : PROGRESS: at sentence #67970000, processed 669604642 words, keeping 2063108 word types
2017-07-20 19:41:44,354 : INFO : PROGRESS: at sentence #67980000, processed 669710383 words, keeping 2063238 word types
2017-07-20 19:41:44,407 : INFO : PROGRESS: at sentence #67990000, processed 669806383 words, keeping 2063451 word types
2017-07-20 19:41:46,194 : INFO : PROGRES

2017-07-20 19:41:54,658 : INFO : PROGRESS: at sentence #68610000, processed 676083822 words, keeping 2073992 word types
2017-07-20 19:41:54,714 : INFO : PROGRESS: at sentence #68620000, processed 676181108 words, keeping 2074273 word types
2017-07-20 19:41:55,020 : INFO : PROGRESS: at sentence #68630000, processed 676267954 words, keeping 2074415 word types
2017-07-20 19:41:55,067 : INFO : PROGRESS: at sentence #68640000, processed 676357694 words, keeping 2074559 word types
2017-07-20 19:41:55,327 : INFO : PROGRESS: at sentence #68650000, processed 676448328 words, keeping 2074666 word types
2017-07-20 19:41:55,375 : INFO : PROGRESS: at sentence #68660000, processed 676537091 words, keeping 2074805 word types
2017-07-20 19:41:55,425 : INFO : PROGRESS: at sentence #68670000, processed 676623419 words, keeping 2074917 word types
2017-07-20 19:41:55,708 : INFO : PROGRESS: at sentence #68680000, processed 676732157 words, keeping 2075078 word types
2017-07-20 19:41:55,759 : INFO : PROGRES

2017-07-20 19:42:05,918 : INFO : PROGRESS: at sentence #69300000, processed 682831346 words, keeping 2085385 word types
2017-07-20 19:42:05,974 : INFO : PROGRESS: at sentence #69310000, processed 682933811 words, keeping 2085595 word types
2017-07-20 19:42:06,029 : INFO : PROGRESS: at sentence #69320000, processed 683030707 words, keeping 2085958 word types
2017-07-20 19:42:06,086 : INFO : PROGRESS: at sentence #69330000, processed 683149715 words, keeping 2086325 word types
2017-07-20 19:42:06,137 : INFO : PROGRESS: at sentence #69340000, processed 683251644 words, keeping 2086573 word types
2017-07-20 19:42:06,190 : INFO : PROGRESS: at sentence #69350000, processed 683347500 words, keeping 2086820 word types
2017-07-20 19:42:06,244 : INFO : PROGRESS: at sentence #69360000, processed 683438987 words, keeping 2087132 word types
2017-07-20 19:42:06,539 : INFO : PROGRESS: at sentence #69370000, processed 683539225 words, keeping 2087219 word types
2017-07-20 19:42:06,589 : INFO : PROGRES

2017-07-20 19:42:16,989 : INFO : PROGRESS: at sentence #69990000, processed 689597574 words, keeping 2097000 word types
2017-07-20 19:42:17,046 : INFO : PROGRESS: at sentence #70000000, processed 689701519 words, keeping 2097353 word types
2017-07-20 19:42:17,096 : INFO : PROGRESS: at sentence #70010000, processed 689802102 words, keeping 2097524 word types
2017-07-20 19:42:17,149 : INFO : PROGRESS: at sentence #70020000, processed 689900867 words, keeping 2097644 word types
2017-07-20 19:42:17,204 : INFO : PROGRESS: at sentence #70030000, processed 690001091 words, keeping 2097800 word types
2017-07-20 19:42:17,268 : INFO : PROGRESS: at sentence #70040000, processed 690134095 words, keeping 2098109 word types
2017-07-20 19:42:17,320 : INFO : PROGRESS: at sentence #70050000, processed 690234680 words, keeping 2098251 word types
2017-07-20 19:42:17,373 : INFO : PROGRESS: at sentence #70060000, processed 690335369 words, keeping 2098381 word types
2017-07-20 19:42:17,426 : INFO : PROGRES

2017-07-20 19:42:28,217 : INFO : PROGRESS: at sentence #70680000, processed 696463981 words, keeping 2108357 word types
2017-07-20 19:42:28,271 : INFO : PROGRESS: at sentence #70690000, processed 696567270 words, keeping 2108476 word types
2017-07-20 19:42:28,331 : INFO : PROGRESS: at sentence #70700000, processed 696694373 words, keeping 2108619 word types
2017-07-20 19:42:28,390 : INFO : PROGRESS: at sentence #70710000, processed 696803579 words, keeping 2108753 word types
2017-07-20 19:42:28,446 : INFO : PROGRESS: at sentence #70720000, processed 696903536 words, keeping 2108998 word types
2017-07-20 19:42:28,497 : INFO : PROGRESS: at sentence #70730000, processed 696999049 words, keeping 2109165 word types
2017-07-20 19:42:28,546 : INFO : PROGRESS: at sentence #70740000, processed 697088006 words, keeping 2109263 word types
2017-07-20 19:42:28,606 : INFO : PROGRESS: at sentence #70750000, processed 697204064 words, keeping 2109394 word types
2017-07-20 19:42:28,655 : INFO : PROGRES

2017-07-20 19:42:37,787 : INFO : PROGRESS: at sentence #71370000, processed 703237500 words, keeping 2119050 word types
2017-07-20 19:42:39,371 : INFO : PROGRESS: at sentence #71380000, processed 703338761 words, keeping 2119132 word types
2017-07-20 19:42:39,422 : INFO : PROGRESS: at sentence #71390000, processed 703435460 words, keeping 2119333 word types
2017-07-20 19:42:39,476 : INFO : PROGRESS: at sentence #71400000, processed 703532559 words, keeping 2119557 word types
2017-07-20 19:42:39,529 : INFO : PROGRESS: at sentence #71410000, processed 703629202 words, keeping 2119695 word types
2017-07-20 19:42:39,587 : INFO : PROGRESS: at sentence #71420000, processed 703734913 words, keeping 2119944 word types
2017-07-20 19:42:39,642 : INFO : PROGRESS: at sentence #71430000, processed 703840141 words, keeping 2120182 word types
2017-07-20 19:42:39,694 : INFO : PROGRESS: at sentence #71440000, processed 703929030 words, keeping 2120416 word types
2017-07-20 19:42:39,747 : INFO : PROGRES

2017-07-20 19:42:50,078 : INFO : PROGRESS: at sentence #72060000, processed 710095887 words, keeping 2131166 word types
2017-07-20 19:42:50,133 : INFO : PROGRESS: at sentence #72070000, processed 710200953 words, keeping 2131373 word types
2017-07-20 19:42:50,190 : INFO : PROGRESS: at sentence #72080000, processed 710302203 words, keeping 2131567 word types
2017-07-20 19:42:50,242 : INFO : PROGRESS: at sentence #72090000, processed 710401057 words, keeping 2131733 word types
2017-07-20 19:42:50,300 : INFO : PROGRESS: at sentence #72100000, processed 710510765 words, keeping 2131844 word types
2017-07-20 19:42:50,352 : INFO : PROGRESS: at sentence #72110000, processed 710608351 words, keeping 2131995 word types
2017-07-20 19:42:50,404 : INFO : PROGRESS: at sentence #72120000, processed 710706434 words, keeping 2132170 word types
2017-07-20 19:42:50,465 : INFO : PROGRESS: at sentence #72130000, processed 710846147 words, keeping 2132349 word types
2017-07-20 19:42:50,520 : INFO : PROGRES

2017-07-20 19:42:59,364 : INFO : PROGRESS: at sentence #72750000, processed 716839920 words, keeping 2142451 word types
2017-07-20 19:43:01,219 : INFO : PROGRESS: at sentence #72760000, processed 716933156 words, keeping 2142655 word types
2017-07-20 19:43:01,271 : INFO : PROGRESS: at sentence #72770000, processed 717035611 words, keeping 2142775 word types
2017-07-20 19:43:01,325 : INFO : PROGRESS: at sentence #72780000, processed 717135875 words, keeping 2142955 word types
2017-07-20 19:43:01,379 : INFO : PROGRESS: at sentence #72790000, processed 717236302 words, keeping 2143134 word types
2017-07-20 19:43:01,433 : INFO : PROGRESS: at sentence #72800000, processed 717338074 words, keeping 2143292 word types
2017-07-20 19:43:01,491 : INFO : PROGRESS: at sentence #72810000, processed 717436569 words, keeping 2143577 word types
2017-07-20 19:43:01,545 : INFO : PROGRESS: at sentence #72820000, processed 717537701 words, keeping 2143732 word types
2017-07-20 19:43:01,599 : INFO : PROGRES

2017-07-20 19:43:10,645 : INFO : PROGRESS: at sentence #73440000, processed 723784639 words, keeping 2153437 word types
2017-07-20 19:43:12,221 : INFO : PROGRESS: at sentence #73450000, processed 723880789 words, keeping 2153557 word types
2017-07-20 19:43:12,276 : INFO : PROGRESS: at sentence #73460000, processed 723981950 words, keeping 2154376 word types
2017-07-20 19:43:12,335 : INFO : PROGRESS: at sentence #73470000, processed 724091532 words, keeping 2154568 word types
2017-07-20 19:43:12,387 : INFO : PROGRESS: at sentence #73480000, processed 724184715 words, keeping 2154696 word types
2017-07-20 19:43:12,446 : INFO : PROGRESS: at sentence #73490000, processed 724283365 words, keeping 2154802 word types
2017-07-20 19:43:12,503 : INFO : PROGRESS: at sentence #73500000, processed 724382918 words, keeping 2154928 word types
2017-07-20 19:43:12,562 : INFO : PROGRESS: at sentence #73510000, processed 724492807 words, keeping 2155025 word types
2017-07-20 19:43:12,612 : INFO : PROGRES

2017-07-20 19:43:22,031 : INFO : PROGRESS: at sentence #74130000, processed 730538736 words, keeping 2165129 word types
2017-07-20 19:43:22,090 : INFO : PROGRESS: at sentence #74140000, processed 730646902 words, keeping 2165279 word types
2017-07-20 19:43:22,137 : INFO : PROGRESS: at sentence #74150000, processed 730732524 words, keeping 2165570 word types
2017-07-20 19:43:22,190 : INFO : PROGRESS: at sentence #74160000, processed 730829416 words, keeping 2165682 word types
2017-07-20 19:43:22,248 : INFO : PROGRESS: at sentence #74170000, processed 730928417 words, keeping 2165892 word types
2017-07-20 19:43:22,298 : INFO : PROGRESS: at sentence #74180000, processed 731022842 words, keeping 2166076 word types
2017-07-20 19:43:23,859 : INFO : PROGRESS: at sentence #74190000, processed 731121812 words, keeping 2166210 word types
2017-07-20 19:43:23,913 : INFO : PROGRESS: at sentence #74200000, processed 731224628 words, keeping 2166477 word types
2017-07-20 19:43:23,972 : INFO : PROGRES

2017-07-20 19:43:32,443 : INFO : PROGRESS: at sentence #74820000, processed 737235117 words, keeping 2176843 word types
2017-07-20 19:43:32,497 : INFO : PROGRESS: at sentence #74830000, processed 737328308 words, keeping 2177087 word types
2017-07-20 19:43:32,551 : INFO : PROGRESS: at sentence #74840000, processed 737440592 words, keeping 2177182 word types
2017-07-20 19:43:32,850 : INFO : PROGRESS: at sentence #74850000, processed 737532063 words, keeping 2177296 word types
2017-07-20 19:43:32,900 : INFO : PROGRESS: at sentence #74860000, processed 737627294 words, keeping 2177360 word types
2017-07-20 19:43:32,953 : INFO : PROGRESS: at sentence #74870000, processed 737715530 words, keeping 2177446 word types
2017-07-20 19:43:33,297 : INFO : PROGRESS: at sentence #74880000, processed 737798319 words, keeping 2177566 word types
2017-07-20 19:43:33,347 : INFO : PROGRESS: at sentence #74890000, processed 737878544 words, keeping 2177666 word types
2017-07-20 19:43:33,494 : INFO : PROGRES

2017-07-20 19:43:44,551 : INFO : PROGRESS: at sentence #75510000, processed 744003187 words, keeping 2187374 word types
2017-07-20 19:43:44,607 : INFO : PROGRESS: at sentence #75520000, processed 744094685 words, keeping 2187534 word types
2017-07-20 19:43:44,658 : INFO : PROGRESS: at sentence #75530000, processed 744188884 words, keeping 2187638 word types
2017-07-20 19:43:44,712 : INFO : PROGRESS: at sentence #75540000, processed 744286566 words, keeping 2187852 word types
2017-07-20 19:43:44,765 : INFO : PROGRESS: at sentence #75550000, processed 744381920 words, keeping 2188003 word types
2017-07-20 19:43:44,822 : INFO : PROGRESS: at sentence #75560000, processed 744484383 words, keeping 2188276 word types
2017-07-20 19:43:44,871 : INFO : PROGRESS: at sentence #75570000, processed 744576119 words, keeping 2188405 word types
2017-07-20 19:43:44,926 : INFO : PROGRESS: at sentence #75580000, processed 744674041 words, keeping 2188531 word types
2017-07-20 19:43:44,977 : INFO : PROGRES

2017-07-20 19:43:55,094 : INFO : PROGRESS: at sentence #76200000, processed 750895652 words, keeping 2199437 word types
2017-07-20 19:43:55,149 : INFO : PROGRESS: at sentence #76210000, processed 750994451 words, keeping 2199594 word types
2017-07-20 19:43:55,203 : INFO : PROGRESS: at sentence #76220000, processed 751089301 words, keeping 2199741 word types
2017-07-20 19:43:55,255 : INFO : PROGRESS: at sentence #76230000, processed 751177971 words, keeping 2199917 word types
2017-07-20 19:43:55,313 : INFO : PROGRESS: at sentence #76240000, processed 751278215 words, keeping 2200088 word types
2017-07-20 19:43:55,368 : INFO : PROGRESS: at sentence #76250000, processed 751378261 words, keeping 2200202 word types
2017-07-20 19:43:55,425 : INFO : PROGRESS: at sentence #76260000, processed 751483281 words, keeping 2200409 word types
2017-07-20 19:43:55,484 : INFO : PROGRESS: at sentence #76270000, processed 751581145 words, keeping 2200700 word types
2017-07-20 19:43:55,539 : INFO : PROGRES

2017-07-20 19:44:06,223 : INFO : PROGRESS: at sentence #76890000, processed 757615781 words, keeping 2209941 word types
2017-07-20 19:44:06,282 : INFO : PROGRESS: at sentence #76900000, processed 757726031 words, keeping 2210136 word types
2017-07-20 19:44:06,337 : INFO : PROGRESS: at sentence #76910000, processed 757823579 words, keeping 2210327 word types
2017-07-20 19:44:06,389 : INFO : PROGRESS: at sentence #76920000, processed 757921430 words, keeping 2210517 word types
2017-07-20 19:44:06,450 : INFO : PROGRESS: at sentence #76930000, processed 758030981 words, keeping 2210634 word types
2017-07-20 19:44:06,501 : INFO : PROGRESS: at sentence #76940000, processed 758129663 words, keeping 2210763 word types
2017-07-20 19:44:06,559 : INFO : PROGRESS: at sentence #76950000, processed 758226212 words, keeping 2210876 word types
2017-07-20 19:44:06,616 : INFO : PROGRESS: at sentence #76960000, processed 758330425 words, keeping 2210955 word types
2017-07-20 19:44:06,670 : INFO : PROGRES

2017-07-20 19:44:16,263 : INFO : PROGRESS: at sentence #77580000, processed 764235224 words, keeping 2220014 word types
2017-07-20 19:44:16,320 : INFO : PROGRESS: at sentence #77590000, processed 764334198 words, keeping 2220127 word types
2017-07-20 19:44:16,375 : INFO : PROGRESS: at sentence #77600000, processed 764430150 words, keeping 2220248 word types
2017-07-20 19:44:16,430 : INFO : PROGRESS: at sentence #77610000, processed 764526604 words, keeping 2220399 word types
2017-07-20 19:44:16,485 : INFO : PROGRESS: at sentence #77620000, processed 764627186 words, keeping 2220600 word types
2017-07-20 19:44:16,542 : INFO : PROGRESS: at sentence #77630000, processed 764728538 words, keeping 2220720 word types
2017-07-20 19:44:16,594 : INFO : PROGRESS: at sentence #77640000, processed 764821795 words, keeping 2220893 word types
2017-07-20 19:44:16,896 : INFO : PROGRESS: at sentence #77650000, processed 764911809 words, keeping 2221011 word types
2017-07-20 19:44:16,944 : INFO : PROGRES

2017-07-20 19:44:27,604 : INFO : PROGRESS: at sentence #78270000, processed 770968967 words, keeping 2229895 word types
2017-07-20 19:44:27,660 : INFO : PROGRESS: at sentence #78280000, processed 771066984 words, keeping 2230111 word types
2017-07-20 19:44:27,717 : INFO : PROGRESS: at sentence #78290000, processed 771166463 words, keeping 2230292 word types
2017-07-20 19:44:27,775 : INFO : PROGRESS: at sentence #78300000, processed 771274792 words, keeping 2230460 word types
2017-07-20 19:44:27,834 : INFO : PROGRESS: at sentence #78310000, processed 771379625 words, keeping 2230652 word types
2017-07-20 19:44:27,887 : INFO : PROGRESS: at sentence #78320000, processed 771476991 words, keeping 2230971 word types
2017-07-20 19:44:27,942 : INFO : PROGRESS: at sentence #78330000, processed 771575421 words, keeping 2231098 word types
2017-07-20 19:44:27,998 : INFO : PROGRESS: at sentence #78340000, processed 771670926 words, keeping 2231272 word types
2017-07-20 19:44:28,050 : INFO : PROGRES

2017-07-20 19:44:37,558 : INFO : PROGRESS: at sentence #78960000, processed 777876898 words, keeping 2240774 word types
2017-07-20 19:44:38,006 : INFO : PROGRESS: at sentence #78970000, processed 777960822 words, keeping 2240873 word types
2017-07-20 19:44:38,053 : INFO : PROGRESS: at sentence #78980000, processed 778039887 words, keeping 2240956 word types
2017-07-20 19:44:38,326 : INFO : PROGRESS: at sentence #78990000, processed 778126982 words, keeping 2241037 word types
2017-07-20 19:44:38,374 : INFO : PROGRESS: at sentence #79000000, processed 778213451 words, keeping 2241135 word types
2017-07-20 19:44:38,431 : INFO : PROGRESS: at sentence #79010000, processed 778318501 words, keeping 2241229 word types
2017-07-20 19:44:38,704 : INFO : PROGRESS: at sentence #79020000, processed 778415784 words, keeping 2241322 word types
2017-07-20 19:44:38,753 : INFO : PROGRESS: at sentence #79030000, processed 778504777 words, keeping 2241443 word types
2017-07-20 19:44:38,806 : INFO : PROGRES

2017-07-20 19:44:49,151 : INFO : PROGRESS: at sentence #79650000, processed 784612685 words, keeping 2250857 word types
2017-07-20 19:44:49,208 : INFO : PROGRESS: at sentence #79660000, processed 784715321 words, keeping 2251135 word types
2017-07-20 19:44:49,266 : INFO : PROGRESS: at sentence #79670000, processed 784821630 words, keeping 2251251 word types
2017-07-20 19:44:49,321 : INFO : PROGRESS: at sentence #79680000, processed 784920106 words, keeping 2251408 word types
2017-07-20 19:44:49,378 : INFO : PROGRESS: at sentence #79690000, processed 785024165 words, keeping 2251833 word types
2017-07-20 19:44:49,431 : INFO : PROGRESS: at sentence #79700000, processed 785118017 words, keeping 2251951 word types
2017-07-20 19:44:49,485 : INFO : PROGRESS: at sentence #79710000, processed 785210894 words, keeping 2252170 word types
2017-07-20 19:44:49,540 : INFO : PROGRESS: at sentence #79720000, processed 785308904 words, keeping 2252346 word types
2017-07-20 19:44:49,732 : INFO : PROGRES

2017-07-20 19:45:00,553 : INFO : PROGRESS: at sentence #80340000, processed 791216716 words, keeping 2262889 word types
2017-07-20 19:45:00,611 : INFO : PROGRESS: at sentence #80350000, processed 791316408 words, keeping 2263012 word types
2017-07-20 19:45:00,670 : INFO : PROGRESS: at sentence #80360000, processed 791416916 words, keeping 2263205 word types
2017-07-20 19:45:00,730 : INFO : PROGRESS: at sentence #80370000, processed 791516970 words, keeping 2263394 word types
2017-07-20 19:45:00,794 : INFO : PROGRESS: at sentence #80380000, processed 791633563 words, keeping 2263610 word types
2017-07-20 19:45:00,856 : INFO : PROGRESS: at sentence #80390000, processed 791742742 words, keeping 2263751 word types
2017-07-20 19:45:00,916 : INFO : PROGRESS: at sentence #80400000, processed 791847418 words, keeping 2263890 word types
2017-07-20 19:45:00,975 : INFO : PROGRESS: at sentence #80410000, processed 791943343 words, keeping 2264077 word types
2017-07-20 19:45:01,041 : INFO : PROGRES

2017-07-20 19:45:12,397 : INFO : PROGRESS: at sentence #81030000, processed 798083359 words, keeping 2273564 word types
2017-07-20 19:45:12,459 : INFO : PROGRESS: at sentence #81040000, processed 798184960 words, keeping 2273664 word types
2017-07-20 19:45:12,521 : INFO : PROGRESS: at sentence #81050000, processed 798294047 words, keeping 2273853 word types
2017-07-20 19:45:12,581 : INFO : PROGRESS: at sentence #81060000, processed 798391944 words, keeping 2273958 word types
2017-07-20 19:45:12,640 : INFO : PROGRESS: at sentence #81070000, processed 798491616 words, keeping 2274145 word types
2017-07-20 19:45:12,699 : INFO : PROGRESS: at sentence #81080000, processed 798592510 words, keeping 2274283 word types
2017-07-20 19:45:12,757 : INFO : PROGRESS: at sentence #81090000, processed 798692783 words, keeping 2274457 word types
2017-07-20 19:45:12,821 : INFO : PROGRESS: at sentence #81100000, processed 798802588 words, keeping 2274592 word types
2017-07-20 19:45:12,878 : INFO : PROGRES

2017-07-20 19:45:23,665 : INFO : PROGRESS: at sentence #81720000, processed 804873249 words, keeping 2282683 word types
2017-07-20 19:45:23,723 : INFO : PROGRESS: at sentence #81730000, processed 804972108 words, keeping 2282811 word types
2017-07-20 19:45:23,779 : INFO : PROGRESS: at sentence #81740000, processed 805069109 words, keeping 2282985 word types
2017-07-20 19:45:23,834 : INFO : PROGRESS: at sentence #81750000, processed 805164775 words, keeping 2283162 word types
2017-07-20 19:45:23,889 : INFO : PROGRESS: at sentence #81760000, processed 805261738 words, keeping 2283393 word types
2017-07-20 19:45:23,947 : INFO : PROGRESS: at sentence #81770000, processed 805361852 words, keeping 2283503 word types
2017-07-20 19:45:24,001 : INFO : PROGRESS: at sentence #81780000, processed 805453127 words, keeping 2283669 word types
2017-07-20 19:45:24,057 : INFO : PROGRESS: at sentence #81790000, processed 805553257 words, keeping 2283792 word types
2017-07-20 19:45:24,124 : INFO : PROGRES

2017-07-20 19:45:34,724 : INFO : PROGRESS: at sentence #82410000, processed 811780675 words, keeping 2293916 word types
2017-07-20 19:45:34,785 : INFO : PROGRESS: at sentence #82420000, processed 811893238 words, keeping 2294037 word types
2017-07-20 19:45:34,845 : INFO : PROGRESS: at sentence #82430000, processed 811993711 words, keeping 2294168 word types
2017-07-20 19:45:34,897 : INFO : PROGRESS: at sentence #82440000, processed 812089252 words, keeping 2294301 word types
2017-07-20 19:45:35,236 : INFO : PROGRESS: at sentence #82450000, processed 812193956 words, keeping 2294413 word types
2017-07-20 19:45:35,289 : INFO : PROGRESS: at sentence #82460000, processed 812277161 words, keeping 2294547 word types
2017-07-20 19:45:36,879 : INFO : PROGRESS: at sentence #82470000, processed 812356974 words, keeping 2294603 word types
2017-07-20 19:45:36,947 : INFO : PROGRESS: at sentence #82480000, processed 812455722 words, keeping 2294712 word types
2017-07-20 19:45:37,025 : INFO : PROGRES

2017-07-20 19:45:46,531 : INFO : PROGRESS: at sentence #83100000, processed 818547140 words, keeping 2304255 word types
2017-07-20 19:45:46,589 : INFO : PROGRESS: at sentence #83110000, processed 818649946 words, keeping 2304403 word types
2017-07-20 19:45:46,648 : INFO : PROGRESS: at sentence #83120000, processed 818753631 words, keeping 2304538 word types
2017-07-20 19:45:46,988 : INFO : PROGRESS: at sentence #83130000, processed 818856914 words, keeping 2304624 word types
2017-07-20 19:45:47,042 : INFO : PROGRESS: at sentence #83140000, processed 818943145 words, keeping 2304700 word types
2017-07-20 19:45:47,104 : INFO : PROGRESS: at sentence #83150000, processed 819039508 words, keeping 2304795 word types
2017-07-20 19:45:47,389 : INFO : PROGRESS: at sentence #83160000, processed 819117981 words, keeping 2304862 word types
2017-07-20 19:45:47,448 : INFO : PROGRESS: at sentence #83170000, processed 819199352 words, keeping 2304952 word types
2017-07-20 19:45:49,050 : INFO : PROGRES

2017-07-20 19:45:58,180 : INFO : PROGRESS: at sentence #83790000, processed 825332887 words, keeping 2316191 word types
2017-07-20 19:45:58,237 : INFO : PROGRESS: at sentence #83800000, processed 825427515 words, keeping 2316307 word types
2017-07-20 19:45:58,294 : INFO : PROGRESS: at sentence #83810000, processed 825540302 words, keeping 2316501 word types
2017-07-20 19:45:58,350 : INFO : PROGRESS: at sentence #83820000, processed 825636365 words, keeping 2316598 word types
2017-07-20 19:45:58,455 : INFO : collected 2316883 word types from a corpus of 825732409 raw words and 83829845 sentences
2017-07-20 19:45:58,455 : INFO : Loading a fresh vocabulary
2017-07-20 19:46:01,133 : INFO : min_count=5 retains 721299 unique words (31% of original 2316883, drops 1595584)
2017-07-20 19:46:01,133 : INFO : min_count=5 leaves 823175224 word corpus (99% of original 825732409, drops 2557185)
2017-07-20 19:46:03,289 : INFO : deleting the raw counts dictionary of 2316883 items
2017-07-20 19:46:03,43

2017-07-20 19:47:41,894 : INFO : PROGRESS: at 0.55% examples, 266707 words/s, in_qsize 8, out_qsize 1
2017-07-20 19:47:42,926 : INFO : PROGRESS: at 0.56% examples, 268044 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:47:43,934 : INFO : PROGRESS: at 0.57% examples, 269582 words/s, in_qsize 8, out_qsize 0
2017-07-20 19:47:45,881 : INFO : PROGRESS: at 0.58% examples, 266869 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:47:46,883 : INFO : PROGRESS: at 0.59% examples, 268172 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:47:47,920 : INFO : PROGRESS: at 0.60% examples, 269448 words/s, in_qsize 6, out_qsize 1
2017-07-20 19:47:48,940 : INFO : PROGRESS: at 0.61% examples, 270739 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:47:51,125 : INFO : PROGRESS: at 0.61% examples, 266526 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:47:52,136 : INFO : PROGRESS: at 0.62% examples, 267895 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:47:53,176 : INFO : PROGRESS: at 0.63% examples, 268988 words/s, in_q

2017-07-20 19:49:20,222 : INFO : PROGRESS: at 1.22% examples, 271462 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:49:21,302 : INFO : PROGRESS: at 1.22% examples, 271193 words/s, in_qsize 8, out_qsize 1
2017-07-20 19:49:22,334 : INFO : PROGRESS: at 1.23% examples, 271517 words/s, in_qsize 0, out_qsize 0
2017-07-20 19:49:23,679 : INFO : PROGRESS: at 1.23% examples, 269712 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:49:24,679 : INFO : PROGRESS: at 1.24% examples, 270373 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:49:25,690 : INFO : PROGRESS: at 1.25% examples, 271098 words/s, in_qsize 8, out_qsize 1
2017-07-20 19:49:26,705 : INFO : PROGRESS: at 1.26% examples, 271805 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:49:28,836 : INFO : PROGRESS: at 1.27% examples, 269908 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:49:29,855 : INFO : PROGRESS: at 1.28% examples, 270577 words/s, in_qsize 8, out_qsize 1
2017-07-20 19:49:30,886 : INFO : PROGRESS: at 1.29% examples, 271259 words/s, in_q

2017-07-20 19:50:58,576 : INFO : PROGRESS: at 1.90% examples, 275204 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:50:59,583 : INFO : PROGRESS: at 1.91% examples, 275653 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:00,584 : INFO : PROGRESS: at 1.92% examples, 276139 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:02,740 : INFO : PROGRESS: at 1.93% examples, 274949 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:03,747 : INFO : PROGRESS: at 1.94% examples, 275424 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:04,768 : INFO : PROGRESS: at 1.95% examples, 275882 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:05,770 : INFO : PROGRESS: at 1.96% examples, 276322 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:07,595 : INFO : PROGRESS: at 1.96% examples, 275295 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:51:08,601 : INFO : PROGRESS: at 1.97% examples, 275693 words/s, in_qsize 8, out_qsize 0
2017-07-20 19:51:09,651 : INFO : PROGRESS: at 1.98% examples, 276117 words/s, in_q

2017-07-20 19:52:33,047 : INFO : PROGRESS: at 2.59% examples, 279643 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:34,058 : INFO : PROGRESS: at 2.60% examples, 279994 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:36,204 : INFO : PROGRESS: at 2.60% examples, 279055 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:37,212 : INFO : PROGRESS: at 2.61% examples, 279402 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:38,222 : INFO : PROGRESS: at 2.62% examples, 279745 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:39,266 : INFO : PROGRESS: at 2.63% examples, 280086 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:41,062 : INFO : PROGRESS: at 2.64% examples, 279314 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:42,069 : INFO : PROGRESS: at 2.65% examples, 279678 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:43,089 : INFO : PROGRESS: at 2.66% examples, 280009 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:52:44,091 : INFO : PROGRESS: at 2.67% examples, 280349 words/s, in_q

2017-07-20 19:54:08,276 : INFO : PROGRESS: at 3.28% examples, 282295 words/s, in_qsize 2, out_qsize 3
2017-07-20 19:54:10,419 : INFO : PROGRESS: at 3.29% examples, 281692 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:11,425 : INFO : PROGRESS: at 3.30% examples, 281965 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:12,454 : INFO : PROGRESS: at 3.31% examples, 282204 words/s, in_qsize 8, out_qsize 1
2017-07-20 19:54:13,465 : INFO : PROGRESS: at 3.32% examples, 282494 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:15,731 : INFO : PROGRESS: at 3.33% examples, 281772 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:16,737 : INFO : PROGRESS: at 3.34% examples, 282063 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:17,750 : INFO : PROGRESS: at 3.35% examples, 282308 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:18,780 : INFO : PROGRESS: at 3.36% examples, 282596 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:54:19,830 : INFO : PROGRESS: at 3.37% examples, 282670 words/s, in_q

2017-07-20 19:55:46,030 : INFO : PROGRESS: at 3.98% examples, 283425 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:47,062 : INFO : PROGRESS: at 3.99% examples, 283637 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:48,069 : INFO : PROGRESS: at 4.00% examples, 283753 words/s, in_qsize 0, out_qsize 0
2017-07-20 19:55:49,596 : INFO : PROGRESS: at 4.00% examples, 283013 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:50,637 : INFO : PROGRESS: at 4.01% examples, 283248 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:51,640 : INFO : PROGRESS: at 4.02% examples, 283473 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:52,658 : INFO : PROGRESS: at 4.02% examples, 283687 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:54,682 : INFO : PROGRESS: at 4.03% examples, 283202 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:55,687 : INFO : PROGRESS: at 4.04% examples, 283442 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:55:56,723 : INFO : PROGRESS: at 4.05% examples, 283647 words/s, in_q

2017-07-20 19:57:22,762 : INFO : PROGRESS: at 4.67% examples, 284603 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:23,791 : INFO : PROGRESS: at 4.68% examples, 284783 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:25,388 : INFO : PROGRESS: at 4.69% examples, 284558 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:26,427 : INFO : PROGRESS: at 4.70% examples, 284763 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:27,436 : INFO : PROGRESS: at 4.71% examples, 284951 words/s, in_qsize 6, out_qsize 0
2017-07-20 19:57:29,951 : INFO : PROGRESS: at 4.72% examples, 284364 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:30,955 : INFO : PROGRESS: at 4.73% examples, 284559 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:31,961 : INFO : PROGRESS: at 4.74% examples, 284746 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:32,992 : INFO : PROGRESS: at 4.75% examples, 284938 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:57:35,041 : INFO : PROGRESS: at 4.75% examples, 284496 words/s, in_q

2017-07-20 19:59:04,341 : INFO : PROGRESS: at 5.39% examples, 285888 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:06,566 : INFO : PROGRESS: at 5.40% examples, 285449 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:07,579 : INFO : PROGRESS: at 5.41% examples, 285609 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:08,605 : INFO : PROGRESS: at 5.42% examples, 285739 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:09,632 : INFO : PROGRESS: at 5.43% examples, 285910 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:10,634 : INFO : PROGRESS: at 5.44% examples, 285952 words/s, in_qsize 2, out_qsize 0
2017-07-20 19:59:11,999 : INFO : PROGRESS: at 5.44% examples, 285536 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:13,052 : INFO : PROGRESS: at 5.45% examples, 285707 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:14,056 : INFO : PROGRESS: at 5.46% examples, 285881 words/s, in_qsize 7, out_qsize 0
2017-07-20 19:59:15,068 : INFO : PROGRESS: at 5.47% examples, 286024 words/s, in_q

2017-07-20 20:00:40,338 : INFO : PROGRESS: at 6.09% examples, 286749 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:00:41,348 : INFO : PROGRESS: at 6.10% examples, 286765 words/s, in_qsize 1, out_qsize 1
2017-07-20 20:00:42,366 : INFO : PROGRESS: at 6.10% examples, 286551 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:00:43,389 : INFO : PROGRESS: at 6.11% examples, 286691 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:00:44,421 : INFO : PROGRESS: at 6.12% examples, 286827 words/s, in_qsize 0, out_qsize 0
2017-07-20 20:00:45,981 : INFO : PROGRESS: at 6.12% examples, 286368 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:00:47,038 : INFO : PROGRESS: at 6.13% examples, 286517 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:00:48,085 : INFO : PROGRESS: at 6.14% examples, 286669 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:00:49,098 : INFO : PROGRESS: at 6.15% examples, 286810 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:00:50,125 : INFO : PROGRESS: at 6.16% examples, 286761 words/s, in_q

2017-07-20 20:02:15,097 : INFO : PROGRESS: at 6.77% examples, 286968 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:16,103 : INFO : PROGRESS: at 6.78% examples, 287107 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:17,128 : INFO : PROGRESS: at 6.79% examples, 287231 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:18,170 : INFO : PROGRESS: at 6.80% examples, 287370 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:20,426 : INFO : PROGRESS: at 6.80% examples, 286973 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:21,473 : INFO : PROGRESS: at 6.81% examples, 287110 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:22,488 : INFO : PROGRESS: at 6.82% examples, 287236 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:23,537 : INFO : PROGRESS: at 6.83% examples, 287359 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:02:24,567 : INFO : PROGRESS: at 6.84% examples, 287388 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:02:25,577 : INFO : PROGRESS: at 6.85% examples, 287380 words/s, in_q

2017-07-20 20:03:53,920 : INFO : PROGRESS: at 7.48% examples, 287763 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:03:54,923 : INFO : PROGRESS: at 7.48% examples, 287786 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:03:56,555 : INFO : PROGRESS: at 7.49% examples, 287481 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:03:57,560 : INFO : PROGRESS: at 7.50% examples, 287607 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:03:58,596 : INFO : PROGRESS: at 7.51% examples, 287716 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:03:59,653 : INFO : PROGRESS: at 7.52% examples, 287832 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:04:00,691 : INFO : PROGRESS: at 7.52% examples, 287736 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:04:02,846 : INFO : PROGRESS: at 7.53% examples, 287523 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:04:03,850 : INFO : PROGRESS: at 7.54% examples, 287652 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:04:04,879 : INFO : PROGRESS: at 7.55% examples, 287762 words/s, in_q

2017-07-20 20:05:28,915 : INFO : PROGRESS: at 8.16% examples, 288147 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:05:29,955 : INFO : PROGRESS: at 8.17% examples, 288167 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:05:31,773 : INFO : PROGRESS: at 8.17% examples, 287839 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:05:32,803 : INFO : PROGRESS: at 8.18% examples, 287958 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:05:33,819 : INFO : PROGRESS: at 8.19% examples, 288062 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:05:34,827 : INFO : PROGRESS: at 8.20% examples, 288171 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:05:35,871 : INFO : PROGRESS: at 8.21% examples, 288182 words/s, in_qsize 5, out_qsize 1
2017-07-20 20:05:37,436 : INFO : PROGRESS: at 8.21% examples, 287886 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:05:38,440 : INFO : PROGRESS: at 8.22% examples, 288001 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:05:39,448 : INFO : PROGRESS: at 8.23% examples, 288107 words/s, in_q

2017-07-20 20:07:09,706 : INFO : PROGRESS: at 8.88% examples, 288278 words/s, in_qsize 6, out_qsize 1
2017-07-20 20:07:10,706 : INFO : PROGRESS: at 8.89% examples, 288378 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:11,710 : INFO : PROGRESS: at 8.90% examples, 288460 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:07:12,732 : INFO : PROGRESS: at 8.91% examples, 288554 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:14,848 : INFO : PROGRESS: at 8.91% examples, 288248 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:15,861 : INFO : PROGRESS: at 8.92% examples, 288343 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:16,867 : INFO : PROGRESS: at 8.93% examples, 288439 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:17,899 : INFO : PROGRESS: at 8.94% examples, 288538 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:18,925 : INFO : PROGRESS: at 8.95% examples, 288551 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:07:19,945 : INFO : PROGRESS: at 8.96% examples, 288557 words/s, in_q

2017-07-20 20:08:46,714 : INFO : PROGRESS: at 9.59% examples, 288763 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:08:47,716 : INFO : PROGRESS: at 9.60% examples, 288855 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:08:49,506 : INFO : PROGRESS: at 9.61% examples, 288640 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:08:50,506 : INFO : PROGRESS: at 9.62% examples, 288739 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:08:51,524 : INFO : PROGRESS: at 9.63% examples, 288827 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:08:52,541 : INFO : PROGRESS: at 9.64% examples, 288915 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:08:53,555 : INFO : PROGRESS: at 9.65% examples, 288907 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:08:54,805 : INFO : PROGRESS: at 9.66% examples, 288870 words/s, in_qsize 1, out_qsize 2
2017-07-20 20:08:55,822 : INFO : PROGRESS: at 9.67% examples, 288919 words/s, in_qsize 0, out_qsize 0
2017-07-20 20:08:57,115 : INFO : PROGRESS: at 9.67% examples, 288658 words/s, in_q

2017-07-20 20:10:24,122 : INFO : PROGRESS: at 10.29% examples, 289178 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:26,153 : INFO : PROGRESS: at 10.30% examples, 288881 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:27,161 : INFO : PROGRESS: at 10.31% examples, 288975 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:28,173 : INFO : PROGRESS: at 10.32% examples, 289051 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:10:29,180 : INFO : PROGRESS: at 10.33% examples, 289141 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:30,207 : INFO : PROGRESS: at 10.33% examples, 289159 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:32,002 : INFO : PROGRESS: at 10.34% examples, 288945 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:33,013 : INFO : PROGRESS: at 10.35% examples, 289032 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:34,030 : INFO : PROGRESS: at 10.36% examples, 289112 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:10:35,065 : INFO : PROGRESS: at 10.37% examples, 289203 wor

2017-07-20 20:12:02,845 : INFO : PROGRESS: at 11.00% examples, 289433 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:03,854 : INFO : PROGRESS: at 11.01% examples, 289517 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:05,657 : INFO : PROGRESS: at 11.01% examples, 289313 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:06,697 : INFO : PROGRESS: at 11.02% examples, 289398 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:07,712 : INFO : PROGRESS: at 11.03% examples, 289481 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:08,716 : INFO : PROGRESS: at 11.04% examples, 289560 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:10,744 : INFO : PROGRESS: at 11.05% examples, 289308 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:12:11,753 : INFO : PROGRESS: at 11.06% examples, 289393 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:12,786 : INFO : PROGRESS: at 11.07% examples, 289466 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:12:13,809 : INFO : PROGRESS: at 11.08% examples, 289548 wor

2017-07-20 20:13:39,904 : INFO : PROGRESS: at 11.70% examples, 289761 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:42,007 : INFO : PROGRESS: at 11.71% examples, 289569 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:43,013 : INFO : PROGRESS: at 11.71% examples, 289648 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:44,051 : INFO : PROGRESS: at 11.73% examples, 289723 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:45,066 : INFO : PROGRESS: at 11.74% examples, 289801 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:46,095 : INFO : PROGRESS: at 11.74% examples, 289817 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:48,050 : INFO : PROGRESS: at 11.75% examples, 289603 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:49,051 : INFO : PROGRESS: at 11.76% examples, 289684 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:50,057 : INFO : PROGRESS: at 11.77% examples, 289751 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:13:51,068 : INFO : PROGRESS: at 11.78% examples, 289830 wor

2017-07-20 20:15:17,238 : INFO : PROGRESS: at 12.39% examples, 289790 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:18,291 : INFO : PROGRESS: at 12.40% examples, 289863 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:19,296 : INFO : PROGRESS: at 12.41% examples, 289941 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:20,312 : INFO : PROGRESS: at 12.42% examples, 290009 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:22,220 : INFO : PROGRESS: at 12.43% examples, 289827 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:23,234 : INFO : PROGRESS: at 12.44% examples, 289907 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:24,250 : INFO : PROGRESS: at 12.45% examples, 289975 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:25,270 : INFO : PROGRESS: at 12.46% examples, 290047 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:26,290 : INFO : PROGRESS: at 12.47% examples, 290063 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:15:27,309 : INFO : PROGRESS: at 12.48% examples, 290071 wor

2017-07-20 20:16:52,304 : INFO : PROGRESS: at 13.11% examples, 290180 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:16:53,309 : INFO : PROGRESS: at 13.12% examples, 290250 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:16:55,185 : INFO : PROGRESS: at 13.13% examples, 290076 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:16:56,186 : INFO : PROGRESS: at 13.13% examples, 290148 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:16:57,198 : INFO : PROGRESS: at 13.14% examples, 290211 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:16:58,229 : INFO : PROGRESS: at 13.15% examples, 290277 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:16:59,234 : INFO : PROGRESS: at 13.16% examples, 290294 words/s, in_qsize 6, out_qsize 0
2017-07-20 20:17:00,986 : INFO : PROGRESS: at 13.17% examples, 290076 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:17:02,006 : INFO : PROGRESS: at 13.17% examples, 290146 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:17:03,013 : INFO : PROGRESS: at 13.18% examples, 290215 wor

2017-07-20 20:18:29,117 : INFO : PROGRESS: at 13.81% examples, 290416 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:30,140 : INFO : PROGRESS: at 13.82% examples, 290476 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:31,906 : INFO : PROGRESS: at 13.82% examples, 290307 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:32,908 : INFO : PROGRESS: at 13.83% examples, 290374 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:33,917 : INFO : PROGRESS: at 13.84% examples, 290433 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:34,980 : INFO : PROGRESS: at 13.85% examples, 290497 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:36,036 : INFO : PROGRESS: at 13.86% examples, 290468 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:37,122 : INFO : PROGRESS: at 13.86% examples, 290396 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:38,129 : INFO : PROGRESS: at 13.87% examples, 290463 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:18:39,138 : INFO : PROGRESS: at 13.88% examples, 290485 wor

2017-07-20 20:20:03,924 : INFO : PROGRESS: at 14.49% examples, 290601 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:04,927 : INFO : PROGRESS: at 14.50% examples, 290661 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:07,022 : INFO : PROGRESS: at 14.51% examples, 290467 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:08,023 : INFO : PROGRESS: at 14.52% examples, 290532 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:09,029 : INFO : PROGRESS: at 14.53% examples, 290585 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:20:10,035 : INFO : PROGRESS: at 14.54% examples, 290649 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:11,038 : INFO : PROGRESS: at 14.54% examples, 290660 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:20:13,036 : INFO : PROGRESS: at 14.55% examples, 290446 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:14,051 : INFO : PROGRESS: at 14.56% examples, 290512 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:20:15,060 : INFO : PROGRESS: at 14.57% examples, 290567 wor

2017-07-20 20:21:42,289 : INFO : PROGRESS: at 15.19% examples, 290719 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:43,305 : INFO : PROGRESS: at 15.20% examples, 290773 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:45,326 : INFO : PROGRESS: at 15.21% examples, 290622 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:46,341 : INFO : PROGRESS: at 15.22% examples, 290685 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:47,365 : INFO : PROGRESS: at 15.23% examples, 290744 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:48,379 : INFO : PROGRESS: at 15.24% examples, 290799 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:50,629 : INFO : PROGRESS: at 15.25% examples, 290621 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:51,662 : INFO : PROGRESS: at 15.26% examples, 290683 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:52,678 : INFO : PROGRESS: at 15.27% examples, 290738 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:21:53,695 : INFO : PROGRESS: at 15.28% examples, 290800 wor

2017-07-20 20:23:18,249 : INFO : PROGRESS: at 15.89% examples, 290757 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:19,280 : INFO : PROGRESS: at 15.90% examples, 290817 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:20,290 : INFO : PROGRESS: at 15.91% examples, 290873 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:21,307 : INFO : PROGRESS: at 15.92% examples, 290930 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:23,322 : INFO : PROGRESS: at 15.93% examples, 290790 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:23:24,334 : INFO : PROGRESS: at 15.94% examples, 290848 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:25,355 : INFO : PROGRESS: at 15.95% examples, 290905 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:26,382 : INFO : PROGRESS: at 15.96% examples, 290960 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:27,396 : INFO : PROGRESS: at 15.97% examples, 290973 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:23:28,449 : INFO : PROGRESS: at 15.97% examples, 290949 wor

2017-07-20 20:24:56,040 : INFO : PROGRESS: at 16.60% examples, 290944 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:24:57,043 : INFO : PROGRESS: at 16.61% examples, 291001 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:24:58,050 : INFO : PROGRESS: at 16.62% examples, 291053 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:24:59,077 : INFO : PROGRESS: at 16.63% examples, 291103 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:25:00,098 : INFO : PROGRESS: at 16.64% examples, 291119 words/s, in_qsize 4, out_qsize 0
2017-07-20 20:25:01,692 : INFO : PROGRESS: at 16.64% examples, 290957 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:25:02,718 : INFO : PROGRESS: at 16.65% examples, 291013 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:25:03,727 : INFO : PROGRESS: at 16.66% examples, 291064 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:25:04,735 : INFO : PROGRESS: at 16.67% examples, 291120 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:25:05,805 : INFO : PROGRESS: at 16.68% examples, 291117 wor

2017-07-20 20:26:33,616 : INFO : PROGRESS: at 17.31% examples, 291243 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:34,643 : INFO : PROGRESS: at 17.32% examples, 291261 words/s, in_qsize 0, out_qsize 0
2017-07-20 20:26:36,176 : INFO : PROGRESS: at 17.32% examples, 291088 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:37,223 : INFO : PROGRESS: at 17.33% examples, 291140 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:38,265 : INFO : PROGRESS: at 17.34% examples, 291194 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:39,271 : INFO : PROGRESS: at 17.35% examples, 291247 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:41,079 : INFO : PROGRESS: at 17.36% examples, 291099 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:42,117 : INFO : PROGRESS: at 17.37% examples, 291153 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:43,122 : INFO : PROGRESS: at 17.38% examples, 291203 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:26:44,124 : INFO : PROGRESS: at 17.39% examples, 291258 wor

2017-07-20 20:28:08,524 : INFO : PROGRESS: at 18.00% examples, 291372 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:09,550 : INFO : PROGRESS: at 18.01% examples, 291339 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:11,302 : INFO : PROGRESS: at 18.01% examples, 291210 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:12,344 : INFO : PROGRESS: at 18.02% examples, 291261 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:13,389 : INFO : PROGRESS: at 18.03% examples, 291312 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:14,415 : INFO : PROGRESS: at 18.04% examples, 291357 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:16,571 : INFO : PROGRESS: at 18.05% examples, 291199 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:17,605 : INFO : PROGRESS: at 18.06% examples, 291251 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:18,610 : INFO : PROGRESS: at 18.07% examples, 291297 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:28:19,624 : INFO : PROGRESS: at 18.08% examples, 291348 wor

2017-07-20 20:29:44,170 : INFO : PROGRESS: at 18.69% examples, 291354 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:46,516 : INFO : PROGRESS: at 18.70% examples, 291205 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:47,539 : INFO : PROGRESS: at 18.71% examples, 291242 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:48,582 : INFO : PROGRESS: at 18.72% examples, 291250 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:29:49,630 : INFO : PROGRESS: at 18.73% examples, 291291 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:51,679 : INFO : PROGRESS: at 18.73% examples, 291167 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:52,689 : INFO : PROGRESS: at 18.74% examples, 291209 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:53,692 : INFO : PROGRESS: at 18.75% examples, 291251 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:54,693 : INFO : PROGRESS: at 18.76% examples, 291294 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:29:56,577 : INFO : PROGRESS: at 18.77% examples, 291173 wor

2017-07-20 20:31:20,461 : INFO : PROGRESS: at 19.36% examples, 290918 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:31:21,523 : INFO : PROGRESS: at 19.36% examples, 290898 words/s, in_qsize 1, out_qsize 2
2017-07-20 20:31:22,527 : INFO : PROGRESS: at 19.37% examples, 290902 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:31:23,570 : INFO : PROGRESS: at 19.38% examples, 290897 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:31:25,023 : INFO : PROGRESS: at 19.38% examples, 290827 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:31:26,068 : INFO : PROGRESS: at 19.39% examples, 290864 words/s, in_qsize 6, out_qsize 1
2017-07-20 20:31:27,117 : INFO : PROGRESS: at 19.40% examples, 290904 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:31:28,158 : INFO : PROGRESS: at 19.41% examples, 290911 words/s, in_qsize 3, out_qsize 0
2017-07-20 20:31:29,833 : INFO : PROGRESS: at 19.41% examples, 290760 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:31:30,836 : INFO : PROGRESS: at 19.42% examples, 290801 wor

2017-07-20 20:32:59,106 : INFO : PROGRESS: at 20.04% examples, 290592 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:00,928 : INFO : PROGRESS: at 20.05% examples, 290473 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:01,958 : INFO : PROGRESS: at 20.05% examples, 290512 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:02,958 : INFO : PROGRESS: at 20.06% examples, 290541 words/s, in_qsize 5, out_qsize 2
2017-07-20 20:33:03,979 : INFO : PROGRESS: at 20.07% examples, 290576 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:04,993 : INFO : PROGRESS: at 20.08% examples, 290577 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:05,997 : INFO : PROGRESS: at 20.09% examples, 290577 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:07,399 : INFO : PROGRESS: at 20.09% examples, 290487 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:08,400 : INFO : PROGRESS: at 20.10% examples, 290527 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:33:09,418 : INFO : PROGRESS: at 20.11% examples, 290559 wor

2017-07-20 20:34:38,600 : INFO : PROGRESS: at 20.72% examples, 290266 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:39,728 : INFO : PROGRESS: at 20.73% examples, 290255 words/s, in_qsize 5, out_qsize 1
2017-07-20 20:34:40,735 : INFO : PROGRESS: at 20.74% examples, 290267 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:41,776 : INFO : PROGRESS: at 20.75% examples, 290277 words/s, in_qsize 2, out_qsize 0
2017-07-20 20:34:43,336 : INFO : PROGRESS: at 20.75% examples, 290145 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:44,363 : INFO : PROGRESS: at 20.76% examples, 290187 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:45,370 : INFO : PROGRESS: at 20.77% examples, 290229 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:46,421 : INFO : PROGRESS: at 20.78% examples, 290272 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:48,445 : INFO : PROGRESS: at 20.79% examples, 290137 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:34:49,448 : INFO : PROGRESS: at 20.80% examples, 290182 wor

2017-07-20 20:36:14,894 : INFO : PROGRESS: at 21.41% examples, 290324 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:36:15,944 : INFO : PROGRESS: at 21.42% examples, 290307 words/s, in_qsize 2, out_qsize 2
2017-07-20 20:36:16,960 : INFO : PROGRESS: at 21.43% examples, 290319 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:36:17,978 : INFO : PROGRESS: at 21.44% examples, 290331 words/s, in_qsize 4, out_qsize 0
2017-07-20 20:36:19,394 : INFO : PROGRESS: at 21.44% examples, 290223 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:36:20,434 : INFO : PROGRESS: at 21.45% examples, 290267 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:36:21,480 : INFO : PROGRESS: at 21.46% examples, 290310 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:36:22,505 : INFO : PROGRESS: at 21.47% examples, 290354 words/s, in_qsize 5, out_qsize 0
2017-07-20 20:36:24,239 : INFO : PROGRESS: at 21.47% examples, 290219 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:36:25,255 : INFO : PROGRESS: at 21.48% examples, 290263 wor

2017-07-20 20:37:51,234 : INFO : PROGRESS: at 22.11% examples, 290334 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:37:52,281 : INFO : PROGRESS: at 22.12% examples, 290376 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:37:53,310 : INFO : PROGRESS: at 22.13% examples, 290414 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:37:54,362 : INFO : PROGRESS: at 22.14% examples, 290452 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:37:55,406 : INFO : PROGRESS: at 22.15% examples, 290458 words/s, in_qsize 5, out_qsize 0
2017-07-20 20:37:56,414 : INFO : PROGRESS: at 22.15% examples, 290445 words/s, in_qsize 4, out_qsize 0
2017-07-20 20:37:57,996 : INFO : PROGRESS: at 22.16% examples, 290325 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:37:59,017 : INFO : PROGRESS: at 22.17% examples, 290369 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:38:00,041 : INFO : PROGRESS: at 22.18% examples, 290406 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:38:01,081 : INFO : PROGRESS: at 22.19% examples, 290447 wor

2017-07-20 20:39:26,935 : INFO : PROGRESS: at 22.80% examples, 290464 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:27,937 : INFO : PROGRESS: at 22.81% examples, 290488 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:28,956 : INFO : PROGRESS: at 22.82% examples, 290522 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:29,968 : INFO : PROGRESS: at 22.83% examples, 290532 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:30,996 : INFO : PROGRESS: at 22.84% examples, 290545 words/s, in_qsize 5, out_qsize 0
2017-07-20 20:39:32,697 : INFO : PROGRESS: at 22.84% examples, 290420 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:39:33,699 : INFO : PROGRESS: at 22.85% examples, 290461 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:34,726 : INFO : PROGRESS: at 22.86% examples, 290493 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:35,734 : INFO : PROGRESS: at 22.87% examples, 290529 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:39:36,743 : INFO : PROGRESS: at 22.88% examples, 290537 wor

2017-07-20 20:40:58,888 : INFO : PROGRESS: at 23.49% examples, 290609 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:40:59,895 : INFO : PROGRESS: at 23.49% examples, 290589 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:00,924 : INFO : PROGRESS: at 23.50% examples, 290598 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:02,505 : INFO : PROGRESS: at 23.50% examples, 290500 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:03,505 : INFO : PROGRESS: at 23.51% examples, 290539 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:04,519 : INFO : PROGRESS: at 23.52% examples, 290574 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:05,534 : INFO : PROGRESS: at 23.54% examples, 290614 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:07,479 : INFO : PROGRESS: at 23.54% examples, 290501 words/s, in_qsize 6, out_qsize 1
2017-07-20 20:41:08,522 : INFO : PROGRESS: at 23.55% examples, 290542 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:41:09,554 : INFO : PROGRESS: at 23.56% examples, 290571 wor

2017-07-20 20:42:37,794 : INFO : PROGRESS: at 24.19% examples, 290639 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:38,803 : INFO : PROGRESS: at 24.20% examples, 290674 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:39,818 : INFO : PROGRESS: at 24.21% examples, 290711 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:41,805 : INFO : PROGRESS: at 24.21% examples, 290584 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:42,840 : INFO : PROGRESS: at 24.22% examples, 290623 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:43,856 : INFO : PROGRESS: at 24.23% examples, 290658 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:44,857 : INFO : PROGRESS: at 24.24% examples, 290696 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:45,872 : INFO : PROGRESS: at 24.25% examples, 290702 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:42:46,900 : INFO : PROGRESS: at 24.26% examples, 290711 words/s, in_qsize 0, out_qsize 0
2017-07-20 20:42:48,229 : INFO : PROGRESS: at 24.26% examples, 290608 wor

2017-07-20 20:44:14,141 : INFO : PROGRESS: at 24.88% examples, 290738 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:15,143 : INFO : PROGRESS: at 24.89% examples, 290770 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:44:17,494 : INFO : PROGRESS: at 24.90% examples, 290664 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:18,527 : INFO : PROGRESS: at 24.91% examples, 290702 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:19,540 : INFO : PROGRESS: at 24.92% examples, 290736 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:20,566 : INFO : PROGRESS: at 24.93% examples, 290774 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:22,711 : INFO : PROGRESS: at 24.94% examples, 290685 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:23,714 : INFO : PROGRESS: at 24.95% examples, 290723 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:24,733 : INFO : PROGRESS: at 24.96% examples, 290757 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:44:25,742 : INFO : PROGRESS: at 24.97% examples, 290791 wor

2017-07-20 20:45:52,378 : INFO : PROGRESS: at 25.59% examples, 290792 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:45:53,389 : INFO : PROGRESS: at 25.60% examples, 290828 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:45:54,395 : INFO : PROGRESS: at 25.61% examples, 290863 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:45:55,439 : INFO : PROGRESS: at 25.61% examples, 290858 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:45:56,488 : INFO : PROGRESS: at 25.62% examples, 290869 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:45:58,228 : INFO : PROGRESS: at 25.63% examples, 290771 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:45:59,266 : INFO : PROGRESS: at 25.64% examples, 290808 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:46:00,278 : INFO : PROGRESS: at 25.65% examples, 290844 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:46:01,282 : INFO : PROGRESS: at 25.66% examples, 290878 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:46:02,351 : INFO : PROGRESS: at 25.66% examples, 290862 wor

2017-07-20 20:47:27,429 : INFO : PROGRESS: at 26.28% examples, 290924 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:28,473 : INFO : PROGRESS: at 26.29% examples, 290956 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:29,494 : INFO : PROGRESS: at 26.30% examples, 290963 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:30,504 : INFO : PROGRESS: at 26.31% examples, 290973 words/s, in_qsize 0, out_qsize 0
2017-07-20 20:47:32,052 : INFO : PROGRESS: at 26.31% examples, 290858 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:33,079 : INFO : PROGRESS: at 26.32% examples, 290894 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:34,095 : INFO : PROGRESS: at 26.33% examples, 290926 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:35,125 : INFO : PROGRESS: at 26.34% examples, 290960 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:47:36,129 : INFO : PROGRESS: at 26.35% examples, 290971 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:47:37,867 : INFO : PROGRESS: at 26.35% examples, 290868 wor

2017-07-20 20:49:03,720 : INFO : PROGRESS: at 26.97% examples, 290980 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:04,755 : INFO : PROGRESS: at 26.98% examples, 291013 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:05,770 : INFO : PROGRESS: at 26.99% examples, 291049 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:06,774 : INFO : PROGRESS: at 27.00% examples, 291049 words/s, in_qsize 4, out_qsize 0
2017-07-20 20:49:08,298 : INFO : PROGRESS: at 27.00% examples, 290954 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:09,330 : INFO : PROGRESS: at 27.01% examples, 290981 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:10,335 : INFO : PROGRESS: at 27.02% examples, 291010 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:11,357 : INFO : PROGRESS: at 27.03% examples, 291044 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:13,355 : INFO : PROGRESS: at 27.04% examples, 290983 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:49:14,421 : INFO : PROGRESS: at 27.05% examples, 291016 wor

2017-07-20 20:50:40,888 : INFO : PROGRESS: at 27.68% examples, 291102 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:50:41,894 : INFO : PROGRESS: at 27.69% examples, 291135 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:50:42,911 : INFO : PROGRESS: at 27.70% examples, 291142 words/s, in_qsize 6, out_qsize 0
2017-07-20 20:50:44,653 : INFO : PROGRESS: at 27.70% examples, 291039 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:50:45,688 : INFO : PROGRESS: at 27.71% examples, 291073 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:50:46,741 : INFO : PROGRESS: at 27.72% examples, 291104 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:50:47,805 : INFO : PROGRESS: at 27.73% examples, 291136 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:50:49,046 : INFO : PROGRESS: at 27.74% examples, 291086 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:50:50,103 : INFO : PROGRESS: at 27.75% examples, 291118 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:50:51,306 : INFO : PROGRESS: at 27.76% examples, 291135 wor

2017-07-20 20:52:15,832 : INFO : PROGRESS: at 28.36% examples, 291169 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:16,840 : INFO : PROGRESS: at 28.37% examples, 291199 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:19,492 : INFO : PROGRESS: at 28.38% examples, 291098 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:20,522 : INFO : PROGRESS: at 28.39% examples, 291130 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:21,542 : INFO : PROGRESS: at 28.40% examples, 291163 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:22,558 : INFO : PROGRESS: at 28.41% examples, 291194 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:23,611 : INFO : PROGRESS: at 28.42% examples, 291213 words/s, in_qsize 5, out_qsize 2
2017-07-20 20:52:24,613 : INFO : PROGRESS: at 28.43% examples, 291223 words/s, in_qsize 1, out_qsize 0
2017-07-20 20:52:26,207 : INFO : PROGRESS: at 28.43% examples, 291121 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:52:27,231 : INFO : PROGRESS: at 28.44% examples, 291154 wor

2017-07-20 20:53:55,622 : INFO : PROGRESS: at 29.08% examples, 291155 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:53:56,646 : INFO : PROGRESS: at 29.08% examples, 291156 words/s, in_qsize 5, out_qsize 2
2017-07-20 20:53:58,650 : INFO : PROGRESS: at 29.09% examples, 291074 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:53:59,698 : INFO : PROGRESS: at 29.10% examples, 291106 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:54:00,699 : INFO : PROGRESS: at 29.11% examples, 291138 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:54:01,739 : INFO : PROGRESS: at 29.12% examples, 291166 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:54:02,782 : INFO : PROGRESS: at 29.13% examples, 291168 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:54:03,785 : INFO : PROGRESS: at 29.14% examples, 291170 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:54:04,818 : INFO : PROGRESS: at 29.15% examples, 291172 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:54:06,548 : INFO : PROGRESS: at 29.15% examples, 291079 wor

2017-07-20 20:55:32,292 : INFO : PROGRESS: at 29.78% examples, 291099 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:33,309 : INFO : PROGRESS: at 29.79% examples, 291130 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:34,326 : INFO : PROGRESS: at 29.80% examples, 291158 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:36,392 : INFO : PROGRESS: at 29.80% examples, 291063 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:37,397 : INFO : PROGRESS: at 29.81% examples, 291094 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:38,442 : INFO : PROGRESS: at 29.82% examples, 291122 words/s, in_qsize 8, out_qsize 1
2017-07-20 20:55:39,463 : INFO : PROGRESS: at 29.83% examples, 291145 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:41,476 : INFO : PROGRESS: at 29.84% examples, 291059 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:42,507 : INFO : PROGRESS: at 29.85% examples, 291088 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:55:43,508 : INFO : PROGRESS: at 29.86% examples, 291117 wor

2017-07-20 20:57:08,712 : INFO : PROGRESS: at 30.47% examples, 291175 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:10,366 : INFO : PROGRESS: at 30.48% examples, 291100 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:11,370 : INFO : PROGRESS: at 30.49% examples, 291130 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:12,398 : INFO : PROGRESS: at 30.50% examples, 291157 words/s, in_qsize 8, out_qsize 0
2017-07-20 20:57:13,407 : INFO : PROGRESS: at 30.51% examples, 291183 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:15,321 : INFO : PROGRESS: at 30.51% examples, 291091 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:16,382 : INFO : PROGRESS: at 30.52% examples, 291120 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:17,426 : INFO : PROGRESS: at 30.53% examples, 291150 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:18,433 : INFO : PROGRESS: at 30.54% examples, 291181 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:57:20,461 : INFO : PROGRESS: at 30.55% examples, 291079 wor

2017-07-20 20:58:48,491 : INFO : PROGRESS: at 31.19% examples, 291243 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:50,409 : INFO : PROGRESS: at 31.19% examples, 291157 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:51,417 : INFO : PROGRESS: at 31.20% examples, 291187 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:52,420 : INFO : PROGRESS: at 31.21% examples, 291215 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:53,450 : INFO : PROGRESS: at 31.22% examples, 291241 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:55,037 : INFO : PROGRESS: at 31.23% examples, 291166 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:56,058 : INFO : PROGRESS: at 31.24% examples, 291197 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:57,081 : INFO : PROGRESS: at 31.25% examples, 291224 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:58,095 : INFO : PROGRESS: at 31.26% examples, 291253 words/s, in_qsize 7, out_qsize 0
2017-07-20 20:58:59,108 : INFO : PROGRESS: at 31.27% examples, 291256 wor

2017-07-20 21:00:28,277 : INFO : PROGRESS: at 31.89% examples, 291199 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:29,279 : INFO : PROGRESS: at 31.90% examples, 291229 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:00:30,292 : INFO : PROGRESS: at 31.91% examples, 291255 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:31,309 : INFO : PROGRESS: at 31.92% examples, 291282 words/s, in_qsize 7, out_qsize 1
2017-07-20 21:00:33,418 : INFO : PROGRESS: at 31.93% examples, 291188 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:34,460 : INFO : PROGRESS: at 31.94% examples, 291217 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:35,479 : INFO : PROGRESS: at 31.95% examples, 291246 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:36,487 : INFO : PROGRESS: at 31.96% examples, 291273 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:37,508 : INFO : PROGRESS: at 31.97% examples, 291272 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:00:39,444 : INFO : PROGRESS: at 31.97% examples, 291206 wor

2017-07-20 21:02:04,620 : INFO : PROGRESS: at 32.60% examples, 291345 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:06,717 : INFO : PROGRESS: at 32.61% examples, 291252 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:07,761 : INFO : PROGRESS: at 32.62% examples, 291280 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:08,769 : INFO : PROGRESS: at 32.63% examples, 291309 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:09,773 : INFO : PROGRESS: at 32.64% examples, 291337 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:10,820 : INFO : PROGRESS: at 32.65% examples, 291341 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:11,906 : INFO : PROGRESS: at 32.66% examples, 291336 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:02:12,931 : INFO : PROGRESS: at 32.66% examples, 291334 words/s, in_qsize 8, out_qsize 3
2017-07-20 21:02:13,945 : INFO : PROGRESS: at 32.67% examples, 291345 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:02:15,100 : INFO : PROGRESS: at 32.68% examples, 291339 wor

2017-07-20 21:03:42,657 : INFO : PROGRESS: at 33.32% examples, 291320 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:03:43,687 : INFO : PROGRESS: at 33.33% examples, 291345 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:03:44,695 : INFO : PROGRESS: at 33.34% examples, 291372 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:03:45,867 : INFO : PROGRESS: at 33.35% examples, 291360 words/s, in_qsize 7, out_qsize 1
2017-07-20 21:03:46,884 : INFO : PROGRESS: at 33.36% examples, 291369 words/s, in_qsize 5, out_qsize 0
2017-07-20 21:03:48,388 : INFO : PROGRESS: at 33.36% examples, 291296 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:03:49,446 : INFO : PROGRESS: at 33.37% examples, 291323 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:03:50,452 : INFO : PROGRESS: at 33.38% examples, 291350 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:03:51,472 : INFO : PROGRESS: at 33.39% examples, 291375 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:03:53,483 : INFO : PROGRESS: at 33.40% examples, 291292 wor

2017-07-20 21:05:20,174 : INFO : PROGRESS: at 34.02% examples, 291391 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:05:21,189 : INFO : PROGRESS: at 34.03% examples, 291418 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:05:22,190 : INFO : PROGRESS: at 34.04% examples, 291425 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:05:23,198 : INFO : PROGRESS: at 34.05% examples, 291432 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:05:24,958 : INFO : PROGRESS: at 34.05% examples, 291351 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:05:25,979 : INFO : PROGRESS: at 34.06% examples, 291378 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:05:26,997 : INFO : PROGRESS: at 34.07% examples, 291404 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:05:28,049 : INFO : PROGRESS: at 34.08% examples, 291430 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:05:29,885 : INFO : PROGRESS: at 34.09% examples, 291361 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:05:30,892 : INFO : PROGRESS: at 34.10% examples, 291390 wor

2017-07-20 21:06:56,083 : INFO : PROGRESS: at 34.71% examples, 291427 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:06:57,086 : INFO : PROGRESS: at 34.72% examples, 291452 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:06:58,092 : INFO : PROGRESS: at 34.73% examples, 291477 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:07:00,018 : INFO : PROGRESS: at 34.74% examples, 291418 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:07:01,073 : INFO : PROGRESS: at 34.75% examples, 291444 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:07:02,075 : INFO : PROGRESS: at 34.76% examples, 291471 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:07:03,095 : INFO : PROGRESS: at 34.77% examples, 291493 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:07:04,103 : INFO : PROGRESS: at 34.77% examples, 291480 words/s, in_qsize 6, out_qsize 1
2017-07-20 21:07:05,702 : INFO : PROGRESS: at 34.78% examples, 291412 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:07:06,713 : INFO : PROGRESS: at 34.79% examples, 291438 wor

2017-07-20 21:08:33,435 : INFO : PROGRESS: at 35.41% examples, 291477 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:34,474 : INFO : PROGRESS: at 35.42% examples, 291503 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:35,478 : INFO : PROGRESS: at 35.43% examples, 291529 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:36,479 : INFO : PROGRESS: at 35.44% examples, 291533 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:08:38,076 : INFO : PROGRESS: at 35.44% examples, 291449 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:39,130 : INFO : PROGRESS: at 35.45% examples, 291474 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:40,169 : INFO : PROGRESS: at 35.47% examples, 291500 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:41,225 : INFO : PROGRESS: at 35.48% examples, 291526 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:42,667 : INFO : PROGRESS: at 35.48% examples, 291483 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:08:43,726 : INFO : PROGRESS: at 35.49% examples, 291508 wor

2017-07-20 21:10:10,406 : INFO : PROGRESS: at 36.12% examples, 291571 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:11,427 : INFO : PROGRESS: at 36.13% examples, 291593 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:13,521 : INFO : PROGRESS: at 36.14% examples, 291513 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:14,538 : INFO : PROGRESS: at 36.15% examples, 291538 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:15,565 : INFO : PROGRESS: at 36.16% examples, 291557 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:16,574 : INFO : PROGRESS: at 36.17% examples, 291582 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:17,578 : INFO : PROGRESS: at 36.18% examples, 291585 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:19,721 : INFO : PROGRESS: at 36.19% examples, 291524 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:20,742 : INFO : PROGRESS: at 36.20% examples, 291551 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:10:21,766 : INFO : PROGRESS: at 36.21% examples, 291576 wor

2017-07-20 21:11:48,187 : INFO : PROGRESS: at 36.83% examples, 291598 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:49,188 : INFO : PROGRESS: at 36.84% examples, 291622 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:50,227 : INFO : PROGRESS: at 36.85% examples, 291645 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:52,744 : INFO : PROGRESS: at 36.86% examples, 291575 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:53,786 : INFO : PROGRESS: at 36.87% examples, 291600 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:54,794 : INFO : PROGRESS: at 36.88% examples, 291624 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:55,813 : INFO : PROGRESS: at 36.89% examples, 291649 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:57,730 : INFO : PROGRESS: at 36.89% examples, 291587 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:58,762 : INFO : PROGRESS: at 36.90% examples, 291613 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:11:59,772 : INFO : PROGRESS: at 36.91% examples, 291636 wor

2017-07-20 21:13:27,541 : INFO : PROGRESS: at 37.51% examples, 291357 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:28,594 : INFO : PROGRESS: at 37.52% examples, 291375 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:30,853 : INFO : PROGRESS: at 37.52% examples, 291302 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:31,879 : INFO : PROGRESS: at 37.53% examples, 291322 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:32,904 : INFO : PROGRESS: at 37.54% examples, 291341 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:33,932 : INFO : PROGRESS: at 37.55% examples, 291363 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:34,944 : INFO : PROGRESS: at 37.56% examples, 291361 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:36,813 : INFO : PROGRESS: at 37.56% examples, 291292 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:37,818 : INFO : PROGRESS: at 37.57% examples, 291309 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:13:38,843 : INFO : PROGRESS: at 37.58% examples, 291329 wor

2017-07-20 21:15:07,292 : INFO : PROGRESS: at 38.18% examples, 291017 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:08,297 : INFO : PROGRESS: at 38.19% examples, 291036 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:09,314 : INFO : PROGRESS: at 38.20% examples, 291051 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:11,613 : INFO : PROGRESS: at 38.20% examples, 290973 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:12,616 : INFO : PROGRESS: at 38.21% examples, 290993 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:13,637 : INFO : PROGRESS: at 38.22% examples, 291011 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:14,655 : INFO : PROGRESS: at 38.23% examples, 291027 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:15,682 : INFO : PROGRESS: at 38.24% examples, 291027 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:17,752 : INFO : PROGRESS: at 38.25% examples, 290965 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:15:18,753 : INFO : PROGRESS: at 38.26% examples, 290986 wor

2017-07-20 21:16:46,219 : INFO : PROGRESS: at 38.86% examples, 290746 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:47,269 : INFO : PROGRESS: at 38.87% examples, 290760 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:48,342 : INFO : PROGRESS: at 38.88% examples, 290766 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:49,386 : INFO : PROGRESS: at 38.88% examples, 290778 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:50,388 : INFO : PROGRESS: at 38.89% examples, 290775 words/s, in_qsize 6, out_qsize 1
2017-07-20 21:16:51,437 : INFO : PROGRESS: at 38.90% examples, 290782 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:53,308 : INFO : PROGRESS: at 38.90% examples, 290705 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:54,311 : INFO : PROGRESS: at 38.91% examples, 290727 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:55,332 : INFO : PROGRESS: at 38.92% examples, 290741 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:16:56,338 : INFO : PROGRESS: at 38.93% examples, 290758 wor

2017-07-20 21:18:21,571 : INFO : PROGRESS: at 39.52% examples, 290583 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:22,580 : INFO : PROGRESS: at 39.53% examples, 290607 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:23,585 : INFO : PROGRESS: at 39.54% examples, 290627 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:24,587 : INFO : PROGRESS: at 39.55% examples, 290649 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:26,740 : INFO : PROGRESS: at 39.56% examples, 290574 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:27,742 : INFO : PROGRESS: at 39.57% examples, 290592 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:18:28,744 : INFO : PROGRESS: at 39.58% examples, 290614 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:29,746 : INFO : PROGRESS: at 39.58% examples, 290635 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:30,757 : INFO : PROGRESS: at 39.59% examples, 290639 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:18:32,387 : INFO : PROGRESS: at 39.60% examples, 290580 wor

2017-07-20 21:19:56,571 : INFO : PROGRESS: at 40.21% examples, 290649 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:19:57,702 : INFO : PROGRESS: at 40.22% examples, 290645 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:19:58,736 : INFO : PROGRESS: at 40.23% examples, 290659 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:20:00,107 : INFO : PROGRESS: at 40.23% examples, 290591 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:20:01,162 : INFO : PROGRESS: at 40.24% examples, 290613 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:20:02,164 : INFO : PROGRESS: at 40.26% examples, 290637 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:20:03,197 : INFO : PROGRESS: at 40.26% examples, 290658 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:20:04,204 : INFO : PROGRESS: at 40.27% examples, 290663 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:20:05,879 : INFO : PROGRESS: at 40.28% examples, 290597 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:20:06,939 : INFO : PROGRESS: at 40.29% examples, 290619 wor

2017-07-20 21:21:32,812 : INFO : PROGRESS: at 40.90% examples, 290689 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:33,818 : INFO : PROGRESS: at 40.91% examples, 290694 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:35,823 : INFO : PROGRESS: at 40.92% examples, 290625 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:36,847 : INFO : PROGRESS: at 40.93% examples, 290648 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:37,868 : INFO : PROGRESS: at 40.94% examples, 290668 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:38,882 : INFO : PROGRESS: at 40.95% examples, 290692 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:40,763 : INFO : PROGRESS: at 40.95% examples, 290638 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:41,771 : INFO : PROGRESS: at 40.96% examples, 290661 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:42,782 : INFO : PROGRESS: at 40.97% examples, 290681 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:21:43,783 : INFO : PROGRESS: at 40.98% examples, 290701 wor

2017-07-20 21:23:10,708 : INFO : PROGRESS: at 41.59% examples, 290662 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:11,754 : INFO : PROGRESS: at 41.60% examples, 290679 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:12,760 : INFO : PROGRESS: at 41.61% examples, 290699 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:14,906 : INFO : PROGRESS: at 41.62% examples, 290647 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:15,912 : INFO : PROGRESS: at 41.63% examples, 290670 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:16,934 : INFO : PROGRESS: at 41.64% examples, 290690 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:17,949 : INFO : PROGRESS: at 41.65% examples, 290708 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:23:18,993 : INFO : PROGRESS: at 41.66% examples, 290713 words/s, in_qsize 6, out_qsize 0
2017-07-20 21:23:20,025 : INFO : PROGRESS: at 41.67% examples, 290705 words/s, in_qsize 6, out_qsize 1
2017-07-20 21:23:22,323 : INFO : PROGRESS: at 41.67% examples, 290647 wor

2017-07-20 21:24:47,745 : INFO : PROGRESS: at 42.29% examples, 290678 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:24:48,748 : INFO : PROGRESS: at 42.30% examples, 290697 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:24:49,792 : INFO : PROGRESS: at 42.31% examples, 290717 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:24:50,805 : INFO : PROGRESS: at 42.32% examples, 290722 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:24:52,008 : INFO : PROGRESS: at 42.33% examples, 290719 words/s, in_qsize 3, out_qsize 2
2017-07-20 21:24:53,039 : INFO : PROGRESS: at 42.34% examples, 290730 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:24:54,533 : INFO : PROGRESS: at 42.34% examples, 290662 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:24:55,594 : INFO : PROGRESS: at 42.35% examples, 290683 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:24:56,674 : INFO : PROGRESS: at 42.36% examples, 290703 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:24:57,706 : INFO : PROGRESS: at 42.37% examples, 290725 wor

2017-07-20 21:26:23,706 : INFO : PROGRESS: at 42.99% examples, 290750 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:26:24,727 : INFO : PROGRESS: at 43.00% examples, 290755 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:26:26,252 : INFO : PROGRESS: at 43.00% examples, 290686 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:26:27,308 : INFO : PROGRESS: at 43.02% examples, 290707 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:26:28,313 : INFO : PROGRESS: at 43.03% examples, 290729 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:26:29,335 : INFO : PROGRESS: at 43.04% examples, 290746 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:26:30,350 : INFO : PROGRESS: at 43.04% examples, 290751 words/s, in_qsize 1, out_qsize 0
2017-07-20 21:26:31,697 : INFO : PROGRESS: at 43.05% examples, 290696 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:26:32,735 : INFO : PROGRESS: at 43.06% examples, 290717 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:26:33,741 : INFO : PROGRESS: at 43.07% examples, 290735 wor

2017-07-20 21:27:57,353 : INFO : PROGRESS: at 43.68% examples, 290774 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:27:58,582 : INFO : PROGRESS: at 43.69% examples, 290761 words/s, in_qsize 7, out_qsize 1
2017-07-20 21:28:00,604 : INFO : PROGRESS: at 43.70% examples, 290716 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:01,614 : INFO : PROGRESS: at 43.71% examples, 290737 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:02,615 : INFO : PROGRESS: at 43.72% examples, 290756 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:03,624 : INFO : PROGRESS: at 43.73% examples, 290776 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:05,570 : INFO : PROGRESS: at 43.73% examples, 290715 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:06,573 : INFO : PROGRESS: at 43.74% examples, 290735 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:07,592 : INFO : PROGRESS: at 43.75% examples, 290754 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:28:08,597 : INFO : PROGRESS: at 43.76% examples, 290774 wor

2017-07-20 21:29:35,401 : INFO : PROGRESS: at 44.38% examples, 290777 words/s, in_qsize 6, out_qsize 1
2017-07-20 21:29:36,406 : INFO : PROGRESS: at 44.39% examples, 290797 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:37,439 : INFO : PROGRESS: at 44.40% examples, 290801 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:39,355 : INFO : PROGRESS: at 44.40% examples, 290735 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:40,399 : INFO : PROGRESS: at 44.41% examples, 290755 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:41,410 : INFO : PROGRESS: at 44.42% examples, 290776 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:42,411 : INFO : PROGRESS: at 44.43% examples, 290796 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:44,797 : INFO : PROGRESS: at 44.44% examples, 290734 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:45,808 : INFO : PROGRESS: at 44.45% examples, 290755 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:29:46,834 : INFO : PROGRESS: at 44.46% examples, 290774 wor

2017-07-20 21:31:17,016 : INFO : PROGRESS: at 45.09% examples, 290777 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:18,022 : INFO : PROGRESS: at 45.10% examples, 290796 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:19,043 : INFO : PROGRESS: at 45.11% examples, 290813 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:21,213 : INFO : PROGRESS: at 45.12% examples, 290769 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:22,222 : INFO : PROGRESS: at 45.13% examples, 290790 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:23,243 : INFO : PROGRESS: at 45.14% examples, 290808 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:24,258 : INFO : PROGRESS: at 45.15% examples, 290827 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:25,262 : INFO : PROGRESS: at 45.16% examples, 290831 words/s, in_qsize 6, out_qsize 0
2017-07-20 21:31:26,995 : INFO : PROGRESS: at 45.16% examples, 290768 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:31:28,010 : INFO : PROGRESS: at 45.17% examples, 290788 wor

2017-07-20 21:32:53,188 : INFO : PROGRESS: at 45.80% examples, 290851 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:32:54,294 : INFO : PROGRESS: at 45.81% examples, 290844 words/s, in_qsize 5, out_qsize 2
2017-07-20 21:32:56,587 : INFO : PROGRESS: at 45.81% examples, 290786 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:32:57,647 : INFO : PROGRESS: at 45.82% examples, 290806 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:32:58,650 : INFO : PROGRESS: at 45.84% examples, 290826 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:32:59,693 : INFO : PROGRESS: at 45.85% examples, 290844 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:33:00,726 : INFO : PROGRESS: at 45.85% examples, 290849 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:33:01,915 : INFO : PROGRESS: at 45.86% examples, 290845 words/s, in_qsize 7, out_qsize 2
2017-07-20 21:33:04,081 : INFO : PROGRESS: at 45.87% examples, 290797 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:33:05,104 : INFO : PROGRESS: at 45.88% examples, 290817 wor

2017-07-20 21:34:28,407 : INFO : PROGRESS: at 46.49% examples, 290934 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:30,531 : INFO : PROGRESS: at 46.50% examples, 290892 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:31,559 : INFO : PROGRESS: at 46.51% examples, 290914 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:32,560 : INFO : PROGRESS: at 46.52% examples, 290938 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:34:33,574 : INFO : PROGRESS: at 46.53% examples, 290957 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:34,594 : INFO : PROGRESS: at 46.54% examples, 290949 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:36,335 : INFO : PROGRESS: at 46.54% examples, 290905 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:37,349 : INFO : PROGRESS: at 46.55% examples, 290929 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:38,362 : INFO : PROGRESS: at 46.56% examples, 290950 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:34:39,389 : INFO : PROGRESS: at 46.57% examples, 290972 wor

2017-07-20 21:36:05,408 : INFO : PROGRESS: at 47.22% examples, 291210 words/s, in_qsize 6, out_qsize 0
2017-07-20 21:36:07,273 : INFO : PROGRESS: at 47.23% examples, 291144 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:08,309 : INFO : PROGRESS: at 47.24% examples, 291169 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:09,311 : INFO : PROGRESS: at 47.25% examples, 291195 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:10,355 : INFO : PROGRESS: at 47.26% examples, 291217 words/s, in_qsize 6, out_qsize 0
2017-07-20 21:36:11,398 : INFO : PROGRESS: at 47.27% examples, 291215 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:13,272 : INFO : PROGRESS: at 47.27% examples, 291171 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:14,272 : INFO : PROGRESS: at 47.28% examples, 291194 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:15,293 : INFO : PROGRESS: at 47.29% examples, 291216 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:36:16,296 : INFO : PROGRESS: at 47.30% examples, 291238 wor

2017-07-20 21:37:42,044 : INFO : PROGRESS: at 47.97% examples, 291492 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:44,580 : INFO : PROGRESS: at 47.98% examples, 291433 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:45,588 : INFO : PROGRESS: at 47.99% examples, 291456 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:46,612 : INFO : PROGRESS: at 48.00% examples, 291479 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:47,641 : INFO : PROGRESS: at 48.01% examples, 291502 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:49,323 : INFO : PROGRESS: at 48.01% examples, 291454 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:50,352 : INFO : PROGRESS: at 48.02% examples, 291478 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:37:51,372 : INFO : PROGRESS: at 48.04% examples, 291501 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:37:52,374 : INFO : PROGRESS: at 48.05% examples, 291525 words/s, in_qsize 3, out_qsize 0
2017-07-20 21:37:54,150 : INFO : PROGRESS: at 48.05% examples, 291460 wor

2017-07-20 21:39:20,575 : INFO : PROGRESS: at 48.70% examples, 291746 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:21,577 : INFO : PROGRESS: at 48.72% examples, 291768 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:23,624 : INFO : PROGRESS: at 48.72% examples, 291725 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:39:24,626 : INFO : PROGRESS: at 48.73% examples, 291748 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:25,627 : INFO : PROGRESS: at 48.74% examples, 291771 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:26,666 : INFO : PROGRESS: at 48.76% examples, 291793 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:27,672 : INFO : PROGRESS: at 48.76% examples, 291796 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:28,724 : INFO : PROGRESS: at 48.77% examples, 291800 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:39:29,811 : INFO : PROGRESS: at 48.78% examples, 291789 words/s, in_qsize 8, out_qsize 3
2017-07-20 21:39:30,847 : INFO : PROGRESS: at 48.79% examples, 291800 wor

2017-07-20 21:40:57,822 : INFO : PROGRESS: at 49.47% examples, 292028 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:40:58,832 : INFO : PROGRESS: at 49.48% examples, 292052 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:40:59,842 : INFO : PROGRESS: at 49.48% examples, 292043 words/s, in_qsize 5, out_qsize 2
2017-07-20 21:41:01,027 : INFO : PROGRESS: at 49.49% examples, 292044 words/s, in_qsize 3, out_qsize 3
2017-07-20 21:41:02,947 : INFO : PROGRESS: at 49.50% examples, 292007 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:41:03,953 : INFO : PROGRESS: at 49.52% examples, 292030 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:41:04,986 : INFO : PROGRESS: at 49.53% examples, 292054 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:41:05,998 : INFO : PROGRESS: at 49.54% examples, 292075 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:41:07,658 : INFO : PROGRESS: at 49.54% examples, 292010 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:41:08,665 : INFO : PROGRESS: at 49.55% examples, 292034 wor

2017-07-20 21:42:32,787 : INFO : PROGRESS: at 50.19% examples, 292272 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:42:33,922 : INFO : PROGRESS: at 50.20% examples, 292284 words/s, in_qsize 3, out_qsize 2
2017-07-20 21:42:36,112 : INFO : PROGRESS: at 50.21% examples, 292236 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:42:37,124 : INFO : PROGRESS: at 50.22% examples, 292258 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:42:38,136 : INFO : PROGRESS: at 50.23% examples, 292282 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:42:39,170 : INFO : PROGRESS: at 50.24% examples, 292301 words/s, in_qsize 5, out_qsize 1
2017-07-20 21:42:40,183 : INFO : PROGRESS: at 50.25% examples, 292298 words/s, in_qsize 5, out_qsize 1
2017-07-20 21:42:42,392 : INFO : PROGRESS: at 50.26% examples, 292260 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:42:43,439 : INFO : PROGRESS: at 50.27% examples, 292284 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:42:44,495 : INFO : PROGRESS: at 50.29% examples, 292307 wor

2017-07-20 21:44:08,770 : INFO : PROGRESS: at 50.92% examples, 292491 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:09,771 : INFO : PROGRESS: at 50.93% examples, 292512 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:10,777 : INFO : PROGRESS: at 50.94% examples, 292534 words/s, in_qsize 5, out_qsize 1
2017-07-20 21:44:12,326 : INFO : PROGRESS: at 50.94% examples, 292485 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:13,359 : INFO : PROGRESS: at 50.95% examples, 292508 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:14,361 : INFO : PROGRESS: at 50.97% examples, 292531 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:15,408 : INFO : PROGRESS: at 50.98% examples, 292553 words/s, in_qsize 4, out_qsize 0
2017-07-20 21:44:17,186 : INFO : PROGRESS: at 50.98% examples, 292492 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:18,207 : INFO : PROGRESS: at 50.99% examples, 292515 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:44:19,214 : INFO : PROGRESS: at 51.00% examples, 292539 wor

2017-07-20 21:45:43,462 : INFO : PROGRESS: at 51.63% examples, 292703 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:44,468 : INFO : PROGRESS: at 51.64% examples, 292727 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:45,488 : INFO : PROGRESS: at 51.66% examples, 292748 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:46,495 : INFO : PROGRESS: at 51.67% examples, 292768 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:45:48,187 : INFO : PROGRESS: at 51.67% examples, 292718 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:49,189 : INFO : PROGRESS: at 51.68% examples, 292741 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:50,194 : INFO : PROGRESS: at 51.69% examples, 292761 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:51,200 : INFO : PROGRESS: at 51.70% examples, 292782 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:53,353 : INFO : PROGRESS: at 51.71% examples, 292723 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:45:54,357 : INFO : PROGRESS: at 51.72% examples, 292747 wor

2017-07-20 21:47:17,254 : INFO : PROGRESS: at 52.34% examples, 292925 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:47:18,258 : INFO : PROGRESS: at 52.35% examples, 292946 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:47:19,283 : INFO : PROGRESS: at 52.37% examples, 292969 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:47:20,424 : INFO : PROGRESS: at 52.38% examples, 292983 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:47:21,477 : INFO : PROGRESS: at 52.39% examples, 292984 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:47:23,425 : INFO : PROGRESS: at 52.39% examples, 292943 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:47:24,460 : INFO : PROGRESS: at 52.40% examples, 292963 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:47:25,470 : INFO : PROGRESS: at 52.42% examples, 292987 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:47:26,486 : INFO : PROGRESS: at 52.43% examples, 293008 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:47:28,384 : INFO : PROGRESS: at 52.43% examples, 292950 wor

2017-07-20 21:48:53,016 : INFO : PROGRESS: at 53.08% examples, 293070 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:48:55,047 : INFO : PROGRESS: at 53.09% examples, 293023 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:48:56,103 : INFO : PROGRESS: at 53.10% examples, 293037 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:48:57,130 : INFO : PROGRESS: at 53.11% examples, 293053 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:48:58,152 : INFO : PROGRESS: at 53.12% examples, 293070 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:49:00,387 : INFO : PROGRESS: at 53.13% examples, 293011 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:49:01,430 : INFO : PROGRESS: at 53.13% examples, 293027 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:49:02,457 : INFO : PROGRESS: at 53.15% examples, 293045 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:49:03,471 : INFO : PROGRESS: at 53.16% examples, 293064 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:49:04,475 : INFO : PROGRESS: at 53.16% examples, 293062 wor

2017-07-20 21:50:32,769 : INFO : PROGRESS: at 53.77% examples, 292939 words/s, in_qsize 3, out_qsize 1
2017-07-20 21:50:33,775 : INFO : PROGRESS: at 53.78% examples, 292943 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:35,572 : INFO : PROGRESS: at 53.79% examples, 292901 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:36,576 : INFO : PROGRESS: at 53.80% examples, 292922 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:37,597 : INFO : PROGRESS: at 53.81% examples, 292942 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:38,608 : INFO : PROGRESS: at 53.82% examples, 292956 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:40,505 : INFO : PROGRESS: at 53.82% examples, 292900 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:41,520 : INFO : PROGRESS: at 53.83% examples, 292919 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:42,534 : INFO : PROGRESS: at 53.84% examples, 292938 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:50:43,554 : INFO : PROGRESS: at 53.85% examples, 292957 wor

2017-07-20 21:52:07,004 : INFO : PROGRESS: at 54.47% examples, 293045 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:52:08,554 : INFO : PROGRESS: at 54.47% examples, 292988 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:09,554 : INFO : PROGRESS: at 54.48% examples, 293007 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:10,574 : INFO : PROGRESS: at 54.49% examples, 293028 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:11,583 : INFO : PROGRESS: at 54.50% examples, 293047 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:13,295 : INFO : PROGRESS: at 54.51% examples, 293000 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:14,317 : INFO : PROGRESS: at 54.52% examples, 293018 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:15,322 : INFO : PROGRESS: at 54.53% examples, 293037 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:16,352 : INFO : PROGRESS: at 54.54% examples, 293052 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:52:17,358 : INFO : PROGRESS: at 54.55% examples, 293057 wor

2017-07-20 21:53:44,545 : INFO : PROGRESS: at 55.17% examples, 293081 words/s, in_qsize 8, out_qsize 0
2017-07-20 21:53:45,556 : INFO : PROGRESS: at 55.18% examples, 293101 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:46,609 : INFO : PROGRESS: at 55.19% examples, 293120 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:47,622 : INFO : PROGRESS: at 55.21% examples, 293140 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:49,689 : INFO : PROGRESS: at 55.21% examples, 293084 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:50,715 : INFO : PROGRESS: at 55.22% examples, 293104 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:51,717 : INFO : PROGRESS: at 55.23% examples, 293124 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:52,721 : INFO : PROGRESS: at 55.24% examples, 293143 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:54,535 : INFO : PROGRESS: at 55.25% examples, 293099 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:53:55,541 : INFO : PROGRESS: at 55.26% examples, 293121 wor

2017-07-20 21:55:22,347 : INFO : PROGRESS: at 55.91% examples, 293223 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:23,350 : INFO : PROGRESS: at 55.92% examples, 293243 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:25,298 : INFO : PROGRESS: at 55.93% examples, 293191 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:26,300 : INFO : PROGRESS: at 55.94% examples, 293210 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:55:27,303 : INFO : PROGRESS: at 55.95% examples, 293232 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:28,317 : INFO : PROGRESS: at 55.96% examples, 293252 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:29,362 : INFO : PROGRESS: at 55.97% examples, 293249 words/s, in_qsize 4, out_qsize 1
2017-07-20 21:55:31,770 : INFO : PROGRESS: at 55.98% examples, 293209 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:32,771 : INFO : PROGRESS: at 55.99% examples, 293231 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:55:33,813 : INFO : PROGRESS: at 56.00% examples, 293251 wor

2017-07-20 21:56:58,483 : INFO : PROGRESS: at 56.64% examples, 293404 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:56:59,531 : INFO : PROGRESS: at 56.65% examples, 293425 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:57:00,539 : INFO : PROGRESS: at 56.66% examples, 293446 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:57:01,547 : INFO : PROGRESS: at 56.67% examples, 293465 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:57:02,566 : INFO : PROGRESS: at 56.68% examples, 293459 words/s, in_qsize 6, out_qsize 1
2017-07-20 21:57:04,518 : INFO : PROGRESS: at 56.69% examples, 293422 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:57:05,572 : INFO : PROGRESS: at 56.70% examples, 293444 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:57:06,584 : INFO : PROGRESS: at 56.71% examples, 293465 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:57:07,588 : INFO : PROGRESS: at 56.72% examples, 293484 words/s, in_qsize 6, out_qsize 0
2017-07-20 21:57:09,360 : INFO : PROGRESS: at 56.72% examples, 293432 wor

2017-07-20 21:58:34,781 : INFO : PROGRESS: at 57.39% examples, 293704 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:36,296 : INFO : PROGRESS: at 57.40% examples, 293673 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:37,304 : INFO : PROGRESS: at 57.41% examples, 293694 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:38,314 : INFO : PROGRESS: at 57.42% examples, 293711 words/s, in_qsize 0, out_qsize 0
2017-07-20 21:58:39,588 : INFO : PROGRESS: at 57.42% examples, 293667 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:40,616 : INFO : PROGRESS: at 57.43% examples, 293689 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:41,622 : INFO : PROGRESS: at 57.44% examples, 293709 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:44,128 : INFO : PROGRESS: at 57.45% examples, 293671 words/s, in_qsize 8, out_qsize 1
2017-07-20 21:58:45,149 : INFO : PROGRESS: at 57.46% examples, 293694 words/s, in_qsize 7, out_qsize 0
2017-07-20 21:58:46,158 : INFO : PROGRESS: at 57.47% examples, 293714 wor

2017-07-20 22:00:12,137 : INFO : PROGRESS: at 58.14% examples, 293917 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:13,159 : INFO : PROGRESS: at 58.15% examples, 293934 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:14,185 : INFO : PROGRESS: at 58.16% examples, 293953 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:15,200 : INFO : PROGRESS: at 58.17% examples, 293960 words/s, in_qsize 3, out_qsize 0
2017-07-20 22:00:16,774 : INFO : PROGRESS: at 58.17% examples, 293912 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:17,818 : INFO : PROGRESS: at 58.18% examples, 293933 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:18,819 : INFO : PROGRESS: at 58.19% examples, 293952 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:19,840 : INFO : PROGRESS: at 58.20% examples, 293969 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:00:21,330 : INFO : PROGRESS: at 58.20% examples, 293922 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:00:22,332 : INFO : PROGRESS: at 58.21% examples, 293942 wor

2017-07-20 22:01:48,349 : INFO : PROGRESS: at 58.89% examples, 294173 words/s, in_qsize 2, out_qsize 1
2017-07-20 22:01:49,365 : INFO : PROGRESS: at 58.90% examples, 294179 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:51,170 : INFO : PROGRESS: at 58.90% examples, 294134 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:52,202 : INFO : PROGRESS: at 58.92% examples, 294154 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:53,254 : INFO : PROGRESS: at 58.93% examples, 294173 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:54,424 : INFO : PROGRESS: at 58.94% examples, 294184 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:01:56,374 : INFO : PROGRESS: at 58.95% examples, 294151 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:57,415 : INFO : PROGRESS: at 58.96% examples, 294171 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:58,426 : INFO : PROGRESS: at 58.97% examples, 294191 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:01:59,483 : INFO : PROGRESS: at 58.98% examples, 294210 wor

2017-07-20 22:03:25,435 : INFO : PROGRESS: at 59.63% examples, 294359 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:26,452 : INFO : PROGRESS: at 59.64% examples, 294379 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:27,464 : INFO : PROGRESS: at 59.65% examples, 294398 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:28,469 : INFO : PROGRESS: at 59.67% examples, 294419 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:29,478 : INFO : PROGRESS: at 59.67% examples, 294422 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:03:30,964 : INFO : PROGRESS: at 59.68% examples, 294376 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:32,008 : INFO : PROGRESS: at 59.69% examples, 294396 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:33,056 : INFO : PROGRESS: at 59.70% examples, 294416 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:03:34,127 : INFO : PROGRESS: at 59.71% examples, 294424 words/s, in_qsize 1, out_qsize 2
2017-07-20 22:03:36,277 : INFO : PROGRESS: at 59.72% examples, 294385 wor

2017-07-20 22:05:01,775 : INFO : PROGRESS: at 60.38% examples, 294603 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:02,819 : INFO : PROGRESS: at 60.39% examples, 294623 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:03,832 : INFO : PROGRESS: at 60.40% examples, 294643 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:04,859 : INFO : PROGRESS: at 60.42% examples, 294662 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:05,864 : INFO : PROGRESS: at 60.42% examples, 294658 words/s, in_qsize 3, out_qsize 0
2017-07-20 22:05:07,298 : INFO : PROGRESS: at 60.42% examples, 294617 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:08,310 : INFO : PROGRESS: at 60.43% examples, 294633 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:09,342 : INFO : PROGRESS: at 60.44% examples, 294641 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:10,379 : INFO : PROGRESS: at 60.45% examples, 294656 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:05:12,379 : INFO : PROGRESS: at 60.46% examples, 294611 wor

2017-07-20 22:06:35,363 : INFO : PROGRESS: at 61.12% examples, 294873 words/s, in_qsize 2, out_qsize 0
2017-07-20 22:06:37,179 : INFO : PROGRESS: at 61.12% examples, 294817 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:38,199 : INFO : PROGRESS: at 61.13% examples, 294837 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:39,214 : INFO : PROGRESS: at 61.14% examples, 294853 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:40,217 : INFO : PROGRESS: at 61.15% examples, 294873 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:41,997 : INFO : PROGRESS: at 61.15% examples, 294837 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:42,998 : INFO : PROGRESS: at 61.16% examples, 294857 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:44,030 : INFO : PROGRESS: at 61.18% examples, 294874 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:06:45,044 : INFO : PROGRESS: at 61.19% examples, 294892 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:06:46,412 : INFO : PROGRESS: at 61.19% examples, 294850 wor

2017-07-20 22:08:10,567 : INFO : PROGRESS: at 61.85% examples, 295081 words/s, in_qsize 1, out_qsize 2
2017-07-20 22:08:12,681 : INFO : PROGRESS: at 61.85% examples, 295041 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:08:13,722 : INFO : PROGRESS: at 61.86% examples, 295060 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:08:14,727 : INFO : PROGRESS: at 61.88% examples, 295080 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:08:15,770 : INFO : PROGRESS: at 61.89% examples, 295099 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:08:17,299 : INFO : PROGRESS: at 61.89% examples, 295056 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:08:18,326 : INFO : PROGRESS: at 61.90% examples, 295076 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:08:19,340 : INFO : PROGRESS: at 61.91% examples, 295095 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:08:20,348 : INFO : PROGRESS: at 61.92% examples, 295113 words/s, in_qsize 6, out_qsize 0
2017-07-20 22:08:22,069 : INFO : PROGRESS: at 61.93% examples, 295066 wor

2017-07-20 22:09:49,453 : INFO : PROGRESS: at 62.61% examples, 295290 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:09:50,455 : INFO : PROGRESS: at 62.62% examples, 295307 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:09:51,511 : INFO : PROGRESS: at 62.64% examples, 295325 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:09:53,198 : INFO : PROGRESS: at 62.64% examples, 295278 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:09:54,239 : INFO : PROGRESS: at 62.65% examples, 295297 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:09:55,296 : INFO : PROGRESS: at 62.66% examples, 295315 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:09:56,322 : INFO : PROGRESS: at 62.67% examples, 295333 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:09:57,751 : INFO : PROGRESS: at 62.67% examples, 295289 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:09:58,774 : INFO : PROGRESS: at 62.68% examples, 295308 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:09:59,777 : INFO : PROGRESS: at 62.69% examples, 295327 wor

2017-07-20 22:11:24,817 : INFO : PROGRESS: at 63.37% examples, 295532 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:11:26,136 : INFO : PROGRESS: at 63.37% examples, 295490 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:11:27,156 : INFO : PROGRESS: at 63.38% examples, 295510 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:11:28,162 : INFO : PROGRESS: at 63.39% examples, 295528 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:11:29,183 : INFO : PROGRESS: at 63.40% examples, 295545 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:11:30,186 : INFO : PROGRESS: at 63.41% examples, 295541 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:11:32,249 : INFO : PROGRESS: at 63.42% examples, 295506 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:11:33,283 : INFO : PROGRESS: at 63.43% examples, 295525 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:11:34,320 : INFO : PROGRESS: at 63.44% examples, 295544 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:11:35,324 : INFO : PROGRESS: at 63.45% examples, 295562 wor

2017-07-20 22:13:01,289 : INFO : PROGRESS: at 64.10% examples, 295704 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:02,295 : INFO : PROGRESS: at 64.12% examples, 295723 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:03,307 : INFO : PROGRESS: at 64.13% examples, 295739 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:04,330 : INFO : PROGRESS: at 64.14% examples, 295756 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:13:05,993 : INFO : PROGRESS: at 64.14% examples, 295706 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:06,993 : INFO : PROGRESS: at 64.15% examples, 295725 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:08,011 : INFO : PROGRESS: at 64.16% examples, 295742 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:09,023 : INFO : PROGRESS: at 64.17% examples, 295760 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:10,986 : INFO : PROGRESS: at 64.18% examples, 295724 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:13:12,004 : INFO : PROGRESS: at 64.19% examples, 295743 wor

2017-07-20 22:14:37,010 : INFO : PROGRESS: at 64.85% examples, 295933 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:38,022 : INFO : PROGRESS: at 64.86% examples, 295950 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:39,843 : INFO : PROGRESS: at 64.86% examples, 295911 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:40,882 : INFO : PROGRESS: at 64.87% examples, 295929 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:41,891 : INFO : PROGRESS: at 64.88% examples, 295946 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:42,905 : INFO : PROGRESS: at 64.90% examples, 295965 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:44,857 : INFO : PROGRESS: at 64.90% examples, 295918 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:45,880 : INFO : PROGRESS: at 64.91% examples, 295937 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:46,897 : INFO : PROGRESS: at 64.92% examples, 295953 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:14:48,067 : INFO : PROGRESS: at 64.93% examples, 295967 wor

2017-07-20 22:16:16,574 : INFO : PROGRESS: at 65.62% examples, 296158 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:17,576 : INFO : PROGRESS: at 65.63% examples, 296163 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:16:18,980 : INFO : PROGRESS: at 65.63% examples, 296120 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:16:20,009 : INFO : PROGRESS: at 65.64% examples, 296139 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:21,018 : INFO : PROGRESS: at 65.65% examples, 296157 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:22,028 : INFO : PROGRESS: at 65.66% examples, 296174 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:23,044 : INFO : PROGRESS: at 65.67% examples, 296171 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:24,688 : INFO : PROGRESS: at 65.67% examples, 296132 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:25,722 : INFO : PROGRESS: at 65.68% examples, 296150 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:16:26,728 : INFO : PROGRESS: at 65.70% examples, 296167 wor

2017-07-20 22:17:53,912 : INFO : PROGRESS: at 66.37% examples, 296354 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:17:54,916 : INFO : PROGRESS: at 66.38% examples, 296370 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:17:56,316 : INFO : PROGRESS: at 66.38% examples, 296328 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:17:57,347 : INFO : PROGRESS: at 66.39% examples, 296346 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:17:58,390 : INFO : PROGRESS: at 66.41% examples, 296364 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:17:59,439 : INFO : PROGRESS: at 66.42% examples, 296381 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:18:00,490 : INFO : PROGRESS: at 66.42% examples, 296356 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:18:01,502 : INFO : PROGRESS: at 66.43% examples, 296374 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:18:02,503 : INFO : PROGRESS: at 66.44% examples, 296389 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:18:04,072 : INFO : PROGRESS: at 66.44% examples, 296345 wor

2017-07-20 22:19:27,725 : INFO : PROGRESS: at 67.10% examples, 296557 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:19:28,754 : INFO : PROGRESS: at 67.11% examples, 296562 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:19:30,351 : INFO : PROGRESS: at 67.11% examples, 296515 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:19:31,357 : INFO : PROGRESS: at 67.12% examples, 296534 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:19:32,366 : INFO : PROGRESS: at 67.13% examples, 296551 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:19:33,381 : INFO : PROGRESS: at 67.14% examples, 296568 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:19:34,406 : INFO : PROGRESS: at 67.15% examples, 296574 words/s, in_qsize 2, out_qsize 0
2017-07-20 22:19:36,162 : INFO : PROGRESS: at 67.15% examples, 296524 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:19:37,183 : INFO : PROGRESS: at 67.16% examples, 296543 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:19:38,188 : INFO : PROGRESS: at 67.17% examples, 296560 wor

2017-07-20 22:21:04,917 : INFO : PROGRESS: at 67.84% examples, 296708 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:05,919 : INFO : PROGRESS: at 67.85% examples, 296726 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:06,938 : INFO : PROGRESS: at 67.87% examples, 296742 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:07,962 : INFO : PROGRESS: at 67.88% examples, 296759 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:09,073 : INFO : PROGRESS: at 67.88% examples, 296758 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:11,110 : INFO : PROGRESS: at 67.89% examples, 296716 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:12,155 : INFO : PROGRESS: at 67.90% examples, 296733 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:13,165 : INFO : PROGRESS: at 67.91% examples, 296749 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:14,176 : INFO : PROGRESS: at 67.92% examples, 296765 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:21:15,195 : INFO : PROGRESS: at 67.93% examples, 296770 wor

2017-07-20 22:22:44,802 : INFO : PROGRESS: at 68.61% examples, 296908 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:45,834 : INFO : PROGRESS: at 68.62% examples, 296926 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:46,839 : INFO : PROGRESS: at 68.63% examples, 296942 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:47,868 : INFO : PROGRESS: at 68.64% examples, 296959 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:49,573 : INFO : PROGRESS: at 68.65% examples, 296923 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:50,607 : INFO : PROGRESS: at 68.66% examples, 296940 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:51,613 : INFO : PROGRESS: at 68.67% examples, 296957 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:52,621 : INFO : PROGRESS: at 68.68% examples, 296972 words/s, in_qsize 5, out_qsize 0
2017-07-20 22:22:54,560 : INFO : PROGRESS: at 68.68% examples, 296921 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:22:55,562 : INFO : PROGRESS: at 68.69% examples, 296940 wor

2017-07-20 22:24:20,355 : INFO : PROGRESS: at 69.37% examples, 297113 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:21,377 : INFO : PROGRESS: at 69.38% examples, 297129 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:22,554 : INFO : PROGRESS: at 69.39% examples, 297136 words/s, in_qsize 2, out_qsize 2
2017-07-20 22:24:23,598 : INFO : PROGRESS: at 69.40% examples, 297140 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:25,689 : INFO : PROGRESS: at 69.41% examples, 297103 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:26,697 : INFO : PROGRESS: at 69.42% examples, 297121 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:27,707 : INFO : PROGRESS: at 69.43% examples, 297137 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:28,729 : INFO : PROGRESS: at 69.44% examples, 297154 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:30,505 : INFO : PROGRESS: at 69.45% examples, 297116 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:24:31,549 : INFO : PROGRESS: at 69.46% examples, 297133 wor

2017-07-20 22:25:54,990 : INFO : PROGRESS: at 70.10% examples, 297279 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:25:55,997 : INFO : PROGRESS: at 70.11% examples, 297296 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:25:57,027 : INFO : PROGRESS: at 70.12% examples, 297311 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:25:58,040 : INFO : PROGRESS: at 70.13% examples, 297316 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:25:59,354 : INFO : PROGRESS: at 70.13% examples, 297278 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:26:00,388 : INFO : PROGRESS: at 70.15% examples, 297295 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:26:01,413 : INFO : PROGRESS: at 70.16% examples, 297312 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:26:02,425 : INFO : PROGRESS: at 70.17% examples, 297327 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:26:04,101 : INFO : PROGRESS: at 70.17% examples, 297284 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:26:05,109 : INFO : PROGRESS: at 70.18% examples, 297301 wor

2017-07-20 22:27:30,768 : INFO : PROGRESS: at 70.84% examples, 297452 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:31,774 : INFO : PROGRESS: at 70.86% examples, 297469 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:32,777 : INFO : PROGRESS: at 70.87% examples, 297484 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:34,818 : INFO : PROGRESS: at 70.87% examples, 297440 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:35,856 : INFO : PROGRESS: at 70.88% examples, 297457 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:27:36,857 : INFO : PROGRESS: at 70.89% examples, 297474 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:27:37,864 : INFO : PROGRESS: at 70.90% examples, 297489 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:39,589 : INFO : PROGRESS: at 70.91% examples, 297456 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:40,626 : INFO : PROGRESS: at 70.92% examples, 297473 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:27:41,658 : INFO : PROGRESS: at 70.93% examples, 297490 wor

2017-07-20 22:29:06,105 : INFO : PROGRESS: at 71.57% examples, 297607 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:07,106 : INFO : PROGRESS: at 71.59% examples, 297624 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:08,115 : INFO : PROGRESS: at 71.60% examples, 297640 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:09,139 : INFO : PROGRESS: at 71.61% examples, 297654 words/s, in_qsize 6, out_qsize 0
2017-07-20 22:29:10,305 : INFO : PROGRESS: at 71.61% examples, 297629 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:11,310 : INFO : PROGRESS: at 71.62% examples, 297645 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:12,353 : INFO : PROGRESS: at 71.63% examples, 297661 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:29:14,105 : INFO : PROGRESS: at 71.63% examples, 297616 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:15,159 : INFO : PROGRESS: at 71.65% examples, 297633 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:29:16,181 : INFO : PROGRESS: at 71.66% examples, 297649 wor

2017-07-20 22:30:39,212 : INFO : PROGRESS: at 72.30% examples, 297809 words/s, in_qsize 6, out_qsize 0
2017-07-20 22:30:40,820 : INFO : PROGRESS: at 72.30% examples, 297771 words/s, in_qsize 7, out_qsize 1
2017-07-20 22:30:41,853 : INFO : PROGRESS: at 72.31% examples, 297787 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:30:42,865 : INFO : PROGRESS: at 72.32% examples, 297803 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:30:43,873 : INFO : PROGRESS: at 72.34% examples, 297820 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:30:46,285 : INFO : PROGRESS: at 72.34% examples, 297781 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:30:47,287 : INFO : PROGRESS: at 72.36% examples, 297798 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:30:48,296 : INFO : PROGRESS: at 72.37% examples, 297814 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:30:49,316 : INFO : PROGRESS: at 72.38% examples, 297823 words/s, in_qsize 6, out_qsize 0
2017-07-20 22:30:50,347 : INFO : PROGRESS: at 72.38% examples, 297824 wor

2017-07-20 22:32:15,912 : INFO : PROGRESS: at 73.07% examples, 297947 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:16,924 : INFO : PROGRESS: at 73.08% examples, 297962 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:17,924 : INFO : PROGRESS: at 73.09% examples, 297977 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:19,493 : INFO : PROGRESS: at 73.09% examples, 297943 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:20,499 : INFO : PROGRESS: at 73.10% examples, 297958 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:21,516 : INFO : PROGRESS: at 73.11% examples, 297974 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:22,516 : INFO : PROGRESS: at 73.12% examples, 297990 words/s, in_qsize 6, out_qsize 0
2017-07-20 22:32:24,321 : INFO : PROGRESS: at 73.13% examples, 297947 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:25,357 : INFO : PROGRESS: at 73.14% examples, 297964 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:32:26,393 : INFO : PROGRESS: at 73.15% examples, 297980 wor

2017-07-20 22:33:51,304 : INFO : PROGRESS: at 73.80% examples, 298108 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:33:52,330 : INFO : PROGRESS: at 73.81% examples, 298123 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:33:53,343 : INFO : PROGRESS: at 73.82% examples, 298138 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:33:54,761 : INFO : PROGRESS: at 73.82% examples, 298102 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:33:55,805 : INFO : PROGRESS: at 73.83% examples, 298118 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:33:56,858 : INFO : PROGRESS: at 73.84% examples, 298134 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:33:58,042 : INFO : PROGRESS: at 73.85% examples, 298142 words/s, in_qsize 1, out_qsize 3
2017-07-20 22:33:59,434 : INFO : PROGRESS: at 73.86% examples, 298130 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:34:00,437 : INFO : PROGRESS: at 73.87% examples, 298141 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:34:01,438 : INFO : PROGRESS: at 73.88% examples, 298149 wor

2017-07-20 22:35:26,580 : INFO : PROGRESS: at 74.54% examples, 298296 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:29,054 : INFO : PROGRESS: at 74.55% examples, 298253 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:30,066 : INFO : PROGRESS: at 74.56% examples, 298268 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:31,068 : INFO : PROGRESS: at 74.57% examples, 298284 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:35:32,075 : INFO : PROGRESS: at 74.58% examples, 298299 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:33,076 : INFO : PROGRESS: at 74.59% examples, 298304 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:34,738 : INFO : PROGRESS: at 74.59% examples, 298271 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:35,744 : INFO : PROGRESS: at 74.60% examples, 298287 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:36,763 : INFO : PROGRESS: at 74.62% examples, 298302 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:35:37,819 : INFO : PROGRESS: at 74.63% examples, 298317 wor

2017-07-20 22:37:03,228 : INFO : PROGRESS: at 75.28% examples, 298448 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:37:04,240 : INFO : PROGRESS: at 75.28% examples, 298444 words/s, in_qsize 5, out_qsize 1
2017-07-20 22:37:05,254 : INFO : PROGRESS: at 75.30% examples, 298452 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:37:06,284 : INFO : PROGRESS: at 75.30% examples, 298450 words/s, in_qsize 4, out_qsize 2
2017-07-20 22:37:07,309 : INFO : PROGRESS: at 75.32% examples, 298457 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:37:08,315 : INFO : PROGRESS: at 75.32% examples, 298462 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:37:09,885 : INFO : PROGRESS: at 75.33% examples, 298422 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:37:10,897 : INFO : PROGRESS: at 75.34% examples, 298438 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:37:11,928 : INFO : PROGRESS: at 75.35% examples, 298452 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:37:12,930 : INFO : PROGRESS: at 75.36% examples, 298465 wor

2017-07-20 22:38:38,257 : INFO : PROGRESS: at 76.03% examples, 298608 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:38:39,714 : INFO : PROGRESS: at 76.03% examples, 298572 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:38:40,763 : INFO : PROGRESS: at 76.04% examples, 298587 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:38:41,773 : INFO : PROGRESS: at 76.05% examples, 298603 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:38:42,784 : INFO : PROGRESS: at 76.06% examples, 298618 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:38:44,831 : INFO : PROGRESS: at 76.07% examples, 298582 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:38:45,861 : INFO : PROGRESS: at 76.08% examples, 298598 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:38:46,867 : INFO : PROGRESS: at 76.09% examples, 298613 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:38:47,886 : INFO : PROGRESS: at 76.10% examples, 298626 words/s, in_qsize 1, out_qsize 0
2017-07-20 22:38:49,280 : INFO : PROGRESS: at 76.10% examples, 298592 wor

2017-07-20 22:40:12,350 : INFO : PROGRESS: at 76.75% examples, 298762 words/s, in_qsize 2, out_qsize 0
2017-07-20 22:40:13,868 : INFO : PROGRESS: at 76.76% examples, 298725 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:40:14,869 : INFO : PROGRESS: at 76.77% examples, 298740 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:40:15,891 : INFO : PROGRESS: at 76.78% examples, 298754 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:40:16,898 : INFO : PROGRESS: at 76.79% examples, 298770 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:40:17,957 : INFO : PROGRESS: at 76.80% examples, 298768 words/s, in_qsize 4, out_qsize 2
2017-07-20 22:40:18,981 : INFO : PROGRESS: at 76.81% examples, 298774 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:40:19,989 : INFO : PROGRESS: at 76.82% examples, 298779 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:40:21,590 : INFO : PROGRESS: at 76.82% examples, 298735 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:40:22,625 : INFO : PROGRESS: at 76.83% examples, 298751 wor

2017-07-20 22:41:50,240 : INFO : PROGRESS: at 77.51% examples, 298901 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:41:51,249 : INFO : PROGRESS: at 77.52% examples, 298914 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:41:53,091 : INFO : PROGRESS: at 77.52% examples, 298876 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:41:54,096 : INFO : PROGRESS: at 77.53% examples, 298891 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:41:55,112 : INFO : PROGRESS: at 77.54% examples, 298905 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:41:56,350 : INFO : PROGRESS: at 77.55% examples, 298913 words/s, in_qsize 3, out_qsize 1
2017-07-20 22:41:58,292 : INFO : PROGRESS: at 77.56% examples, 298888 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:41:59,329 : INFO : PROGRESS: at 77.57% examples, 298904 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:42:00,339 : INFO : PROGRESS: at 77.58% examples, 298919 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:42:01,495 : INFO : PROGRESS: at 77.59% examples, 298926 wor

2017-07-20 22:43:28,274 : INFO : PROGRESS: at 78.27% examples, 299045 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:29,318 : INFO : PROGRESS: at 78.28% examples, 299060 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:30,345 : INFO : PROGRESS: at 78.29% examples, 299056 words/s, in_qsize 6, out_qsize 1
2017-07-20 22:43:32,454 : INFO : PROGRESS: at 78.30% examples, 299028 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:33,487 : INFO : PROGRESS: at 78.31% examples, 299043 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:34,498 : INFO : PROGRESS: at 78.32% examples, 299057 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:35,599 : INFO : PROGRESS: at 78.33% examples, 299063 words/s, in_qsize 1, out_qsize 3
2017-07-20 22:43:38,076 : INFO : PROGRESS: at 78.34% examples, 299032 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:39,084 : INFO : PROGRESS: at 78.35% examples, 299047 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:43:40,085 : INFO : PROGRESS: at 78.36% examples, 299061 wor

2017-07-20 22:45:03,953 : INFO : PROGRESS: at 79.02% examples, 299191 words/s, in_qsize 6, out_qsize 1
2017-07-20 22:45:04,998 : INFO : PROGRESS: at 79.03% examples, 299195 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:06,780 : INFO : PROGRESS: at 79.03% examples, 299157 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:07,781 : INFO : PROGRESS: at 79.04% examples, 299172 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:08,797 : INFO : PROGRESS: at 79.05% examples, 299186 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:09,797 : INFO : PROGRESS: at 79.06% examples, 299198 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:11,468 : INFO : PROGRESS: at 79.07% examples, 299169 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:12,502 : INFO : PROGRESS: at 79.08% examples, 299182 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:13,505 : INFO : PROGRESS: at 79.09% examples, 299197 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:45:14,540 : INFO : PROGRESS: at 79.10% examples, 299203 wor

2017-07-20 22:46:40,955 : INFO : PROGRESS: at 79.77% examples, 299313 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:41,957 : INFO : PROGRESS: at 79.78% examples, 299327 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:43,305 : INFO : PROGRESS: at 79.79% examples, 299330 words/s, in_qsize 2, out_qsize 0
2017-07-20 22:46:45,220 : INFO : PROGRESS: at 79.80% examples, 299303 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:46,239 : INFO : PROGRESS: at 79.81% examples, 299317 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:47,282 : INFO : PROGRESS: at 79.82% examples, 299332 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:48,283 : INFO : PROGRESS: at 79.83% examples, 299346 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:49,309 : INFO : PROGRESS: at 79.84% examples, 299342 words/s, in_qsize 4, out_qsize 1
2017-07-20 22:46:51,332 : INFO : PROGRESS: at 79.84% examples, 299315 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:46:52,336 : INFO : PROGRESS: at 79.86% examples, 299330 wor

2017-07-20 22:48:16,652 : INFO : PROGRESS: at 80.50% examples, 299424 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:17,677 : INFO : PROGRESS: at 80.51% examples, 299439 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:18,687 : INFO : PROGRESS: at 80.52% examples, 299452 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:19,731 : INFO : PROGRESS: at 80.53% examples, 299466 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:20,753 : INFO : PROGRESS: at 80.54% examples, 299471 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:48:22,196 : INFO : PROGRESS: at 80.54% examples, 299433 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:23,241 : INFO : PROGRESS: at 80.56% examples, 299447 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:24,271 : INFO : PROGRESS: at 80.57% examples, 299462 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:48:25,276 : INFO : PROGRESS: at 80.58% examples, 299475 words/s, in_qsize 0, out_qsize 1
2017-07-20 22:48:26,575 : INFO : PROGRESS: at 80.58% examples, 299445 wor

2017-07-20 22:49:51,264 : INFO : PROGRESS: at 81.23% examples, 299560 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:49:52,270 : INFO : PROGRESS: at 81.25% examples, 299574 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:49:53,307 : INFO : PROGRESS: at 81.26% examples, 299587 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:49:54,328 : INFO : PROGRESS: at 81.27% examples, 299602 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:49:55,717 : INFO : PROGRESS: at 81.27% examples, 299568 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:49:56,750 : INFO : PROGRESS: at 81.28% examples, 299583 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:49:57,750 : INFO : PROGRESS: at 81.29% examples, 299597 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:49:58,760 : INFO : PROGRESS: at 81.30% examples, 299611 words/s, in_qsize 5, out_qsize 0
2017-07-20 22:50:00,484 : INFO : PROGRESS: at 81.30% examples, 299573 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:50:01,505 : INFO : PROGRESS: at 81.31% examples, 299588 wor

2017-07-20 22:51:27,640 : INFO : PROGRESS: at 81.98% examples, 299712 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:51:28,693 : INFO : PROGRESS: at 81.99% examples, 299725 words/s, in_qsize 5, out_qsize 0
2017-07-20 22:51:30,812 : INFO : PROGRESS: at 82.00% examples, 299698 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:51:31,814 : INFO : PROGRESS: at 82.02% examples, 299713 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:51:32,817 : INFO : PROGRESS: at 82.03% examples, 299725 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:51:33,826 : INFO : PROGRESS: at 82.04% examples, 299738 words/s, in_qsize 0, out_qsize 0
2017-07-20 22:51:35,364 : INFO : PROGRESS: at 82.04% examples, 299697 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:51:36,364 : INFO : PROGRESS: at 82.05% examples, 299712 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:51:37,378 : INFO : PROGRESS: at 82.06% examples, 299725 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:51:38,381 : INFO : PROGRESS: at 82.07% examples, 299739 wor

2017-07-20 22:53:04,571 : INFO : PROGRESS: at 82.74% examples, 299859 words/s, in_qsize 6, out_qsize 0
2017-07-20 22:53:06,206 : INFO : PROGRESS: at 82.74% examples, 299825 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:07,211 : INFO : PROGRESS: at 82.76% examples, 299840 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:08,229 : INFO : PROGRESS: at 82.77% examples, 299853 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:09,243 : INFO : PROGRESS: at 82.78% examples, 299864 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:10,327 : INFO : PROGRESS: at 82.79% examples, 299864 words/s, in_qsize 7, out_qsize 1
2017-07-20 22:53:12,248 : INFO : PROGRESS: at 82.79% examples, 299831 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:13,276 : INFO : PROGRESS: at 82.80% examples, 299843 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:14,285 : INFO : PROGRESS: at 82.81% examples, 299857 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:53:15,289 : INFO : PROGRESS: at 82.82% examples, 299872 wor

2017-07-20 22:54:41,133 : INFO : PROGRESS: at 83.50% examples, 299958 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:42,827 : INFO : PROGRESS: at 83.50% examples, 299931 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:43,839 : INFO : PROGRESS: at 83.52% examples, 299944 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:44,870 : INFO : PROGRESS: at 83.53% examples, 299958 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:45,899 : INFO : PROGRESS: at 83.54% examples, 299970 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:54:47,526 : INFO : PROGRESS: at 83.54% examples, 299934 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:48,546 : INFO : PROGRESS: at 83.55% examples, 299948 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:49,567 : INFO : PROGRESS: at 83.56% examples, 299961 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:51,766 : INFO : PROGRESS: at 83.57% examples, 299941 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:54:52,768 : INFO : PROGRESS: at 83.58% examples, 299955 wor

2017-07-20 22:56:16,993 : INFO : PROGRESS: at 84.22% examples, 300049 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:56:17,995 : INFO : PROGRESS: at 84.23% examples, 300062 words/s, in_qsize 8, out_qsize 0
2017-07-20 22:56:19,048 : INFO : PROGRESS: at 84.25% examples, 300075 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:56:20,104 : INFO : PROGRESS: at 84.25% examples, 300073 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:56:22,137 : INFO : PROGRESS: at 84.26% examples, 300044 words/s, in_qsize 8, out_qsize 1
2017-07-20 22:56:23,181 : INFO : PROGRESS: at 84.27% examples, 300058 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:56:24,231 : INFO : PROGRESS: at 84.28% examples, 300072 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:56:25,353 : INFO : PROGRESS: at 84.30% examples, 300079 words/s, in_qsize 0, out_qsize 2
2017-07-20 22:56:26,377 : INFO : PROGRESS: at 84.30% examples, 300084 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:56:27,415 : INFO : PROGRESS: at 84.32% examples, 300088 wor

2017-07-20 22:57:54,063 : INFO : PROGRESS: at 84.97% examples, 300177 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:57:55,987 : INFO : PROGRESS: at 84.98% examples, 300143 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:57:57,009 : INFO : PROGRESS: at 84.99% examples, 300157 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:57:58,038 : INFO : PROGRESS: at 85.00% examples, 300170 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:57:59,074 : INFO : PROGRESS: at 85.01% examples, 300183 words/s, in_qsize 4, out_qsize 0
2017-07-20 22:58:00,617 : INFO : PROGRESS: at 85.01% examples, 300151 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:58:01,621 : INFO : PROGRESS: at 85.02% examples, 300162 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:58:02,633 : INFO : PROGRESS: at 85.03% examples, 300171 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:58:03,652 : INFO : PROGRESS: at 85.04% examples, 300184 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:58:05,704 : INFO : PROGRESS: at 85.05% examples, 300151 wor

2017-07-20 22:59:33,206 : INFO : PROGRESS: at 85.73% examples, 300278 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:59:34,222 : INFO : PROGRESS: at 85.74% examples, 300291 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:59:35,231 : INFO : PROGRESS: at 85.75% examples, 300296 words/s, in_qsize 5, out_qsize 0
2017-07-20 22:59:36,317 : INFO : PROGRESS: at 85.76% examples, 300289 words/s, in_qsize 6, out_qsize 2
2017-07-20 22:59:38,163 : INFO : PROGRESS: at 85.77% examples, 300268 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:59:39,208 : INFO : PROGRESS: at 85.78% examples, 300282 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:59:40,223 : INFO : PROGRESS: at 85.79% examples, 300294 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:59:41,295 : INFO : PROGRESS: at 85.80% examples, 300299 words/s, in_qsize 0, out_qsize 2
2017-07-20 22:59:42,299 : INFO : PROGRESS: at 85.81% examples, 300305 words/s, in_qsize 7, out_qsize 0
2017-07-20 22:59:44,121 : INFO : PROGRESS: at 85.81% examples, 300270 wor

2017-07-20 23:01:09,007 : INFO : PROGRESS: at 86.48% examples, 300409 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:10,030 : INFO : PROGRESS: at 86.48% examples, 300393 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:11,042 : INFO : PROGRESS: at 86.49% examples, 300405 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:13,338 : INFO : PROGRESS: at 86.50% examples, 300374 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:14,387 : INFO : PROGRESS: at 86.51% examples, 300388 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:15,392 : INFO : PROGRESS: at 86.52% examples, 300401 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:16,415 : INFO : PROGRESS: at 86.53% examples, 300414 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:17,444 : INFO : PROGRESS: at 86.54% examples, 300417 words/s, in_qsize 0, out_qsize 0
2017-07-20 23:01:18,736 : INFO : PROGRESS: at 86.54% examples, 300387 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:01:19,743 : INFO : PROGRESS: at 86.55% examples, 300400 wor

2017-07-20 23:02:44,132 : INFO : PROGRESS: at 87.20% examples, 300503 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:45,146 : INFO : PROGRESS: at 87.21% examples, 300516 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:46,158 : INFO : PROGRESS: at 87.22% examples, 300528 words/s, in_qsize 5, out_qsize 0
2017-07-20 23:02:47,712 : INFO : PROGRESS: at 87.23% examples, 300497 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:48,753 : INFO : PROGRESS: at 87.24% examples, 300511 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:49,759 : INFO : PROGRESS: at 87.25% examples, 300523 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:50,817 : INFO : PROGRESS: at 87.26% examples, 300535 words/s, in_qsize 5, out_qsize 1
2017-07-20 23:02:51,941 : INFO : PROGRESS: at 87.26% examples, 300528 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:53,897 : INFO : PROGRESS: at 87.27% examples, 300503 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:02:54,941 : INFO : PROGRESS: at 87.28% examples, 300516 wor

2017-07-20 23:04:18,912 : INFO : PROGRESS: at 87.93% examples, 300594 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:19,941 : INFO : PROGRESS: at 87.94% examples, 300608 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:20,953 : INFO : PROGRESS: at 87.96% examples, 300621 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:22,152 : INFO : PROGRESS: at 87.97% examples, 300629 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:04:24,379 : INFO : PROGRESS: at 87.98% examples, 300599 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:25,405 : INFO : PROGRESS: at 87.99% examples, 300613 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:26,412 : INFO : PROGRESS: at 88.00% examples, 300626 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:27,425 : INFO : PROGRESS: at 88.01% examples, 300639 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:29,021 : INFO : PROGRESS: at 88.01% examples, 300610 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:04:30,064 : INFO : PROGRESS: at 88.02% examples, 300624 wor

2017-07-20 23:05:54,475 : INFO : PROGRESS: at 88.67% examples, 300729 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:05:55,513 : INFO : PROGRESS: at 88.68% examples, 300742 words/s, in_qsize 3, out_qsize 0
2017-07-20 23:05:57,395 : INFO : PROGRESS: at 88.68% examples, 300701 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:05:58,409 : INFO : PROGRESS: at 88.69% examples, 300715 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:05:59,416 : INFO : PROGRESS: at 88.70% examples, 300727 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:06:00,436 : INFO : PROGRESS: at 88.72% examples, 300740 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:06:02,414 : INFO : PROGRESS: at 88.72% examples, 300714 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:06:03,415 : INFO : PROGRESS: at 88.73% examples, 300728 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:06:04,416 : INFO : PROGRESS: at 88.74% examples, 300740 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:06:05,434 : INFO : PROGRESS: at 88.76% examples, 300752 wor

2017-07-20 23:07:30,687 : INFO : PROGRESS: at 89.43% examples, 300839 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:31,701 : INFO : PROGRESS: at 89.44% examples, 300852 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:33,426 : INFO : PROGRESS: at 89.45% examples, 300822 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:34,448 : INFO : PROGRESS: at 89.46% examples, 300835 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:35,456 : INFO : PROGRESS: at 89.47% examples, 300847 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:36,508 : INFO : PROGRESS: at 89.48% examples, 300859 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:37,789 : INFO : PROGRESS: at 89.49% examples, 300854 words/s, in_qsize 4, out_qsize 3
2017-07-20 23:07:38,811 : INFO : PROGRESS: at 89.50% examples, 300859 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:40,431 : INFO : PROGRESS: at 89.50% examples, 300834 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:07:41,481 : INFO : PROGRESS: at 89.52% examples, 300847 wor

2017-07-20 23:09:04,293 : INFO : PROGRESS: at 90.16% examples, 300948 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:05,343 : INFO : PROGRESS: at 90.17% examples, 300960 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:09:06,804 : INFO : PROGRESS: at 90.17% examples, 300931 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:07,810 : INFO : PROGRESS: at 90.18% examples, 300944 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:08,823 : INFO : PROGRESS: at 90.19% examples, 300956 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:09,826 : INFO : PROGRESS: at 90.20% examples, 300966 words/s, in_qsize 5, out_qsize 0
2017-07-20 23:09:12,153 : INFO : PROGRESS: at 90.21% examples, 300933 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:13,199 : INFO : PROGRESS: at 90.22% examples, 300944 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:14,204 : INFO : PROGRESS: at 90.23% examples, 300957 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:09:15,236 : INFO : PROGRESS: at 90.24% examples, 300969 wor

2017-07-20 23:10:40,262 : INFO : PROGRESS: at 90.90% examples, 301072 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:42,251 : INFO : PROGRESS: at 90.91% examples, 301040 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:43,295 : INFO : PROGRESS: at 90.92% examples, 301053 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:44,345 : INFO : PROGRESS: at 90.93% examples, 301065 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:45,370 : INFO : PROGRESS: at 90.94% examples, 301077 words/s, in_qsize 1, out_qsize 0
2017-07-20 23:10:46,797 : INFO : PROGRESS: at 90.94% examples, 301047 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:47,815 : INFO : PROGRESS: at 90.95% examples, 301060 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:48,829 : INFO : PROGRESS: at 90.97% examples, 301072 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:10:49,855 : INFO : PROGRESS: at 90.98% examples, 301084 words/s, in_qsize 5, out_qsize 0
2017-07-20 23:10:51,625 : INFO : PROGRESS: at 90.98% examples, 301048 wor

2017-07-20 23:12:15,233 : INFO : PROGRESS: at 91.63% examples, 301169 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:12:16,738 : INFO : PROGRESS: at 91.63% examples, 301140 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:17,781 : INFO : PROGRESS: at 91.65% examples, 301152 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:18,786 : INFO : PROGRESS: at 91.66% examples, 301165 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:19,804 : INFO : PROGRESS: at 91.67% examples, 301177 words/s, in_qsize 6, out_qsize 0
2017-07-20 23:12:21,621 : INFO : PROGRESS: at 91.67% examples, 301141 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:22,640 : INFO : PROGRESS: at 91.68% examples, 301154 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:23,670 : INFO : PROGRESS: at 91.69% examples, 301165 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:24,687 : INFO : PROGRESS: at 91.70% examples, 301178 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:12:26,424 : INFO : PROGRESS: at 91.71% examples, 301149 wor

2017-07-20 23:13:50,295 : INFO : PROGRESS: at 92.36% examples, 301248 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:51,325 : INFO : PROGRESS: at 92.37% examples, 301260 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:52,407 : INFO : PROGRESS: at 92.38% examples, 301268 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:53,450 : INFO : PROGRESS: at 92.39% examples, 301268 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:55,554 : INFO : PROGRESS: at 92.39% examples, 301239 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:56,557 : INFO : PROGRESS: at 92.40% examples, 301252 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:57,563 : INFO : PROGRESS: at 92.42% examples, 301264 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:13:58,573 : INFO : PROGRESS: at 92.43% examples, 301276 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:14:00,219 : INFO : PROGRESS: at 92.43% examples, 301247 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:14:01,229 : INFO : PROGRESS: at 92.44% examples, 301261 wor

2017-07-20 23:15:24,825 : INFO : PROGRESS: at 93.11% examples, 301354 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:25,841 : INFO : PROGRESS: at 93.12% examples, 301367 words/s, in_qsize 6, out_qsize 0
2017-07-20 23:15:27,392 : INFO : PROGRESS: at 93.13% examples, 301338 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:28,436 : INFO : PROGRESS: at 93.14% examples, 301351 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:29,476 : INFO : PROGRESS: at 93.15% examples, 301363 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:30,606 : INFO : PROGRESS: at 93.16% examples, 301370 words/s, in_qsize 5, out_qsize 1
2017-07-20 23:15:32,798 : INFO : PROGRESS: at 93.17% examples, 301342 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:33,818 : INFO : PROGRESS: at 93.18% examples, 301355 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:34,827 : INFO : PROGRESS: at 93.19% examples, 301367 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:15:35,876 : INFO : PROGRESS: at 93.20% examples, 301380 wor

2017-07-20 23:16:59,988 : INFO : PROGRESS: at 93.84% examples, 301461 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:01,384 : INFO : PROGRESS: at 93.85% examples, 301463 words/s, in_qsize 0, out_qsize 2
2017-07-20 23:17:02,611 : INFO : PROGRESS: at 93.86% examples, 301456 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:17:03,628 : INFO : PROGRESS: at 93.87% examples, 301465 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:04,630 : INFO : PROGRESS: at 93.88% examples, 301469 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:06,372 : INFO : PROGRESS: at 93.89% examples, 301444 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:07,383 : INFO : PROGRESS: at 93.90% examples, 301457 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:08,413 : INFO : PROGRESS: at 93.91% examples, 301468 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:09,413 : INFO : PROGRESS: at 93.92% examples, 301478 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:17:11,163 : INFO : PROGRESS: at 93.92% examples, 301446 wor

2017-07-20 23:18:36,441 : INFO : PROGRESS: at 94.59% examples, 301565 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:38,298 : INFO : PROGRESS: at 94.59% examples, 301534 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:39,341 : INFO : PROGRESS: at 94.60% examples, 301545 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:40,349 : INFO : PROGRESS: at 94.62% examples, 301558 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:41,356 : INFO : PROGRESS: at 94.63% examples, 301568 words/s, in_qsize 6, out_qsize 1
2017-07-20 23:18:42,932 : INFO : PROGRESS: at 94.63% examples, 301540 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:43,935 : INFO : PROGRESS: at 94.64% examples, 301553 words/s, in_qsize 8, out_qsize 0
2017-07-20 23:18:44,936 : INFO : PROGRESS: at 94.65% examples, 301565 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:45,938 : INFO : PROGRESS: at 94.66% examples, 301575 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:18:47,766 : INFO : PROGRESS: at 94.67% examples, 301542 wor

2017-07-20 23:20:12,033 : INFO : PROGRESS: at 95.32% examples, 301654 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:13,578 : INFO : PROGRESS: at 95.33% examples, 301628 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:14,579 : INFO : PROGRESS: at 95.34% examples, 301640 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:15,612 : INFO : PROGRESS: at 95.35% examples, 301651 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:16,642 : INFO : PROGRESS: at 95.36% examples, 301663 words/s, in_qsize 3, out_qsize 0
2017-07-20 23:20:18,277 : INFO : PROGRESS: at 95.36% examples, 301631 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:19,322 : INFO : PROGRESS: at 95.37% examples, 301643 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:20,332 : INFO : PROGRESS: at 95.39% examples, 301655 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:20:21,425 : INFO : PROGRESS: at 95.39% examples, 301659 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:20:23,346 : INFO : PROGRESS: at 95.40% examples, 301638 wor

2017-07-20 23:21:49,937 : INFO : PROGRESS: at 96.08% examples, 301736 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:21:50,948 : INFO : PROGRESS: at 96.09% examples, 301748 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:21:51,963 : INFO : PROGRESS: at 96.10% examples, 301759 words/s, in_qsize 0, out_qsize 0
2017-07-20 23:21:53,383 : INFO : PROGRESS: at 96.10% examples, 301729 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:21:54,390 : INFO : PROGRESS: at 96.12% examples, 301742 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:21:55,404 : INFO : PROGRESS: at 96.13% examples, 301753 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:21:56,419 : INFO : PROGRESS: at 96.14% examples, 301764 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:21:58,172 : INFO : PROGRESS: at 96.14% examples, 301730 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:21:59,179 : INFO : PROGRESS: at 96.15% examples, 301742 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:22:00,196 : INFO : PROGRESS: at 96.16% examples, 301753 wor

2017-07-20 23:23:23,689 : INFO : PROGRESS: at 96.81% examples, 301840 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:24,694 : INFO : PROGRESS: at 96.82% examples, 301844 words/s, in_qsize 0, out_qsize 0
2017-07-20 23:23:26,275 : INFO : PROGRESS: at 96.82% examples, 301808 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:27,286 : INFO : PROGRESS: at 96.83% examples, 301820 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:28,314 : INFO : PROGRESS: at 96.84% examples, 301831 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:29,316 : INFO : PROGRESS: at 96.85% examples, 301843 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:31,543 : INFO : PROGRESS: at 96.86% examples, 301812 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:32,546 : INFO : PROGRESS: at 96.87% examples, 301824 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:33,567 : INFO : PROGRESS: at 96.88% examples, 301835 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:23:34,575 : INFO : PROGRESS: at 96.89% examples, 301847 wor

2017-07-20 23:24:59,817 : INFO : PROGRESS: at 97.54% examples, 301924 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:25:01,223 : INFO : PROGRESS: at 97.55% examples, 301925 words/s, in_qsize 4, out_qsize 0
2017-07-20 23:25:03,174 : INFO : PROGRESS: at 97.56% examples, 301904 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:25:04,179 : INFO : PROGRESS: at 97.57% examples, 301916 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:25:05,192 : INFO : PROGRESS: at 97.58% examples, 301927 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:25:06,370 : INFO : PROGRESS: at 97.59% examples, 301933 words/s, in_qsize 3, out_qsize 1
2017-07-20 23:25:07,381 : INFO : PROGRESS: at 97.61% examples, 301939 words/s, in_qsize 6, out_qsize 0
2017-07-20 23:25:09,354 : INFO : PROGRESS: at 97.61% examples, 301909 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:25:10,388 : INFO : PROGRESS: at 97.62% examples, 301920 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:25:11,392 : INFO : PROGRESS: at 97.63% examples, 301931 wor

2017-07-20 23:26:37,226 : INFO : PROGRESS: at 98.30% examples, 301997 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:38,259 : INFO : PROGRESS: at 98.31% examples, 302009 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:39,272 : INFO : PROGRESS: at 98.32% examples, 302019 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:40,405 : INFO : PROGRESS: at 98.33% examples, 302026 words/s, in_qsize 2, out_qsize 0
2017-07-20 23:26:41,419 : INFO : PROGRESS: at 98.34% examples, 302031 words/s, in_qsize 0, out_qsize 0
2017-07-20 23:26:42,889 : INFO : PROGRESS: at 98.34% examples, 301998 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:43,895 : INFO : PROGRESS: at 98.35% examples, 302010 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:44,928 : INFO : PROGRESS: at 98.36% examples, 302021 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:45,937 : INFO : PROGRESS: at 98.37% examples, 302033 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:26:47,006 : INFO : PROGRESS: at 98.38% examples, 302031 wor

2017-07-20 23:28:09,802 : INFO : PROGRESS: at 99.03% examples, 302109 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:11,614 : INFO : PROGRESS: at 99.03% examples, 302079 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:12,655 : INFO : PROGRESS: at 99.04% examples, 302091 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:13,675 : INFO : PROGRESS: at 99.05% examples, 302102 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:14,679 : INFO : PROGRESS: at 99.07% examples, 302113 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:16,251 : INFO : PROGRESS: at 99.07% examples, 302088 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:17,264 : INFO : PROGRESS: at 99.08% examples, 302101 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:18,277 : INFO : PROGRESS: at 99.09% examples, 302112 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:28:19,513 : INFO : PROGRESS: at 99.10% examples, 302112 words/s, in_qsize 8, out_qsize 2
2017-07-20 23:28:20,518 : INFO : PROGRESS: at 99.11% examples, 302113 wor

2017-07-20 23:29:47,401 : INFO : PROGRESS: at 99.78% examples, 302183 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:48,485 : INFO : PROGRESS: at 99.79% examples, 302187 words/s, in_qsize 2, out_qsize 3
2017-07-20 23:29:50,469 : INFO : PROGRESS: at 99.80% examples, 302166 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:51,486 : INFO : PROGRESS: at 99.81% examples, 302178 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:52,491 : INFO : PROGRESS: at 99.82% examples, 302188 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:53,494 : INFO : PROGRESS: at 99.83% examples, 302200 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:54,688 : INFO : PROGRESS: at 99.84% examples, 302194 words/s, in_qsize 3, out_qsize 2
2017-07-20 23:29:56,591 : INFO : PROGRESS: at 99.84% examples, 302174 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:57,628 : INFO : PROGRESS: at 99.86% examples, 302185 words/s, in_qsize 7, out_qsize 0
2017-07-20 23:29:58,641 : INFO : PROGRESS: at 99.87% examples, 302197 wor

# Save

In [8]:
! mkdir -p {join(DATA_FOLDER, 'saved/')}

In [9]:
model_name = 'saved/w2v_model_%s_w3' % dim
model.save(join(DATA_FOLDER, model_name))
# model = gensim.models.Word2Vec.load(join(DATA_FOLDER, model_name))

2017-07-20 23:30:15,635 : INFO : saving Word2Vec object under ../data/saved/w2v_model_300_w3, separately None
2017-07-20 23:30:15,639 : INFO : storing np array 'syn0' to ../data/saved/w2v_model_300_w3.wv.syn0.npy
2017-07-20 23:30:16,128 : INFO : not storing attribute syn0norm
2017-07-20 23:30:16,129 : INFO : storing np array 'syn1neg' to ../data/saved/w2v_model_300_w3.syn1neg.npy
2017-07-20 23:30:17,178 : INFO : not storing attribute cum_table
2017-07-20 23:30:19,117 : INFO : saved ../data/saved/w2v_model_300_w3


In [19]:
model.wv.most_similar(positive=['помидор'], topn=100)

[('ландски', 0.653936505317688),
 ('испански', 0.6457735300064087),
 ('мексикански', 0.6404526829719543),
 ('корейски', 0.6396678686141968),
 ('луком', 0.6394015550613403),
 ('венгерски', 0.6392226815223694),
 ('егорлыкски', 0.6357219815254211),
 ('кабачка', 0.6335285902023315),
 ('датски', 0.6319401264190674),
 ('харчо', 0.6316151022911072),
 ('томатов', 0.6303468942642212),
 ('редиска', 0.6300629377365112),
 ('макрель', 0.6299110054969788),
 ('таджикски', 0.6283292770385742),
 ('пихельштейнски', 0.6281647682189941),
 ('раккио', 0.627670168876648),
 ('баклажанин', 0.6275602579116821),
 ('форшмак', 0.6269422173500061),
 ('спарж', 0.6264820694923401),
 ('сардинопс', 0.6256702542304993),
 ('зажарка', 0.6255209445953369),
 ('мусак', 0.6254160404205322),
 ('латук', 0.624730110168457),
 ('шотландски', 0.6224321126937866),
 ('цуккини', 0.6219453811645508),
 ('чакапуля', 0.6219143867492676),
 ('черемшой', 0.6201030611991882),
 ('владивостокски', 0.6199373602867126),
 ('кубански', 0.6189488768

# Tensorflow visualisation

In [8]:
vocab_size = len(model.wv.vocab)
embedding_dim = model.vector_size

W = tf.Variable(tf.constant(0.0, shape=[vocab_size, embedding_dim]),
                trainable=False, name="W")
embedding_placeholder = tf.placeholder(tf.float32, [vocab_size, embedding_dim])
embedding_init = W.assign(embedding_placeholder)

In [9]:
import csv

vocab = dict(enumerate(model.wv.index2word))
vdf = pd.DataFrame.from_dict(vocab, orient='index')
vdf.to_csv('../data/processed/vocab.tsv', header=False, sep='\t', index=False)


In [10]:
with tf.Session() as sess:
    final_embed_matrix = sess.run(embedding_init, feed_dict={embedding_placeholder: model.wv.syn0})
    
#     final_embed_matrix = sess.run(weights)

    # it has to variable. constants don't work here. you can't reuse model.embed_matrix
    embedding_var = tf.Variable(final_embed_matrix, name='embedding')
    sess.run(embedding_var.initializer)

    config = projector.ProjectorConfig()
    summary_writer = tf.summary.FileWriter('../data/processed')

    # add embedding to the config file
    embedding = config.embeddings.add()
    embedding.tensor_name = embedding_var.name

    # link this tensor to its metadata file, in this case the first 500 words of vocab
    embedding.metadata_path = 'vocab.tsv'

    # saves a configuration file that TensorBoard will read during startup.
    projector.visualize_embeddings(summary_writer, config)
    saver_embed = tf.train.Saver([embedding_var])
    saver_embed.save(sess, '../data/processed/model3.ckpt', 1)


# Phrases

## Bigram

In [3]:
bigram = gensim.models.Phrases(Sentences(join(DATA_FOLDER, 'documents/')))

2017-09-27 12:00:11,419 [MainThread  ] [INFO ]  collecting all words and their counts
2017-09-27 12:00:11,423 [MainThread  ] [INFO ]  ../data/documents/674.json.gz
2017-09-27 12:00:12,801 [MainThread  ] [INFO ]  PROGRESS: at sentence #0, processed 0 words and 0 word types
2017-09-27 12:00:13,054 [MainThread  ] [INFO ]  PROGRESS: at sentence #10000, processed 215157 words and 88228 word types
2017-09-27 12:00:13,351 [MainThread  ] [INFO ]  PROGRESS: at sentence #20000, processed 434821 words and 167144 word types
2017-09-27 12:00:13,671 [MainThread  ] [INFO ]  PROGRESS: at sentence #30000, processed 650225 words and 242273 word types
2017-09-27 12:00:13,969 [MainThread  ] [INFO ]  PROGRESS: at sentence #40000, processed 876484 words and 307222 word types
2017-09-27 12:00:14,334 [MainThread  ] [INFO ]  PROGRESS: at sentence #50000, processed 1106013 words and 367356 word types
2017-09-27 12:00:14,614 [MainThread  ] [INFO ]  PROGRESS: at sentence #60000, processed 1322326 words and 425076

KeyboardInterrupt: 

In [None]:
bigram.save('../data/saved/bigram')

In [3]:
bigram = gensim.models.phrases.Phrases.load(join(DATA_FOLDER, '../data/saved/bigram'))

2017-09-27 13:30:40,328 [MainThread  ] [INFO ]  loading Phrases object from ../data/../data/saved/bigram
2017-09-27 13:30:49,979 [MainThread  ] [INFO ]  loaded ../data/../data/saved/bigram


In [60]:
sentences = Sentences(join(DATA_FOLDER, 'documents/'))
for phrase, score in islice(bigram.export_phrases(sentences), 1000):
    print('{0}   {1}'.format(phrase, score))

2017-09-27 14:20:41,007 [MainThread  ] [INFO ]  0: ../data/documents/72.json.gz


маринадный заливка   338.519314005
консервный промышленность   40.1941253921
маринадный заливка   338.519314005
резинотехнический изделие   11.9184606059
хлорсульфировать полиэтилен   195.139701867
хлорсульфировать полиэтилен   195.139701867
экологически чистый   53.7831689966
детонационный стук   207.310001499
аккумуляторный батарея   71.3640937225
аккумуляторный батарея   71.3640937225
золото серебро   19.7843616849
катушка индуктивность   28.176506679
машиностроение приборостроение   14.7190976767
ввинчивать вывинчивать   58.8406142324
производительность труд   12.5296462192
испытательный стенд   20.055985761
диаметральный противоположно   66.2605101191
глушитель шум   27.5462566583
глушитель шум   27.5462566583
глушитель шум   27.5462566583
очистной комбайн   24.8301290317
очистной комбайн   24.8301290317
резать кромка   13.0431266045
кинематически связанный   12.9356296566
гипсометрия пласт   31.4388328233
физико механический   12.7172095375
резать кромка   13.0431266045
многоатом

зубчатый венец   35.0268612795
зубчатый венец   35.0268612795
физико химический   23.3553322243
контрольно измерительный   37.4218616856
rs триггер   21.5408918042
оперативный запоминать   14.5492511812
сульфидный медно   228.95134482
полезный ископаемое   17.8123643822
пиритсодержащий сульфидный   14.6872916578
сульфидный медно   228.95134482
собиратель вспениватель   334.76234632
весы поосный   110.667630656
железнодорожный транспорт   37.842189218
подъездный путь   14.4767112758
тахометрический расходомер   59.0085457967
тахометрический расходомер   59.0085457967
тахометрический расходомер   59.0085457967
рупор предрупорный   34.6438486736
электроакустический преобразователь   22.6437490891
изгибный колебание   14.3532409159
геодезический приборостроение   36.3789049734
геодезический маркшейдерский   98.0988711271
надир зенит   279.291898578
фокусный расстояние   19.0697918036
окулярный микрометр   110.599837571
координатный сетка   11.6583141801
надир зенит   279.291898578
аминоспи

In [61]:
text = u'изобретение относится к пищевой промышленности\n . известен способ получения плодово-  ш одного сиропа, предусматривающий рас- \n тморение сахара внесение лимонной  «.немоты, выдержку сиропа, охлаждение и \n ,ильтрооание его, купажирование сиропа с  лимонной кислотой, пантокрином, настоями\n  чилибухи, женьшеня, солодкового корня,  лимонного или апельсинового, кориандра и  ореха. недостатком известного сиропа является  го. что в его состав входит труднодоступ- \n ное и дорогостоящее сырье, низкая  стабильность биологически активных вещее  то. известен способ получения плодово-  я одного сиропа из плодов рябины, предус- \n мз1 рмвающий приготовление экстракта,  фильтрацию его, введение сахара пли сорбита\n  и упаривание, добавление пупаренный  сироп лимонной и аскорбиновой кислоты, \n издержку при 86°с в течение 30 мин. розлив  и  ь-достатком известного способа явля-  jrrn к, что сироп практически не обогащен \n f.i h. itичоски активными веществами, что  снижает его пищевую ценность. наиболее близким техническим решением  к предлагаемому является способ пол- \n /чения плодово-ягодного сиропа,  предусматривающий приготовление плодово-ягодного\n  экстракта, смешивание его с сахаром , внесение лимонной кислоты в него и \n термообработку до 90-95°с, выдержку плодово-ягодного  сиропа в течение 30-60 мин, \n охлаждение до 75-80°с, смешивание с водным  концентратом шиповника, разделение \n аскорбиновой кислоты на две равные части,  одну из которых растворяют в воде при перемешивании\n , вносят в раствор 20-40 %  водно-спиртовой экстракт биомассы женьшеня\n , перемешивают до однородного состояния , выдерживают 30-60 мин и \n купажируют с плодово-ягодным экстрактом  и второй частью аскорбиновой кислоты, купаж  перемешивают. недостатком известного способа являются  недостаточно высокие диетические  свойства сиропа.\n техническим результатом является повышение  диетических свойств готового продукта\n , его стабильности и снижение расхода  сахара. это достигается, тем, что в способе получения  сиропа, предусматривающем приготовление\n  плодово-ягодного компонента,  включающее экстракцию плодово-ягодного \n сырья водой. экстракцию шиповника водой  и соединение с плодово-ягодным компонентов  и лимонной кислотой, выдерживание  полученной смеси в течение 1-2,5 ч для \n завершения экстракции, затем полученный  экстракт упаривают при 65-70°с до содержания\n  сухих веществ 4-6 %, концентрат  разделяют на две части, одну из частей смешивают\n  с сахаром- песком и упаривают, после  чего полученный сироп смешивают со \n второй частью концентрата и аскорбиновой кислотой, полученный готовый продукт разливают\n . для повышения биологических качеств  в готовый продукт дополнительно \n вводят витамины bi, б2, вз, во, рр и с при  следующем соотношении, мг на 100 г сиро5  па: bi 0,24-0,28 820,07-0,09 830,11-0.13 \n вб 0,18-0.22 0рр 0,18-0,22 с 18,8-22,8 данный способ экстракции шиповника  позволяет лучше экстрагировать каротино- \n иды и другие биологически и физиологиче5  ски активные вещества, что обусловлено \n синергизмом и образованием новых химических  связей. что же касается того, что концентрат  разделяют на 2 части, а увариванию подвер0\n  гают только 1 масть, то этот прием направ--  лен на сохранение питатопьных и \n биологически активных веществ получаемого  сиропа. в обычных пищевых рационах, \n включающих продукты животного и расти5  тельного происхождения, наиболее дефицитными\n , чаще всего зимой и ранней  весной,являются витамины с, в1,в2,вз,веи \n pp. разработано также соотношение витаминов  в-|,в2.вз,в(),с и рр и получаемого си0\n  ропа, что позволяет компенсировать  нехватку витаминов. предлагаемый способ осуществляют  следующим образом. 5 к 420-440 кг протертых ягод и/или плодов  добавляют 1300 л воды и экстрагируют \n их при 95- 970с в течение 1-2 ч. в иффузо-  ре плоды шиповник заливают , добавляют\n  1,6-2,0 кг лимонной .нслоты и 0 полученный плодово-ягодный экстракт.\n смесь выдерживают в течение 1,0-2.5 ч. экстракт  отделяют от осч,ка ц угиривают при \n 65-70°с до сод чжэния сухих веществ 4-6  %. концентрат разделяют на две части, одну \n 5 из которых смешиьгкуг с 1440 кг сахара-песка , упаривают при 90-95°с в течение 30-60 \n мин, затем сироп охлаждают до 75-80°с. к  сиропу добавляют остальную часть концентрата\n  и аскорбиновую кислоту, перемешивают  и разливают. п р и м е р 1. 420 кг протертых ягод  рябины красной и черноплодной заливают \n 1300 л воды и экстрагируют при 97°с в течение  1 ч. плоды шиповника заливают водой, \n добавляют 1,6 кг лимонной кислоты п пол-  ученный ягодный экстракт и смесь выдерживают\n  1 ч, экстракт отделяют от осадка,  упаривают 2 ч при 65°с до содержания в \n концентрате сухих веществ а % . концентрат  разделяют на две части, в одну из них в \n количестве 480 л добавляют 1440 кг сахара-  песка и уваривают при 90°с в течение 30 \n мин. затем сироп охлаждают до 75°с, смешивают  его с 300 л оставшегося концентрата\n  и- 8,2 г аскорбиновой кислоты. смесь  перемешивают и разливают. п р и м е р 2. 430 кг протертых ягод  красной и черноплодной рябины, клюквы и \n брусники заливают 1300 л воды и экстрагируют  при 95°с в течение 1,5 ч. плоды ти- \n повника заливают водой, добавляют 2,0 кг  лимонной кислоты и полученный ягодный \n экстракт, выдерживают смесь при 67°с 2 ч  до получения экстракта с содержанием сухих\n  веществ 5 %. экстракт отделяют от  осадка, упаривают при 70°с до содержания \n сухих веществ 6 %. концентрат разделяют формула изобретения \n 1. способ получения сиропа, предусматри-  вающий приготовление водного экстракта \n шиповника и приготовление плодово-ягодное  о компонента, включающее экстракцию \n плодово-ягодного сырья водой, купажирование  с сахаром - песком, уваривание и охлаждение\n  полученного плодово-ягодного  компонента, соединение с водным экстрактом  шиповника и лимонной кислоты,\n перемешивание готового продукта с зскор-  биновой кислотой и розлив, отличающийся \n тем, что соединение плодово-ягодного  компонента с водным экстрактом шиповника\n  и лимонной кислотой осуществляют в процессе экстракции шиповника и полученную\n  смесь выдерживают в течение 1 -  2,5 ч для завершения экстракции и упари5 ю  15  20 \n 25  0  5 п  5 на две части, одну из них в количестве 500 л \n вносят 1440 кг сахара-песка и упаривают  при 95°с в течение 30 мин. после этого \n сироп охлаждают до 80°с, смешивают с оставшимся  количеством концентрата и 8,2 кг \n аскорбиновой кислоты, перемешивают и  разливают. пример 3. способ осуществляют \n аналогично поимеоу 1. но экстрагируют 440  кг протертых ягод красной рябины, черемухи\n  и  рники 2 ч при 97°с, а выдержку плодов  шиповника осуществляют при 70°с в  течение 2,5 ч. предлагаемый способ позволяет повысить  диети.ческие свойства готового продукта\n , ею стабильность. двукратная  экстракция ягод позволяет извлечь дополнительное\n  количество сахара, фруктозы,  сорбозы, глюкозы, ор1анических кислот, \n свободных аминокислот, каратиноидов и дубильных  веществ. (56j авторское свидетельство ссср  № 1500244, кл. а 23 l 2/00, 1985. сироп витаминизированный из плодов  рябины с сорбитом ту 64-0307-1-87. сироп из плодов шиповника с биоженьшенем  iу 64-5-175-90. вают при температуре 65 - 70 с до содержания  сухих веществ 4-6 %, полученный \n концентрат разделяют на две части, причем  купажированию с сахаром-песком и \n увариванию подвергают только одну часть,  а вторую часть смешивают с полученным  сиропом 2. способ по п.1, отличающийся тем,  что при перемешивании готового продукта \n дополнительно вводят витамины bl 82,  вз, вб, рр и с при следующем соотношении . мг/100 г сиропа: bi  0,24-0,28 в20,07 - 0.09 бз0,11-0,13 bg0,18-0,22 рр0,18-0,22 с18,8-22,8\n",'
doc = []
for sentence in nltk.sent_tokenize(text):
    tokenized_sent = list(tokenize(sentence, stop_list=simple_stop_list))
    doc.append(tokenized_sent)

for phrase, score in bigram.export_phrases(doc):
    print('{0}   {1}'.format(phrase, score))

водно спиртовой   226.221757447
плодово ягодный   1539.49973915
авторское свидетельство   167.717854718
ссср кл   39.5114021874


In [66]:
sentences = Sentences(join(DATA_FOLDER, 'documents/'))
model = Word2Vec(bigram[sentences], size=dim, sg=1, min_count=5, window=10, workers=cpu_count)

2017-09-27 14:31:37,803 [MainThread  ] [INFO ]  0: ../data/documents/72.json.gz
2017-09-27 14:31:37,944 [MainThread  ] [DEBUG]  Fast version of gensim.models.word2vec is being used
2017-09-27 14:31:37,945 [MainThread  ] [INFO ]  collecting all words and their counts
2017-09-27 14:31:37,946 [MainThread  ] [INFO ]  PROGRESS: at sentence #0, processed 0 words, keeping 0 word types
2017-09-27 14:31:38,713 [MainThread  ] [INFO ]  1: ../data/documents/228.json.gz
2017-09-27 14:31:40,765 [MainThread  ] [INFO ]  PROGRESS: at sentence #10000, processed 172754 words, keeping 17982 word types
2017-09-27 14:31:42,077 [MainThread  ] [INFO ]  PROGRESS: at sentence #20000, processed 353297 words, keeping 30496 word types
2017-09-27 14:31:43,424 [MainThread  ] [INFO ]  PROGRESS: at sentence #30000, processed 536780 words, keeping 41342 word types
2017-09-27 14:31:44,819 [MainThread  ] [INFO ]  PROGRESS: at sentence #40000, processed 728442 words, keeping 52539 word types
2017-09-27 14:31:46,173 [MainT

2017-09-27 14:33:17,223 [MainThread  ] [INFO ]  PROGRESS: at sentence #520000, processed 10139711 words, keeping 204790 word types
2017-09-27 14:33:18,764 [MainThread  ] [INFO ]  PROGRESS: at sentence #530000, processed 10356942 words, keeping 206158 word types
2017-09-27 14:33:20,219 [MainThread  ] [INFO ]  16: ../data/documents/793.json.gz
2017-09-27 14:33:22,850 [MainThread  ] [INFO ]  PROGRESS: at sentence #540000, processed 10569837 words, keeping 208025 word types
2017-09-27 14:33:24,860 [MainThread  ] [INFO ]  PROGRESS: at sentence #550000, processed 10848931 words, keeping 210157 word types
2017-09-27 14:33:25,623 [MainThread  ] [INFO ]  17: ../data/documents/253.json.gz
2017-09-27 14:33:30,880 [MainThread  ] [INFO ]  PROGRESS: at sentence #560000, processed 11067783 words, keeping 212726 word types
2017-09-27 14:33:32,163 [MainThread  ] [INFO ]  PROGRESS: at sentence #570000, processed 11239984 words, keeping 215284 word types
2017-09-27 14:33:33,524 [MainThread  ] [INFO ]  PR

2017-09-27 14:35:09,847 [MainThread  ] [INFO ]  PROGRESS: at sentence #1090000, processed 21571395 words, keeping 293502 word types
2017-09-27 14:35:11,259 [MainThread  ] [INFO ]  PROGRESS: at sentence #1100000, processed 21771553 words, keeping 295332 word types
2017-09-27 14:35:12,576 [MainThread  ] [INFO ]  PROGRESS: at sentence #1110000, processed 21946540 words, keeping 296572 word types
2017-09-27 14:35:13,898 [MainThread  ] [INFO ]  PROGRESS: at sentence #1120000, processed 22123324 words, keeping 299081 word types
2017-09-27 14:35:14,452 [MainThread  ] [INFO ]  26: ../data/documents/702.json.gz
2017-09-27 14:35:16,451 [MainThread  ] [INFO ]  PROGRESS: at sentence #1130000, processed 22364827 words, keeping 300680 word types
2017-09-27 14:35:18,227 [MainThread  ] [INFO ]  PROGRESS: at sentence #1140000, processed 22613879 words, keeping 302873 word types
2017-09-27 14:35:19,025 [MainThread  ] [INFO ]  27: ../data/documents/865.json.gz
2017-09-27 14:35:26,841 [MainThread  ] [INFO

2017-09-27 14:37:02,088 [MainThread  ] [INFO ]  PROGRESS: at sentence #1650000, processed 32593385 words, keeping 380489 word types
2017-09-27 14:37:03,496 [MainThread  ] [INFO ]  PROGRESS: at sentence #1660000, processed 32776975 words, keeping 382042 word types
2017-09-27 14:37:05,006 [MainThread  ] [INFO ]  PROGRESS: at sentence #1670000, processed 32982387 words, keeping 383309 word types
2017-09-27 14:37:06,528 [MainThread  ] [INFO ]  PROGRESS: at sentence #1680000, processed 33181942 words, keeping 384393 word types
2017-09-27 14:37:07,983 [MainThread  ] [INFO ]  PROGRESS: at sentence #1690000, processed 33377402 words, keeping 385687 word types
2017-09-27 14:37:09,477 [MainThread  ] [INFO ]  PROGRESS: at sentence #1700000, processed 33577219 words, keeping 387511 word types
2017-09-27 14:37:10,886 [MainThread  ] [INFO ]  PROGRESS: at sentence #1710000, processed 33766475 words, keeping 388406 word types
2017-09-27 14:37:12,208 [MainThread  ] [INFO ]  PROGRESS: at sentence #17200

2017-09-27 14:38:47,638 [MainThread  ] [INFO ]  PROGRESS: at sentence #2240000, processed 43847366 words, keeping 469843 word types
2017-09-27 14:38:48,894 [MainThread  ] [INFO ]  PROGRESS: at sentence #2250000, processed 44011167 words, keeping 471201 word types
2017-09-27 14:38:49,724 [MainThread  ] [INFO ]  41: ../data/documents/335.json.gz
2017-09-27 14:38:51,749 [MainThread  ] [INFO ]  PROGRESS: at sentence #2260000, processed 44188912 words, keeping 474111 word types
2017-09-27 14:38:53,183 [MainThread  ] [INFO ]  PROGRESS: at sentence #2270000, processed 44392666 words, keeping 478817 word types
2017-09-27 14:38:54,624 [MainThread  ] [INFO ]  PROGRESS: at sentence #2280000, processed 44588842 words, keeping 483184 word types
2017-09-27 14:38:56,038 [MainThread  ] [INFO ]  PROGRESS: at sentence #2290000, processed 44779288 words, keeping 486464 word types
2017-09-27 14:38:57,532 [MainThread  ] [INFO ]  PROGRESS: at sentence #2300000, processed 44978078 words, keeping 490602 word 

2017-09-27 14:40:38,124 [MainThread  ] [INFO ]  PROGRESS: at sentence #2820000, processed 54976294 words, keeping 555392 word types
2017-09-27 14:40:39,692 [MainThread  ] [INFO ]  PROGRESS: at sentence #2830000, processed 55189412 words, keeping 556140 word types
2017-09-27 14:40:41,175 [MainThread  ] [INFO ]  PROGRESS: at sentence #2840000, processed 55384108 words, keeping 558096 word types
2017-09-27 14:40:42,633 [MainThread  ] [INFO ]  PROGRESS: at sentence #2850000, processed 55579127 words, keeping 559320 word types
2017-09-27 14:40:44,168 [MainThread  ] [INFO ]  PROGRESS: at sentence #2860000, processed 55788318 words, keeping 560425 word types
2017-09-27 14:40:45,522 [MainThread  ] [INFO ]  PROGRESS: at sentence #2870000, processed 55972652 words, keeping 561790 word types
2017-09-27 14:40:47,003 [MainThread  ] [INFO ]  PROGRESS: at sentence #2880000, processed 56173853 words, keeping 562540 word types
2017-09-27 14:40:48,471 [MainThread  ] [INFO ]  PROGRESS: at sentence #28900

2017-09-27 14:42:24,855 [MainThread  ] [INFO ]  PROGRESS: at sentence #3410000, processed 66261295 words, keeping 617052 word types
2017-09-27 14:42:26,256 [MainThread  ] [INFO ]  PROGRESS: at sentence #3420000, processed 66450247 words, keeping 618055 word types
2017-09-27 14:42:27,695 [MainThread  ] [INFO ]  PROGRESS: at sentence #3430000, processed 66639822 words, keeping 619184 word types
2017-09-27 14:42:28,051 [MainThread  ] [INFO ]  54: ../data/documents/918.json.gz
2017-09-27 14:42:42,202 [MainThread  ] [INFO ]  PROGRESS: at sentence #3440000, processed 66988163 words, keeping 620495 word types
2017-09-27 14:42:44,433 [MainThread  ] [INFO ]  PROGRESS: at sentence #3450000, processed 67291587 words, keeping 622352 word types
2017-09-27 14:42:47,594 [MainThread  ] [INFO ]  PROGRESS: at sentence #3460000, processed 67740122 words, keeping 623138 word types
2017-09-27 14:42:49,804 [MainThread  ] [INFO ]  PROGRESS: at sentence #3470000, processed 68043636 words, keeping 623945 word 

2017-09-27 14:44:38,121 [MainThread  ] [INFO ]  PROGRESS: at sentence #4000000, processed 80304323 words, keeping 675028 word types
2017-09-27 14:44:39,251 [MainThread  ] [INFO ]  59: ../data/documents/829.json.gz
2017-09-27 14:44:43,711 [MainThread  ] [INFO ]  PROGRESS: at sentence #4010000, processed 80519321 words, keeping 675695 word types
2017-09-27 14:44:45,353 [MainThread  ] [INFO ]  PROGRESS: at sentence #4020000, processed 80740967 words, keeping 676389 word types
2017-09-27 14:44:47,029 [MainThread  ] [INFO ]  PROGRESS: at sentence #4030000, processed 80957264 words, keeping 677132 word types
2017-09-27 14:44:48,635 [MainThread  ] [INFO ]  PROGRESS: at sentence #4040000, processed 81173205 words, keeping 677822 word types
2017-09-27 14:44:50,232 [MainThread  ] [INFO ]  PROGRESS: at sentence #4050000, processed 81388416 words, keeping 678427 word types
2017-09-27 14:44:51,772 [MainThread  ] [INFO ]  PROGRESS: at sentence #4060000, processed 81601844 words, keeping 679375 word 

2017-09-27 14:46:26,413 [MainThread  ] [INFO ]  PROGRESS: at sentence #4580000, processed 91218202 words, keeping 731958 word types
2017-09-27 14:46:27,802 [MainThread  ] [INFO ]  PROGRESS: at sentence #4590000, processed 91397990 words, keeping 732759 word types
2017-09-27 14:46:28,692 [MainThread  ] [INFO ]  66: ../data/documents/173.json.gz
2017-09-27 14:46:29,721 [MainThread  ] [INFO ]  PROGRESS: at sentence #4600000, processed 91596285 words, keeping 734055 word types
2017-09-27 14:46:30,620 [MainThread  ] [INFO ]  67: ../data/documents/154.json.gz
2017-09-27 14:46:35,492 [MainThread  ] [INFO ]  PROGRESS: at sentence #4610000, processed 91801002 words, keeping 735176 word types
2017-09-27 14:46:36,835 [MainThread  ] [INFO ]  PROGRESS: at sentence #4620000, processed 91970248 words, keeping 736392 word types
2017-09-27 14:46:38,201 [MainThread  ] [INFO ]  PROGRESS: at sentence #4630000, processed 92145128 words, keeping 737556 word types
2017-09-27 14:46:39,669 [MainThread  ] [INFO

2017-09-27 14:48:10,595 [MainThread  ] [INFO ]  77: ../data/documents/30.json.gz
2017-09-27 14:48:11,331 [MainThread  ] [INFO ]  PROGRESS: at sentence #5140000, processed 101896737 words, keeping 799267 word types
2017-09-27 14:48:11,564 [MainThread  ] [INFO ]  78: ../data/documents/491.json.gz
2017-09-27 14:48:13,806 [MainThread  ] [INFO ]  PROGRESS: at sentence #5150000, processed 102160236 words, keeping 800934 word types
2017-09-27 14:48:15,277 [MainThread  ] [INFO ]  79: ../data/documents/898.json.gz
2017-09-27 14:48:18,224 [MainThread  ] [INFO ]  PROGRESS: at sentence #5160000, processed 102408273 words, keeping 802300 word types
2017-09-27 14:48:20,093 [MainThread  ] [INFO ]  PROGRESS: at sentence #5170000, processed 102671593 words, keeping 803274 word types
2017-09-27 14:48:21,498 [MainThread  ] [INFO ]  80: ../data/documents/852.json.gz
2017-09-27 14:48:22,505 [MainThread  ] [INFO ]  PROGRESS: at sentence #5180000, processed 102923013 words, keeping 804329 word types
2017-09-

2017-09-27 14:50:09,094 [MainThread  ] [INFO ]  PROGRESS: at sentence #5680000, processed 113605231 words, keeping 845378 word types
2017-09-27 14:50:10,549 [MainThread  ] [INFO ]  PROGRESS: at sentence #5690000, processed 113797367 words, keeping 845904 word types
2017-09-27 14:50:12,013 [MainThread  ] [INFO ]  PROGRESS: at sentence #5700000, processed 113988168 words, keeping 846574 word types
2017-09-27 14:50:13,488 [MainThread  ] [INFO ]  PROGRESS: at sentence #5710000, processed 114182114 words, keeping 847306 word types
2017-09-27 14:50:14,880 [MainThread  ] [INFO ]  PROGRESS: at sentence #5720000, processed 114368524 words, keeping 848784 word types
2017-09-27 14:50:16,367 [MainThread  ] [INFO ]  PROGRESS: at sentence #5730000, processed 114568484 words, keeping 850300 word types
2017-09-27 14:50:17,734 [MainThread  ] [INFO ]  PROGRESS: at sentence #5740000, processed 114751590 words, keeping 851480 word types
2017-09-27 14:50:19,321 [MainThread  ] [INFO ]  PROGRESS: at sentence

2017-09-27 14:51:57,195 [MainThread  ] [INFO ]  PROGRESS: at sentence #6250000, processed 124655263 words, keeping 911877 word types
2017-09-27 14:51:58,721 [MainThread  ] [INFO ]  PROGRESS: at sentence #6260000, processed 124856713 words, keeping 912402 word types
2017-09-27 14:52:00,298 [MainThread  ] [INFO ]  PROGRESS: at sentence #6270000, processed 125064198 words, keeping 912982 word types
2017-09-27 14:52:01,937 [MainThread  ] [INFO ]  PROGRESS: at sentence #6280000, processed 125268757 words, keeping 913823 word types
2017-09-27 14:52:03,289 [MainThread  ] [INFO ]  PROGRESS: at sentence #6290000, processed 125451612 words, keeping 914519 word types
2017-09-27 14:52:04,706 [MainThread  ] [INFO ]  PROGRESS: at sentence #6300000, processed 125637431 words, keeping 915227 word types
2017-09-27 14:52:06,109 [MainThread  ] [INFO ]  PROGRESS: at sentence #6310000, processed 125827623 words, keeping 915880 word types
2017-09-27 14:52:07,187 [MainThread  ] [INFO ]  99: ../data/documents

2017-09-27 14:53:41,778 [MainThread  ] [INFO ]  107: ../data/documents/860.json.gz
2017-09-27 14:53:47,356 [MainThread  ] [INFO ]  PROGRESS: at sentence #6820000, processed 135921290 words, keeping 951214 word types
2017-09-27 14:53:48,887 [MainThread  ] [INFO ]  PROGRESS: at sentence #6830000, processed 136115049 words, keeping 951646 word types
2017-09-27 14:53:50,376 [MainThread  ] [INFO ]  PROGRESS: at sentence #6840000, processed 136305804 words, keeping 952115 word types
2017-09-27 14:53:51,905 [MainThread  ] [INFO ]  PROGRESS: at sentence #6850000, processed 136504268 words, keeping 952694 word types
2017-09-27 14:53:53,366 [MainThread  ] [INFO ]  PROGRESS: at sentence #6860000, processed 136697489 words, keeping 953286 word types
2017-09-27 14:53:54,774 [MainThread  ] [INFO ]  PROGRESS: at sentence #6870000, processed 136885776 words, keeping 953920 word types
2017-09-27 14:53:56,236 [MainThread  ] [INFO ]  PROGRESS: at sentence #6880000, processed 137077598 words, keeping 9544

2017-09-27 14:55:35,757 [MainThread  ] [INFO ]  PROGRESS: at sentence #7360000, processed 146839350 words, keeping 1017439 word types
2017-09-27 14:55:37,032 [MainThread  ] [INFO ]  PROGRESS: at sentence #7370000, processed 147005215 words, keeping 1018628 word types
2017-09-27 14:55:38,408 [MainThread  ] [INFO ]  PROGRESS: at sentence #7380000, processed 147188390 words, keeping 1019490 word types
2017-09-27 14:55:39,725 [MainThread  ] [INFO ]  PROGRESS: at sentence #7390000, processed 147359570 words, keeping 1020301 word types
2017-09-27 14:55:41,011 [MainThread  ] [INFO ]  PROGRESS: at sentence #7400000, processed 147530753 words, keeping 1021025 word types
2017-09-27 14:55:42,314 [MainThread  ] [INFO ]  PROGRESS: at sentence #7410000, processed 147702828 words, keeping 1021881 word types
2017-09-27 14:55:43,422 [MainThread  ] [INFO ]  PROGRESS: at sentence #7420000, processed 147847450 words, keeping 1023160 word types
2017-09-27 14:55:44,667 [MainThread  ] [INFO ]  PROGRESS: at s

2017-09-27 14:57:19,615 [MainThread  ] [INFO ]  PROGRESS: at sentence #7930000, processed 157481244 words, keeping 1055346 word types
2017-09-27 14:57:20,911 [MainThread  ] [INFO ]  128: ../data/documents/449.json.gz
2017-09-27 14:57:21,741 [MainThread  ] [INFO ]  PROGRESS: at sentence #7940000, processed 157700946 words, keeping 1056145 word types
2017-09-27 14:57:23,629 [MainThread  ] [INFO ]  129: ../data/documents/358.json.gz
2017-09-27 14:57:24,216 [MainThread  ] [INFO ]  PROGRESS: at sentence #7950000, processed 158002936 words, keeping 1057309 word types
2017-09-27 14:57:25,714 [MainThread  ] [INFO ]  130: ../data/documents/930.json.gz
2017-09-27 14:57:31,300 [MainThread  ] [INFO ]  PROGRESS: at sentence #7960000, processed 158260340 words, keeping 1058327 word types
2017-09-27 14:57:32,862 [MainThread  ] [INFO ]  PROGRESS: at sentence #7970000, processed 158461158 words, keeping 1059342 word types
2017-09-27 14:57:34,552 [MainThread  ] [INFO ]  PROGRESS: at sentence #7980000, p

2017-09-27 14:59:10,390 [MainThread  ] [INFO ]  PROGRESS: at sentence #8470000, processed 168733923 words, keeping 1091374 word types
2017-09-27 14:59:11,725 [MainThread  ] [INFO ]  PROGRESS: at sentence #8480000, processed 168909877 words, keeping 1092177 word types
2017-09-27 14:59:13,060 [MainThread  ] [INFO ]  PROGRESS: at sentence #8490000, processed 169076464 words, keeping 1092862 word types
2017-09-27 14:59:14,379 [MainThread  ] [INFO ]  PROGRESS: at sentence #8500000, processed 169249354 words, keeping 1093570 word types
2017-09-27 14:59:15,703 [MainThread  ] [INFO ]  PROGRESS: at sentence #8510000, processed 169425874 words, keeping 1094212 word types
2017-09-27 14:59:16,144 [MainThread  ] [INFO ]  140: ../data/documents/730.json.gz
2017-09-27 14:59:21,693 [MainThread  ] [INFO ]  PROGRESS: at sentence #8520000, processed 169597928 words, keeping 1095028 word types
2017-09-27 14:59:23,211 [MainThread  ] [INFO ]  PROGRESS: at sentence #8530000, processed 169805317 words, keepin

2017-09-27 15:00:59,442 [MainThread  ] [INFO ]  PROGRESS: at sentence #9040000, processed 179878753 words, keeping 1155632 word types
2017-09-27 15:01:00,943 [MainThread  ] [INFO ]  147: ../data/documents/490.json.gz
2017-09-27 15:01:02,017 [MainThread  ] [INFO ]  PROGRESS: at sentence #9050000, processed 180171542 words, keeping 1156526 word types
2017-09-27 15:01:03,905 [MainThread  ] [INFO ]  148: ../data/documents/882.json.gz
2017-09-27 15:01:14,046 [MainThread  ] [INFO ]  PROGRESS: at sentence #9060000, processed 180449503 words, keeping 1157391 word types
2017-09-27 15:01:15,454 [MainThread  ] [INFO ]  PROGRESS: at sentence #9070000, processed 180641102 words, keeping 1157759 word types
2017-09-27 15:01:17,123 [MainThread  ] [INFO ]  PROGRESS: at sentence #9080000, processed 180872648 words, keeping 1159775 word types
2017-09-27 15:01:18,521 [MainThread  ] [INFO ]  PROGRESS: at sentence #9090000, processed 181056803 words, keeping 1160832 word types
2017-09-27 15:01:19,953 [MainT

2017-09-27 15:02:55,199 [MainThread  ] [INFO ]  PROGRESS: at sentence #9620000, processed 191530766 words, keeping 1194365 word types
2017-09-27 15:02:56,639 [MainThread  ] [INFO ]  PROGRESS: at sentence #9630000, processed 191725494 words, keeping 1195033 word types
2017-09-27 15:02:58,097 [MainThread  ] [INFO ]  PROGRESS: at sentence #9640000, processed 191917170 words, keeping 1195536 word types
2017-09-27 15:02:58,891 [MainThread  ] [INFO ]  153: ../data/documents/734.json.gz
2017-09-27 15:03:06,817 [MainThread  ] [INFO ]  PROGRESS: at sentence #9650000, processed 192110905 words, keeping 1196114 word types
2017-09-27 15:03:08,135 [MainThread  ] [INFO ]  PROGRESS: at sentence #9660000, processed 192289702 words, keeping 1196833 word types
2017-09-27 15:03:09,625 [MainThread  ] [INFO ]  PROGRESS: at sentence #9670000, processed 192480485 words, keeping 1197472 word types
2017-09-27 15:03:11,174 [MainThread  ] [INFO ]  PROGRESS: at sentence #9680000, processed 192681508 words, keepin

2017-09-27 15:04:50,536 [MainThread  ] [INFO ]  PROGRESS: at sentence #10190000, processed 202688174 words, keeping 1232326 word types
2017-09-27 15:04:51,990 [MainThread  ] [INFO ]  PROGRESS: at sentence #10200000, processed 202878842 words, keeping 1232799 word types
2017-09-27 15:04:53,291 [MainThread  ] [INFO ]  PROGRESS: at sentence #10210000, processed 203045683 words, keeping 1233397 word types
2017-09-27 15:04:54,827 [MainThread  ] [INFO ]  PROGRESS: at sentence #10220000, processed 203250491 words, keeping 1233889 word types
2017-09-27 15:04:56,211 [MainThread  ] [INFO ]  PROGRESS: at sentence #10230000, processed 203435505 words, keeping 1234275 word types
2017-09-27 15:04:57,587 [MainThread  ] [INFO ]  PROGRESS: at sentence #10240000, processed 203619060 words, keeping 1234762 word types
2017-09-27 15:04:59,016 [MainThread  ] [INFO ]  PROGRESS: at sentence #10250000, processed 203811582 words, keeping 1235634 word types
2017-09-27 15:05:00,471 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:06:37,720 [MainThread  ] [INFO ]  PROGRESS: at sentence #10780000, processed 213837024 words, keeping 1266867 word types
2017-09-27 15:06:39,124 [MainThread  ] [INFO ]  PROGRESS: at sentence #10790000, processed 214024388 words, keeping 1267285 word types
2017-09-27 15:06:40,550 [MainThread  ] [INFO ]  PROGRESS: at sentence #10800000, processed 214213690 words, keeping 1267837 word types
2017-09-27 15:06:41,972 [MainThread  ] [INFO ]  PROGRESS: at sentence #10810000, processed 214402850 words, keeping 1268137 word types
2017-09-27 15:06:43,264 [MainThread  ] [INFO ]  PROGRESS: at sentence #10820000, processed 214572667 words, keeping 1268771 word types
2017-09-27 15:06:44,643 [MainThread  ] [INFO ]  PROGRESS: at sentence #10830000, processed 214753483 words, keeping 1269281 word types
2017-09-27 15:06:45,978 [MainThread  ] [INFO ]  PROGRESS: at sentence #10840000, processed 214935358 words, keeping 1269596 word types
2017-09-27 15:06:47,392 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:08:21,237 [MainThread  ] [INFO ]  PROGRESS: at sentence #11320000, processed 224573964 words, keeping 1299948 word types
2017-09-27 15:08:22,825 [MainThread  ] [INFO ]  PROGRESS: at sentence #11330000, processed 224793772 words, keeping 1300349 word types
2017-09-27 15:08:24,282 [MainThread  ] [INFO ]  PROGRESS: at sentence #11340000, processed 224991487 words, keeping 1300853 word types
2017-09-27 15:08:24,671 [MainThread  ] [INFO ]  174: ../data/documents/488.json.gz
2017-09-27 15:08:26,814 [MainThread  ] [INFO ]  PROGRESS: at sentence #11350000, processed 225273201 words, keeping 1301755 word types
2017-09-27 15:08:27,604 [MainThread  ] [INFO ]  175: ../data/documents/85.json.gz
2017-09-27 15:08:32,560 [MainThread  ] [INFO ]  PROGRESS: at sentence #11360000, processed 225483083 words, keeping 1302431 word types
2017-09-27 15:08:33,898 [MainThread  ] [INFO ]  PROGRESS: at sentence #11370000, processed 225660030 words, keeping 1303490 word types
2017-09-27 15:08:35,274 [

2017-09-27 15:10:14,783 [MainThread  ] [INFO ]  PROGRESS: at sentence #11870000, processed 235255025 words, keeping 1330094 word types
2017-09-27 15:10:16,256 [MainThread  ] [INFO ]  PROGRESS: at sentence #11880000, processed 235454389 words, keeping 1330454 word types
2017-09-27 15:10:17,640 [MainThread  ] [INFO ]  PROGRESS: at sentence #11890000, processed 235643530 words, keeping 1330904 word types
2017-09-27 15:10:19,012 [MainThread  ] [INFO ]  PROGRESS: at sentence #11900000, processed 235832543 words, keeping 1331378 word types
2017-09-27 15:10:20,530 [MainThread  ] [INFO ]  PROGRESS: at sentence #11910000, processed 236039322 words, keeping 1331824 word types
2017-09-27 15:10:22,035 [MainThread  ] [INFO ]  PROGRESS: at sentence #11920000, processed 236242005 words, keeping 1332393 word types
2017-09-27 15:10:23,499 [MainThread  ] [INFO ]  PROGRESS: at sentence #11930000, processed 236437797 words, keeping 1332879 word types
2017-09-27 15:10:24,899 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:11:53,717 [MainThread  ] [INFO ]  192: ../data/documents/905.json.gz
2017-09-27 15:11:57,446 [MainThread  ] [INFO ]  PROGRESS: at sentence #12430000, processed 246257955 words, keeping 1363560 word types
2017-09-27 15:11:59,262 [MainThread  ] [INFO ]  PROGRESS: at sentence #12440000, processed 246512153 words, keeping 1364110 word types
2017-09-27 15:12:00,254 [MainThread  ] [INFO ]  193: ../data/documents/979.json.gz
2017-09-27 15:12:06,350 [MainThread  ] [INFO ]  PROGRESS: at sentence #12450000, processed 246737442 words, keeping 1364456 word types
2017-09-27 15:12:07,831 [MainThread  ] [INFO ]  PROGRESS: at sentence #12460000, processed 246933207 words, keeping 1364908 word types
2017-09-27 15:12:09,177 [MainThread  ] [INFO ]  PROGRESS: at sentence #12470000, processed 247110236 words, keeping 1365333 word types
2017-09-27 15:12:10,539 [MainThread  ] [INFO ]  PROGRESS: at sentence #12480000, processed 247295080 words, keeping 1365815 word types
2017-09-27 15:12:12,032 

2017-09-27 15:13:45,299 [MainThread  ] [INFO ]  PROGRESS: at sentence #12980000, processed 257155291 words, keeping 1413151 word types
2017-09-27 15:13:46,958 [MainThread  ] [INFO ]  PROGRESS: at sentence #12990000, processed 257380993 words, keeping 1413488 word types
2017-09-27 15:13:48,561 [MainThread  ] [INFO ]  PROGRESS: at sentence #13000000, processed 257595786 words, keeping 1413871 word types
2017-09-27 15:13:50,109 [MainThread  ] [INFO ]  PROGRESS: at sentence #13010000, processed 257805168 words, keeping 1414262 word types
2017-09-27 15:13:51,711 [MainThread  ] [INFO ]  PROGRESS: at sentence #13020000, processed 258021639 words, keeping 1414554 word types
2017-09-27 15:13:53,222 [MainThread  ] [INFO ]  PROGRESS: at sentence #13030000, processed 258227526 words, keeping 1414859 word types
2017-09-27 15:13:53,261 [MainThread  ] [INFO ]  202: ../data/documents/649.json.gz
2017-09-27 15:13:59,328 [MainThread  ] [INFO ]  PROGRESS: at sentence #13040000, processed 258427079 words,

2017-09-27 15:15:34,514 [MainThread  ] [INFO ]  PROGRESS: at sentence #13540000, processed 268337046 words, keeping 1446076 word types
2017-09-27 15:15:35,912 [MainThread  ] [INFO ]  210: ../data/documents/948.json.gz
2017-09-27 15:15:39,971 [MainThread  ] [INFO ]  PROGRESS: at sentence #13550000, processed 268527185 words, keeping 1446590 word types
2017-09-27 15:15:41,389 [MainThread  ] [INFO ]  PROGRESS: at sentence #13560000, processed 268716894 words, keeping 1446977 word types
2017-09-27 15:15:42,866 [MainThread  ] [INFO ]  PROGRESS: at sentence #13570000, processed 268914397 words, keeping 1447289 word types
2017-09-27 15:15:44,303 [MainThread  ] [INFO ]  PROGRESS: at sentence #13580000, processed 269107705 words, keeping 1447715 word types
2017-09-27 15:15:45,692 [MainThread  ] [INFO ]  PROGRESS: at sentence #13590000, processed 269293269 words, keeping 1448053 word types
2017-09-27 15:15:47,159 [MainThread  ] [INFO ]  PROGRESS: at sentence #13600000, processed 269484433 words,

2017-09-27 15:17:26,068 [MainThread  ] [INFO ]  PROGRESS: at sentence #14090000, processed 279176915 words, keeping 1472093 word types
2017-09-27 15:17:27,514 [MainThread  ] [INFO ]  PROGRESS: at sentence #14100000, processed 279367765 words, keeping 1472687 word types
2017-09-27 15:17:28,974 [MainThread  ] [INFO ]  PROGRESS: at sentence #14110000, processed 279559478 words, keeping 1473023 word types
2017-09-27 15:17:30,405 [MainThread  ] [INFO ]  PROGRESS: at sentence #14120000, processed 279739950 words, keeping 1473594 word types
2017-09-27 15:17:31,807 [MainThread  ] [INFO ]  PROGRESS: at sentence #14130000, processed 279926871 words, keeping 1474127 word types
2017-09-27 15:17:33,275 [MainThread  ] [INFO ]  PROGRESS: at sentence #14140000, processed 280125704 words, keeping 1474380 word types
2017-09-27 15:17:34,694 [MainThread  ] [INFO ]  PROGRESS: at sentence #14150000, processed 280318233 words, keeping 1474741 word types
2017-09-27 15:17:36,221 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:19:15,304 [MainThread  ] [INFO ]  226: ../data/documents/631.json.gz
2017-09-27 15:19:16,250 [MainThread  ] [INFO ]  PROGRESS: at sentence #14670000, processed 290471778 words, keeping 1547499 word types
2017-09-27 15:19:18,154 [MainThread  ] [INFO ]  PROGRESS: at sentence #14680000, processed 290733237 words, keeping 1548263 word types
2017-09-27 15:19:19,411 [MainThread  ] [INFO ]  227: ../data/documents/155.json.gz
2017-09-27 15:19:22,014 [MainThread  ] [INFO ]  PROGRESS: at sentence #14690000, processed 290974111 words, keeping 1548692 word types
2017-09-27 15:19:23,501 [MainThread  ] [INFO ]  PROGRESS: at sentence #14700000, processed 291155547 words, keeping 1549221 word types
2017-09-27 15:19:24,910 [MainThread  ] [INFO ]  PROGRESS: at sentence #14710000, processed 291337940 words, keeping 1549683 word types
2017-09-27 15:19:26,348 [MainThread  ] [INFO ]  PROGRESS: at sentence #14720000, processed 291519973 words, keeping 1550124 word types
2017-09-27 15:19:27,707 

2017-09-27 15:21:05,034 [MainThread  ] [INFO ]  PROGRESS: at sentence #15240000, processed 301453048 words, keeping 1572754 word types
2017-09-27 15:21:06,536 [MainThread  ] [INFO ]  PROGRESS: at sentence #15250000, processed 301655737 words, keeping 1573024 word types
2017-09-27 15:21:08,095 [MainThread  ] [INFO ]  PROGRESS: at sentence #15260000, processed 301860121 words, keeping 1573294 word types
2017-09-27 15:21:09,568 [MainThread  ] [INFO ]  PROGRESS: at sentence #15270000, processed 302055211 words, keeping 1573540 word types
2017-09-27 15:21:11,062 [MainThread  ] [INFO ]  PROGRESS: at sentence #15280000, processed 302250357 words, keeping 1573797 word types
2017-09-27 15:21:12,318 [MainThread  ] [INFO ]  232: ../data/documents/323.json.gz
2017-09-27 15:21:17,675 [MainThread  ] [INFO ]  PROGRESS: at sentence #15290000, processed 302446504 words, keeping 1574169 word types
2017-09-27 15:21:19,128 [MainThread  ] [INFO ]  PROGRESS: at sentence #15300000, processed 302629451 words,

2017-09-27 15:22:55,401 [MainThread  ] [INFO ]  PROGRESS: at sentence #15820000, processed 312501800 words, keeping 1599523 word types
2017-09-27 15:22:57,078 [MainThread  ] [INFO ]  PROGRESS: at sentence #15830000, processed 312721736 words, keeping 1600204 word types
2017-09-27 15:22:58,718 [MainThread  ] [INFO ]  PROGRESS: at sentence #15840000, processed 312936581 words, keeping 1602308 word types
2017-09-27 15:23:00,283 [MainThread  ] [INFO ]  PROGRESS: at sentence #15850000, processed 313141688 words, keeping 1603743 word types
2017-09-27 15:23:00,562 [MainThread  ] [INFO ]  237: ../data/documents/355.json.gz
2017-09-27 15:23:02,606 [MainThread  ] [INFO ]  238: ../data/documents/106.json.gz
2017-09-27 15:23:04,447 [MainThread  ] [INFO ]  PROGRESS: at sentence #15860000, processed 313424240 words, keeping 1604347 word types
2017-09-27 15:23:05,850 [MainThread  ] [INFO ]  PROGRESS: at sentence #15870000, processed 313605718 words, keeping 1604859 word types
2017-09-27 15:23:07,295 

2017-09-27 15:24:43,017 [MainThread  ] [INFO ]  PROGRESS: at sentence #16380000, processed 323460545 words, keeping 1629847 word types
2017-09-27 15:24:44,467 [MainThread  ] [INFO ]  PROGRESS: at sentence #16390000, processed 323645280 words, keeping 1630523 word types
2017-09-27 15:24:46,012 [MainThread  ] [INFO ]  PROGRESS: at sentence #16400000, processed 323841470 words, keeping 1630932 word types
2017-09-27 15:24:47,100 [MainThread  ] [INFO ]  245: ../data/documents/941.json.gz
2017-09-27 15:24:58,185 [MainThread  ] [INFO ]  PROGRESS: at sentence #16410000, processed 324015336 words, keeping 1631606 word types
2017-09-27 15:24:59,696 [MainThread  ] [INFO ]  PROGRESS: at sentence #16420000, processed 324219681 words, keeping 1631859 word types
2017-09-27 15:25:01,281 [MainThread  ] [INFO ]  PROGRESS: at sentence #16430000, processed 324421859 words, keeping 1632484 word types
2017-09-27 15:25:02,793 [MainThread  ] [INFO ]  PROGRESS: at sentence #16440000, processed 324621043 words,

2017-09-27 15:26:35,321 [MainThread  ] [INFO ]  PROGRESS: at sentence #16960000, processed 334450881 words, keeping 1688364 word types
2017-09-27 15:26:36,812 [MainThread  ] [INFO ]  PROGRESS: at sentence #16970000, processed 334647393 words, keeping 1688875 word types
2017-09-27 15:26:38,130 [MainThread  ] [INFO ]  PROGRESS: at sentence #16980000, processed 334822769 words, keeping 1689566 word types
2017-09-27 15:26:39,638 [MainThread  ] [INFO ]  PROGRESS: at sentence #16990000, processed 335015709 words, keeping 1689917 word types
2017-09-27 15:26:41,071 [MainThread  ] [INFO ]  PROGRESS: at sentence #17000000, processed 335206629 words, keeping 1690666 word types
2017-09-27 15:26:41,480 [MainThread  ] [INFO ]  251: ../data/documents/68.json.gz
2017-09-27 15:26:43,116 [MainThread  ] [INFO ]  PROGRESS: at sentence #17010000, processed 335391712 words, keeping 1691092 word types
2017-09-27 15:26:44,482 [MainThread  ] [INFO ]  PROGRESS: at sentence #17020000, processed 335569294 words, 

2017-09-27 15:28:28,291 [MainThread  ] [INFO ]  PROGRESS: at sentence #17530000, processed 345760333 words, keeping 1731980 word types
2017-09-27 15:28:29,666 [MainThread  ] [INFO ]  PROGRESS: at sentence #17540000, processed 345918719 words, keeping 1732391 word types
2017-09-27 15:28:31,091 [MainThread  ] [INFO ]  PROGRESS: at sentence #17550000, processed 346105153 words, keeping 1733156 word types
2017-09-27 15:28:32,518 [MainThread  ] [INFO ]  PROGRESS: at sentence #17560000, processed 346285591 words, keeping 1733866 word types
2017-09-27 15:28:33,919 [MainThread  ] [INFO ]  PROGRESS: at sentence #17570000, processed 346470084 words, keeping 1734420 word types
2017-09-27 15:28:35,325 [MainThread  ] [INFO ]  PROGRESS: at sentence #17580000, processed 346640493 words, keeping 1735020 word types
2017-09-27 15:28:36,774 [MainThread  ] [INFO ]  PROGRESS: at sentence #17590000, processed 346819662 words, keeping 1735523 word types
2017-09-27 15:28:38,189 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:30:12,201 [MainThread  ] [INFO ]  266: ../data/documents/102.json.gz
2017-09-27 15:30:14,705 [MainThread  ] [INFO ]  PROGRESS: at sentence #18090000, processed 356287820 words, keeping 1760507 word types
2017-09-27 15:30:16,099 [MainThread  ] [INFO ]  PROGRESS: at sentence #18100000, processed 356470857 words, keeping 1760929 word types
2017-09-27 15:30:17,471 [MainThread  ] [INFO ]  PROGRESS: at sentence #18110000, processed 356650077 words, keeping 1761516 word types
2017-09-27 15:30:18,875 [MainThread  ] [INFO ]  PROGRESS: at sentence #18120000, processed 356829301 words, keeping 1761949 word types
2017-09-27 15:30:20,357 [MainThread  ] [INFO ]  PROGRESS: at sentence #18130000, processed 357024826 words, keeping 1762277 word types
2017-09-27 15:30:21,775 [MainThread  ] [INFO ]  PROGRESS: at sentence #18140000, processed 357204110 words, keeping 1762661 word types
2017-09-27 15:30:23,277 [MainThread  ] [INFO ]  PROGRESS: at sentence #18150000, processed 357396218 words,

2017-09-27 15:32:08,519 [MainThread  ] [INFO ]  PROGRESS: at sentence #18670000, processed 367514496 words, keeping 1798529 word types
2017-09-27 15:32:10,002 [MainThread  ] [INFO ]  PROGRESS: at sentence #18680000, processed 367707425 words, keeping 1798894 word types
2017-09-27 15:32:11,484 [MainThread  ] [INFO ]  PROGRESS: at sentence #18690000, processed 367896948 words, keeping 1799254 word types
2017-09-27 15:32:12,871 [MainThread  ] [INFO ]  PROGRESS: at sentence #18700000, processed 368069215 words, keeping 1799719 word types
2017-09-27 15:32:14,399 [MainThread  ] [INFO ]  PROGRESS: at sentence #18710000, processed 368258466 words, keeping 1800219 word types
2017-09-27 15:32:15,813 [MainThread  ] [INFO ]  PROGRESS: at sentence #18720000, processed 368442837 words, keeping 1800604 word types
2017-09-27 15:32:17,291 [MainThread  ] [INFO ]  PROGRESS: at sentence #18730000, processed 368640012 words, keeping 1801070 word types
2017-09-27 15:32:18,776 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:33:55,640 [MainThread  ] [INFO ]  PROGRESS: at sentence #19250000, processed 378648088 words, keeping 1824045 word types
2017-09-27 15:33:57,186 [MainThread  ] [INFO ]  PROGRESS: at sentence #19260000, processed 378857834 words, keeping 1824584 word types
2017-09-27 15:33:58,591 [MainThread  ] [INFO ]  PROGRESS: at sentence #19270000, processed 379042266 words, keeping 1825657 word types
2017-09-27 15:34:00,178 [MainThread  ] [INFO ]  PROGRESS: at sentence #19280000, processed 379246064 words, keeping 1825967 word types
2017-09-27 15:34:01,307 [MainThread  ] [INFO ]  277: ../data/documents/489.json.gz
2017-09-27 15:34:02,463 [MainThread  ] [INFO ]  PROGRESS: at sentence #19290000, processed 379454678 words, keeping 1826344 word types
2017-09-27 15:34:04,486 [MainThread  ] [INFO ]  PROGRESS: at sentence #19300000, processed 379729907 words, keeping 1827143 word types
2017-09-27 15:34:05,097 [MainThread  ] [INFO ]  278: ../data/documents/95.json.gz
2017-09-27 15:34:08,754 [

2017-09-27 15:36:19,077 [MainThread  ] [INFO ]  PROGRESS: at sentence #19800000, processed 393118095 words, keeping 1854545 word types
2017-09-27 15:36:20,563 [MainThread  ] [INFO ]  PROGRESS: at sentence #19810000, processed 393309685 words, keeping 1854848 word types
2017-09-27 15:36:22,012 [MainThread  ] [INFO ]  PROGRESS: at sentence #19820000, processed 393490437 words, keeping 1855097 word types
2017-09-27 15:36:23,427 [MainThread  ] [INFO ]  PROGRESS: at sentence #19830000, processed 393675319 words, keeping 1855395 word types
2017-09-27 15:36:24,837 [MainThread  ] [INFO ]  PROGRESS: at sentence #19840000, processed 393860416 words, keeping 1855749 word types
2017-09-27 15:36:26,276 [MainThread  ] [INFO ]  PROGRESS: at sentence #19850000, processed 394050013 words, keeping 1855999 word types
2017-09-27 15:36:27,750 [MainThread  ] [INFO ]  PROGRESS: at sentence #19860000, processed 394244382 words, keeping 1856286 word types
2017-09-27 15:36:29,218 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:38:06,444 [MainThread  ] [INFO ]  295: ../data/documents/747.json.gz
2017-09-27 15:38:17,067 [MainThread  ] [INFO ]  PROGRESS: at sentence #20360000, processed 404230197 words, keeping 1878775 word types
2017-09-27 15:38:18,525 [MainThread  ] [INFO ]  PROGRESS: at sentence #20370000, processed 404425663 words, keeping 1879245 word types
2017-09-27 15:38:19,939 [MainThread  ] [INFO ]  PROGRESS: at sentence #20380000, processed 404612821 words, keeping 1879618 word types
2017-09-27 15:38:21,487 [MainThread  ] [INFO ]  PROGRESS: at sentence #20390000, processed 404820088 words, keeping 1879947 word types
2017-09-27 15:38:23,045 [MainThread  ] [INFO ]  PROGRESS: at sentence #20400000, processed 405022488 words, keeping 1880263 word types
2017-09-27 15:38:24,489 [MainThread  ] [INFO ]  PROGRESS: at sentence #20410000, processed 405216276 words, keeping 1880741 word types
2017-09-27 15:38:26,040 [MainThread  ] [INFO ]  PROGRESS: at sentence #20420000, processed 405424929 words,

2017-09-27 15:40:05,594 [MainThread  ] [INFO ]  PROGRESS: at sentence #20930000, processed 415351618 words, keeping 1899789 word types
2017-09-27 15:40:07,136 [MainThread  ] [INFO ]  PROGRESS: at sentence #20940000, processed 415540244 words, keeping 1900172 word types
2017-09-27 15:40:08,661 [MainThread  ] [INFO ]  PROGRESS: at sentence #20950000, processed 415736757 words, keeping 1900676 word types
2017-09-27 15:40:10,069 [MainThread  ] [INFO ]  PROGRESS: at sentence #20960000, processed 415920831 words, keeping 1901044 word types
2017-09-27 15:40:11,551 [MainThread  ] [INFO ]  PROGRESS: at sentence #20970000, processed 416118847 words, keeping 1901417 word types
2017-09-27 15:40:13,078 [MainThread  ] [INFO ]  PROGRESS: at sentence #20980000, processed 416316644 words, keeping 1901845 word types
2017-09-27 15:40:14,609 [MainThread  ] [INFO ]  PROGRESS: at sentence #20990000, processed 416522214 words, keeping 1902645 word types
2017-09-27 15:40:16,055 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:41:56,053 [MainThread  ] [INFO ]  PROGRESS: at sentence #21500000, processed 426517726 words, keeping 1929911 word types
2017-09-27 15:41:57,535 [MainThread  ] [INFO ]  PROGRESS: at sentence #21510000, processed 426716147 words, keeping 1930280 word types
2017-09-27 15:41:58,987 [MainThread  ] [INFO ]  PROGRESS: at sentence #21520000, processed 426908555 words, keeping 1930799 word types
2017-09-27 15:42:00,534 [MainThread  ] [INFO ]  PROGRESS: at sentence #21530000, processed 427111196 words, keeping 1930998 word types
2017-09-27 15:42:02,037 [MainThread  ] [INFO ]  PROGRESS: at sentence #21540000, processed 427315782 words, keeping 1931255 word types
2017-09-27 15:42:03,518 [MainThread  ] [INFO ]  PROGRESS: at sentence #21550000, processed 427512183 words, keeping 1931526 word types
2017-09-27 15:42:04,940 [MainThread  ] [INFO ]  PROGRESS: at sentence #21560000, processed 427702358 words, keeping 1931824 word types
2017-09-27 15:42:06,415 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:43:41,407 [MainThread  ] [INFO ]  PROGRESS: at sentence #22060000, processed 437639727 words, keeping 2009506 word types
2017-09-27 15:43:42,924 [MainThread  ] [INFO ]  PROGRESS: at sentence #22070000, processed 437833937 words, keeping 2009794 word types
2017-09-27 15:43:44,360 [MainThread  ] [INFO ]  PROGRESS: at sentence #22080000, processed 438021857 words, keeping 2010168 word types
2017-09-27 15:43:44,630 [MainThread  ] [INFO ]  318: ../data/documents/711.json.gz
2017-09-27 15:43:46,991 [MainThread  ] [INFO ]  PROGRESS: at sentence #22090000, processed 438281594 words, keeping 2010539 word types
2017-09-27 15:43:48,434 [MainThread  ] [INFO ]  319: ../data/documents/629.json.gz
2017-09-27 15:43:49,695 [MainThread  ] [INFO ]  PROGRESS: at sentence #22100000, processed 438560954 words, keeping 2011018 word types
2017-09-27 15:43:51,611 [MainThread  ] [INFO ]  PROGRESS: at sentence #22110000, processed 438814205 words, keeping 2011501 word types
2017-09-27 15:43:52,575 

2017-09-27 15:45:36,502 [MainThread  ] [INFO ]  PROGRESS: at sentence #22620000, processed 448945325 words, keeping 2032841 word types
2017-09-27 15:45:38,066 [MainThread  ] [INFO ]  PROGRESS: at sentence #22630000, processed 449150428 words, keeping 2033129 word types
2017-09-27 15:45:39,566 [MainThread  ] [INFO ]  PROGRESS: at sentence #22640000, processed 449339392 words, keeping 2033315 word types
2017-09-27 15:45:41,050 [MainThread  ] [INFO ]  PROGRESS: at sentence #22650000, processed 449533123 words, keeping 2033684 word types
2017-09-27 15:45:42,560 [MainThread  ] [INFO ]  PROGRESS: at sentence #22660000, processed 449729764 words, keeping 2033943 word types
2017-09-27 15:45:43,972 [MainThread  ] [INFO ]  PROGRESS: at sentence #22670000, processed 449919357 words, keeping 2034214 word types
2017-09-27 15:45:44,912 [MainThread  ] [INFO ]  326: ../data/documents/619.json.gz
2017-09-27 15:45:47,389 [MainThread  ] [INFO ]  PROGRESS: at sentence #22680000, processed 450122575 words,

2017-09-27 15:47:24,823 [MainThread  ] [INFO ]  PROGRESS: at sentence #23160000, processed 459867630 words, keeping 2088377 word types
2017-09-27 15:47:26,130 [MainThread  ] [INFO ]  PROGRESS: at sentence #23170000, processed 460034761 words, keeping 2088733 word types
2017-09-27 15:47:27,507 [MainThread  ] [INFO ]  PROGRESS: at sentence #23180000, processed 460213086 words, keeping 2089044 word types
2017-09-27 15:47:28,921 [MainThread  ] [INFO ]  PROGRESS: at sentence #23190000, processed 460392564 words, keeping 2089297 word types
2017-09-27 15:47:30,318 [MainThread  ] [INFO ]  PROGRESS: at sentence #23200000, processed 460574001 words, keeping 2089560 word types
2017-09-27 15:47:31,685 [MainThread  ] [INFO ]  PROGRESS: at sentence #23210000, processed 460750940 words, keeping 2089899 word types
2017-09-27 15:47:33,093 [MainThread  ] [INFO ]  PROGRESS: at sentence #23220000, processed 460932774 words, keeping 2090178 word types
2017-09-27 15:47:33,536 [MainThread  ] [INFO ]  338: ..

2017-09-27 15:49:16,432 [MainThread  ] [INFO ]  PROGRESS: at sentence #23740000, processed 471106408 words, keeping 2114003 word types
2017-09-27 15:49:17,914 [MainThread  ] [INFO ]  PROGRESS: at sentence #23750000, processed 471285163 words, keeping 2114887 word types
2017-09-27 15:49:19,356 [MainThread  ] [INFO ]  PROGRESS: at sentence #23760000, processed 471477006 words, keeping 2115365 word types
2017-09-27 15:49:20,936 [MainThread  ] [INFO ]  PROGRESS: at sentence #23770000, processed 471690599 words, keeping 2115942 word types
2017-09-27 15:49:22,448 [MainThread  ] [INFO ]  PROGRESS: at sentence #23780000, processed 471884853 words, keeping 2116395 word types
2017-09-27 15:49:23,879 [MainThread  ] [INFO ]  PROGRESS: at sentence #23790000, processed 472070254 words, keeping 2116930 word types
2017-09-27 15:49:25,232 [MainThread  ] [INFO ]  PROGRESS: at sentence #23800000, processed 472252163 words, keeping 2117528 word types
2017-09-27 15:49:26,703 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:51:03,540 [MainThread  ] [INFO ]  PROGRESS: at sentence #24330000, processed 482117343 words, keeping 2162657 word types
2017-09-27 15:51:04,799 [MainThread  ] [INFO ]  348: ../data/documents/216.json.gz
2017-09-27 15:51:09,746 [MainThread  ] [INFO ]  PROGRESS: at sentence #24340000, processed 482318116 words, keeping 2162949 word types
2017-09-27 15:51:11,162 [MainThread  ] [INFO ]  PROGRESS: at sentence #24350000, processed 482494348 words, keeping 2163377 word types
2017-09-27 15:51:12,436 [MainThread  ] [INFO ]  PROGRESS: at sentence #24360000, processed 482662563 words, keeping 2163846 word types
2017-09-27 15:51:13,757 [MainThread  ] [INFO ]  PROGRESS: at sentence #24370000, processed 482833479 words, keeping 2164354 word types
2017-09-27 15:51:15,068 [MainThread  ] [INFO ]  PROGRESS: at sentence #24380000, processed 483004765 words, keeping 2164834 word types
2017-09-27 15:51:16,384 [MainThread  ] [INFO ]  PROGRESS: at sentence #24390000, processed 483170787 words,

2017-09-27 15:52:52,856 [MainThread  ] [INFO ]  PROGRESS: at sentence #24890000, processed 493096581 words, keeping 2184540 word types
2017-09-27 15:52:53,021 [MainThread  ] [INFO ]  357: ../data/documents/191.json.gz
2017-09-27 15:52:58,866 [MainThread  ] [INFO ]  PROGRESS: at sentence #24900000, processed 493285242 words, keeping 2184898 word types
2017-09-27 15:53:00,262 [MainThread  ] [INFO ]  PROGRESS: at sentence #24910000, processed 493465673 words, keeping 2185192 word types
2017-09-27 15:53:01,650 [MainThread  ] [INFO ]  PROGRESS: at sentence #24920000, processed 493645166 words, keeping 2185548 word types
2017-09-27 15:53:02,950 [MainThread  ] [INFO ]  PROGRESS: at sentence #24930000, processed 493816108 words, keeping 2185996 word types
2017-09-27 15:53:04,235 [MainThread  ] [INFO ]  PROGRESS: at sentence #24940000, processed 493982521 words, keeping 2186285 word types
2017-09-27 15:53:05,657 [MainThread  ] [INFO ]  PROGRESS: at sentence #24950000, processed 494166694 words,

2017-09-27 15:54:44,327 [MainThread  ] [INFO ]  PROGRESS: at sentence #25440000, processed 503735429 words, keeping 2204883 word types
2017-09-27 15:54:46,016 [MainThread  ] [INFO ]  PROGRESS: at sentence #25450000, processed 503939926 words, keeping 2205126 word types
2017-09-27 15:54:47,655 [MainThread  ] [INFO ]  PROGRESS: at sentence #25460000, processed 504145606 words, keeping 2205398 word types
2017-09-27 15:54:49,248 [MainThread  ] [INFO ]  PROGRESS: at sentence #25470000, processed 504354743 words, keeping 2205658 word types
2017-09-27 15:54:50,838 [MainThread  ] [INFO ]  PROGRESS: at sentence #25480000, processed 504551867 words, keeping 2205971 word types
2017-09-27 15:54:52,519 [MainThread  ] [INFO ]  PROGRESS: at sentence #25490000, processed 504767297 words, keeping 2206258 word types
2017-09-27 15:54:54,206 [MainThread  ] [INFO ]  PROGRESS: at sentence #25500000, processed 504976477 words, keeping 2206596 word types
2017-09-27 15:54:55,879 [MainThread  ] [INFO ]  PROGRES

2017-09-27 15:56:45,073 [MainThread  ] [INFO ]  PROGRESS: at sentence #26010000, processed 516027063 words, keeping 2224363 word types
2017-09-27 15:56:47,081 [MainThread  ] [INFO ]  PROGRESS: at sentence #26020000, processed 516294066 words, keeping 2224628 word types
2017-09-27 15:56:48,663 [MainThread  ] [INFO ]  PROGRESS: at sentence #26030000, processed 516499690 words, keeping 2225041 word types
2017-09-27 15:56:50,216 [MainThread  ] [INFO ]  PROGRESS: at sentence #26040000, processed 516701180 words, keeping 2225504 word types
2017-09-27 15:56:51,706 [MainThread  ] [INFO ]  PROGRESS: at sentence #26050000, processed 516899780 words, keeping 2225720 word types
2017-09-27 15:56:53,241 [MainThread  ] [INFO ]  PROGRESS: at sentence #26060000, processed 517094603 words, keeping 2225980 word types
2017-09-27 15:56:54,821 [MainThread  ] [INFO ]  373: ../data/documents/536.json.gz
2017-09-27 15:56:55,925 [MainThread  ] [INFO ]  PROGRESS: at sentence #26070000, processed 517320599 words,

2017-09-27 15:58:44,365 [MainThread  ] [INFO ]  PROGRESS: at sentence #26580000, processed 527331604 words, keeping 2241870 word types
2017-09-27 15:58:45,889 [MainThread  ] [INFO ]  PROGRESS: at sentence #26590000, processed 527530268 words, keeping 2242534 word types
2017-09-27 15:58:47,326 [MainThread  ] [INFO ]  PROGRESS: at sentence #26600000, processed 527709617 words, keeping 2242730 word types
2017-09-27 15:58:48,864 [MainThread  ] [INFO ]  PROGRESS: at sentence #26610000, processed 527912918 words, keeping 2242991 word types
2017-09-27 15:58:50,308 [MainThread  ] [INFO ]  PROGRESS: at sentence #26620000, processed 528097034 words, keeping 2243418 word types
2017-09-27 15:58:51,799 [MainThread  ] [INFO ]  PROGRESS: at sentence #26630000, processed 528286351 words, keeping 2243784 word types
2017-09-27 15:58:53,212 [MainThread  ] [INFO ]  PROGRESS: at sentence #26640000, processed 528469652 words, keeping 2244340 word types
2017-09-27 15:58:54,750 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:00:29,497 [MainThread  ] [INFO ]  PROGRESS: at sentence #27160000, processed 538168849 words, keeping 2263597 word types
2017-09-27 16:00:30,939 [MainThread  ] [INFO ]  PROGRESS: at sentence #27170000, processed 538348389 words, keeping 2263894 word types
2017-09-27 16:00:32,396 [MainThread  ] [INFO ]  PROGRESS: at sentence #27180000, processed 538542861 words, keeping 2264192 word types
2017-09-27 16:00:33,855 [MainThread  ] [INFO ]  PROGRESS: at sentence #27190000, processed 538737321 words, keeping 2264450 word types
2017-09-27 16:00:35,338 [MainThread  ] [INFO ]  PROGRESS: at sentence #27200000, processed 538927491 words, keeping 2264708 word types
2017-09-27 16:00:36,768 [MainThread  ] [INFO ]  PROGRESS: at sentence #27210000, processed 539116167 words, keeping 2265140 word types
2017-09-27 16:00:38,247 [MainThread  ] [INFO ]  PROGRESS: at sentence #27220000, processed 539308697 words, keeping 2265482 word types
2017-09-27 16:00:39,641 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:02:12,857 [MainThread  ] [INFO ]  390: ../data/documents/949.json.gz
2017-09-27 16:02:14,587 [MainThread  ] [INFO ]  PROGRESS: at sentence #27730000, processed 549083838 words, keeping 2297940 word types
2017-09-27 16:02:16,161 [MainThread  ] [INFO ]  PROGRESS: at sentence #27740000, processed 549288753 words, keeping 2298173 word types
2017-09-27 16:02:17,689 [MainThread  ] [INFO ]  PROGRESS: at sentence #27750000, processed 549487854 words, keeping 2298408 word types
2017-09-27 16:02:19,201 [MainThread  ] [INFO ]  PROGRESS: at sentence #27760000, processed 549679755 words, keeping 2298656 word types
2017-09-27 16:02:20,445 [MainThread  ] [INFO ]  391: ../data/documents/749.json.gz
2017-09-27 16:02:25,753 [MainThread  ] [INFO ]  PROGRESS: at sentence #27770000, processed 549891543 words, keeping 2299032 word types
2017-09-27 16:02:27,287 [MainThread  ] [INFO ]  PROGRESS: at sentence #27780000, processed 550090957 words, keeping 2299311 word types
2017-09-27 16:02:28,856 

2017-09-27 16:04:02,057 [MainThread  ] [INFO ]  PROGRESS: at sentence #28260000, processed 559848168 words, keeping 2335043 word types
2017-09-27 16:04:03,677 [MainThread  ] [INFO ]  PROGRESS: at sentence #28270000, processed 560066587 words, keeping 2335222 word types
2017-09-27 16:04:05,215 [MainThread  ] [INFO ]  PROGRESS: at sentence #28280000, processed 560273277 words, keeping 2335423 word types
2017-09-27 16:04:06,786 [MainThread  ] [INFO ]  PROGRESS: at sentence #28290000, processed 560474760 words, keeping 2335670 word types
2017-09-27 16:04:07,598 [MainThread  ] [INFO ]  403: ../data/documents/244.json.gz
2017-09-27 16:04:13,109 [MainThread  ] [INFO ]  PROGRESS: at sentence #28300000, processed 560663323 words, keeping 2335939 word types
2017-09-27 16:04:14,467 [MainThread  ] [INFO ]  PROGRESS: at sentence #28310000, processed 560837537 words, keeping 2336267 word types
2017-09-27 16:04:15,826 [MainThread  ] [INFO ]  PROGRESS: at sentence #28320000, processed 560999374 words,

2017-09-27 16:05:51,428 [MainThread  ] [INFO ]  PROGRESS: at sentence #28810000, processed 570428109 words, keeping 2353357 word types
2017-09-27 16:05:53,138 [MainThread  ] [INFO ]  PROGRESS: at sentence #28820000, processed 570647693 words, keeping 2353662 word types
2017-09-27 16:05:54,814 [MainThread  ] [INFO ]  PROGRESS: at sentence #28830000, processed 570871898 words, keeping 2353936 word types
2017-09-27 16:05:56,415 [MainThread  ] [INFO ]  PROGRESS: at sentence #28840000, processed 571083884 words, keeping 2354216 word types
2017-09-27 16:05:57,843 [MainThread  ] [INFO ]  PROGRESS: at sentence #28850000, processed 571268873 words, keeping 2354572 word types
2017-09-27 16:05:59,366 [MainThread  ] [INFO ]  PROGRESS: at sentence #28860000, processed 571454258 words, keeping 2354970 word types
2017-09-27 16:05:59,980 [MainThread  ] [INFO ]  413: ../data/documents/460.json.gz
2017-09-27 16:06:03,119 [MainThread  ] [INFO ]  PROGRESS: at sentence #28870000, processed 571649369 words,

2017-09-27 16:07:41,088 [MainThread  ] [INFO ]  PROGRESS: at sentence #29400000, processed 581628695 words, keeping 2374253 word types
2017-09-27 16:07:42,618 [MainThread  ] [INFO ]  PROGRESS: at sentence #29410000, processed 581823552 words, keeping 2374470 word types
2017-09-27 16:07:44,124 [MainThread  ] [INFO ]  PROGRESS: at sentence #29420000, processed 582018169 words, keeping 2374811 word types
2017-09-27 16:07:44,938 [MainThread  ] [INFO ]  417: ../data/documents/442.json.gz
2017-09-27 16:07:46,597 [MainThread  ] [INFO ]  PROGRESS: at sentence #29430000, processed 582233470 words, keeping 2375211 word types
2017-09-27 16:07:48,418 [MainThread  ] [INFO ]  PROGRESS: at sentence #29440000, processed 582481809 words, keeping 2375539 word types
2017-09-27 16:07:49,428 [MainThread  ] [INFO ]  418: ../data/documents/305.json.gz
2017-09-27 16:07:54,202 [MainThread  ] [INFO ]  PROGRESS: at sentence #29450000, processed 582693625 words, keeping 2375854 word types
2017-09-27 16:07:55,589 

2017-09-27 16:09:32,657 [MainThread  ] [INFO ]  PROGRESS: at sentence #29970000, processed 592718514 words, keeping 2391470 word types
2017-09-27 16:09:34,053 [MainThread  ] [INFO ]  PROGRESS: at sentence #29980000, processed 592900606 words, keeping 2391707 word types
2017-09-27 16:09:35,424 [MainThread  ] [INFO ]  PROGRESS: at sentence #29990000, processed 593078900 words, keeping 2391985 word types
2017-09-27 16:09:36,871 [MainThread  ] [INFO ]  PROGRESS: at sentence #30000000, processed 593270755 words, keeping 2392223 word types
2017-09-27 16:09:37,590 [MainThread  ] [INFO ]  423: ../data/documents/353.json.gz
2017-09-27 16:09:39,114 [MainThread  ] [INFO ]  PROGRESS: at sentence #30010000, processed 593515420 words, keeping 2392665 word types
2017-09-27 16:09:39,836 [MainThread  ] [INFO ]  424: ../data/documents/301.json.gz
2017-09-27 16:09:44,187 [MainThread  ] [INFO ]  PROGRESS: at sentence #30020000, processed 593733469 words, keeping 2393097 word types
2017-09-27 16:09:45,657 

2017-09-27 16:11:21,117 [MainThread  ] [INFO ]  PROGRESS: at sentence #30510000, processed 603580810 words, keeping 2427468 word types
2017-09-27 16:11:22,753 [MainThread  ] [INFO ]  PROGRESS: at sentence #30520000, processed 603795115 words, keeping 2427634 word types
2017-09-27 16:11:24,367 [MainThread  ] [INFO ]  PROGRESS: at sentence #30530000, processed 604006203 words, keeping 2427834 word types
2017-09-27 16:11:26,084 [MainThread  ] [INFO ]  PROGRESS: at sentence #30540000, processed 604232910 words, keeping 2428036 word types
2017-09-27 16:11:27,646 [MainThread  ] [INFO ]  PROGRESS: at sentence #30550000, processed 604447467 words, keeping 2428269 word types
2017-09-27 16:11:28,251 [MainThread  ] [INFO ]  435: ../data/documents/850.json.gz
2017-09-27 16:11:32,224 [MainThread  ] [INFO ]  PROGRESS: at sentence #30560000, processed 604697325 words, keeping 2428529 word types
2017-09-27 16:11:34,214 [MainThread  ] [INFO ]  PROGRESS: at sentence #30570000, processed 604970732 words,

2017-09-27 16:13:13,205 [MainThread  ] [INFO ]  PROGRESS: at sentence #31080000, processed 615031014 words, keeping 2442331 word types
2017-09-27 16:13:14,045 [MainThread  ] [INFO ]  442: ../data/documents/479.json.gz
2017-09-27 16:13:15,437 [MainThread  ] [INFO ]  PROGRESS: at sentence #31090000, processed 615235574 words, keeping 2442514 word types
2017-09-27 16:13:17,133 [MainThread  ] [INFO ]  PROGRESS: at sentence #31100000, processed 615465578 words, keeping 2442684 word types
2017-09-27 16:13:17,835 [MainThread  ] [INFO ]  443: ../data/documents/662.json.gz
2017-09-27 16:13:27,997 [MainThread  ] [INFO ]  PROGRESS: at sentence #31110000, processed 615674507 words, keeping 2442913 word types
2017-09-27 16:13:29,615 [MainThread  ] [INFO ]  PROGRESS: at sentence #31120000, processed 615891238 words, keeping 2443650 word types
2017-09-27 16:13:30,996 [MainThread  ] [INFO ]  PROGRESS: at sentence #31130000, processed 616077104 words, keeping 2443890 word types
2017-09-27 16:13:32,474 

2017-09-27 16:15:00,261 [MainThread  ] [INFO ]  452: ../data/documents/431.json.gz
2017-09-27 16:15:03,318 [MainThread  ] [INFO ]  PROGRESS: at sentence #31630000, processed 625738781 words, keeping 2461858 word types
2017-09-27 16:15:04,854 [MainThread  ] [INFO ]  PROGRESS: at sentence #31640000, processed 625938097 words, keeping 2462140 word types
2017-09-27 16:15:06,492 [MainThread  ] [INFO ]  PROGRESS: at sentence #31650000, processed 626157262 words, keeping 2462336 word types
2017-09-27 16:15:08,090 [MainThread  ] [INFO ]  PROGRESS: at sentence #31660000, processed 626374456 words, keeping 2462645 word types
2017-09-27 16:15:09,643 [MainThread  ] [INFO ]  PROGRESS: at sentence #31670000, processed 626583144 words, keeping 2462846 word types
2017-09-27 16:15:10,849 [MainThread  ] [INFO ]  453: ../data/documents/399.json.gz
2017-09-27 16:15:12,102 [MainThread  ] [INFO ]  PROGRESS: at sentence #31680000, processed 626798135 words, keeping 2463140 word types
2017-09-27 16:15:13,964 

2017-09-27 16:16:54,832 [MainThread  ] [INFO ]  PROGRESS: at sentence #32190000, processed 636957188 words, keeping 2476823 word types
2017-09-27 16:16:56,324 [MainThread  ] [INFO ]  PROGRESS: at sentence #32200000, processed 637154789 words, keeping 2477114 word types
2017-09-27 16:16:57,760 [MainThread  ] [INFO ]  PROGRESS: at sentence #32210000, processed 637338463 words, keeping 2477324 word types
2017-09-27 16:16:59,342 [MainThread  ] [INFO ]  PROGRESS: at sentence #32220000, processed 637536413 words, keeping 2477760 word types
2017-09-27 16:17:00,479 [MainThread  ] [INFO ]  461: ../data/documents/388.json.gz
2017-09-27 16:17:03,648 [MainThread  ] [INFO ]  PROGRESS: at sentence #32230000, processed 637744440 words, keeping 2477963 word types
2017-09-27 16:17:05,301 [MainThread  ] [INFO ]  462: ../data/documents/681.json.gz
2017-09-27 16:17:12,204 [MainThread  ] [INFO ]  PROGRESS: at sentence #32240000, processed 637984937 words, keeping 2478165 word types
2017-09-27 16:17:13,661 

2017-09-27 16:18:42,203 [MainThread  ] [INFO ]  469: ../data/documents/492.json.gz
2017-09-27 16:18:46,041 [MainThread  ] [INFO ]  PROGRESS: at sentence #32750000, processed 647869130 words, keeping 2496563 word types
2017-09-27 16:18:47,913 [MainThread  ] [INFO ]  PROGRESS: at sentence #32760000, processed 648123387 words, keeping 2496915 word types
2017-09-27 16:18:48,630 [MainThread  ] [INFO ]  470: ../data/documents/568.json.gz
2017-09-27 16:18:50,835 [MainThread  ] [INFO ]  PROGRESS: at sentence #32770000, processed 648327066 words, keeping 2497100 word types
2017-09-27 16:18:52,522 [MainThread  ] [INFO ]  PROGRESS: at sentence #32780000, processed 648552814 words, keeping 2497288 word types
2017-09-27 16:18:54,071 [MainThread  ] [INFO ]  PROGRESS: at sentence #32790000, processed 648768035 words, keeping 2497463 word types
2017-09-27 16:18:55,716 [MainThread  ] [INFO ]  PROGRESS: at sentence #32800000, processed 648992953 words, keeping 2497670 word types
2017-09-27 16:18:57,332 

2017-09-27 16:20:33,217 [MainThread  ] [INFO ]  475: ../data/documents/403.json.gz
2017-09-27 16:20:34,895 [MainThread  ] [INFO ]  PROGRESS: at sentence #33320000, processed 659006158 words, keeping 2513461 word types
2017-09-27 16:20:35,762 [MainThread  ] [INFO ]  476: ../data/documents/105.json.gz
2017-09-27 16:20:40,159 [MainThread  ] [INFO ]  PROGRESS: at sentence #33330000, processed 659219068 words, keeping 2513864 word types
2017-09-27 16:20:41,515 [MainThread  ] [INFO ]  PROGRESS: at sentence #33340000, processed 659396069 words, keeping 2514217 word types
2017-09-27 16:20:42,840 [MainThread  ] [INFO ]  PROGRESS: at sentence #33350000, processed 659569569 words, keeping 2514492 word types
2017-09-27 16:20:44,303 [MainThread  ] [INFO ]  PROGRESS: at sentence #33360000, processed 659754927 words, keeping 2514935 word types
2017-09-27 16:20:45,686 [MainThread  ] [INFO ]  PROGRESS: at sentence #33370000, processed 659933632 words, keeping 2515235 word types
2017-09-27 16:20:47,079 

2017-09-27 16:22:25,669 [MainThread  ] [INFO ]  PROGRESS: at sentence #33880000, processed 669626404 words, keeping 2529795 word types
2017-09-27 16:22:27,077 [MainThread  ] [INFO ]  PROGRESS: at sentence #33890000, processed 669810354 words, keeping 2529977 word types
2017-09-27 16:22:28,458 [MainThread  ] [INFO ]  PROGRESS: at sentence #33900000, processed 669990250 words, keeping 2530204 word types
2017-09-27 16:22:29,964 [MainThread  ] [INFO ]  PROGRESS: at sentence #33910000, processed 670190319 words, keeping 2531484 word types
2017-09-27 16:22:31,542 [MainThread  ] [INFO ]  PROGRESS: at sentence #33920000, processed 670396017 words, keeping 2531715 word types
2017-09-27 16:22:33,012 [MainThread  ] [INFO ]  PROGRESS: at sentence #33930000, processed 670582115 words, keeping 2532020 word types
2017-09-27 16:22:34,546 [MainThread  ] [INFO ]  PROGRESS: at sentence #33940000, processed 670779467 words, keeping 2532185 word types
2017-09-27 16:22:35,941 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:24:12,592 [MainThread  ] [INFO ]  PROGRESS: at sentence #34430000, processed 680589171 words, keeping 2548209 word types
2017-09-27 16:24:12,659 [MainThread  ] [INFO ]  493: ../data/documents/21.json.gz
2017-09-27 16:24:17,303 [MainThread  ] [INFO ]  PROGRESS: at sentence #34440000, processed 680772308 words, keeping 2549491 word types
2017-09-27 16:24:18,721 [MainThread  ] [INFO ]  PROGRESS: at sentence #34450000, processed 680952998 words, keeping 2551456 word types
2017-09-27 16:24:20,104 [MainThread  ] [INFO ]  PROGRESS: at sentence #34460000, processed 681127737 words, keeping 2552600 word types
2017-09-27 16:24:21,510 [MainThread  ] [INFO ]  PROGRESS: at sentence #34470000, processed 681307135 words, keeping 2553057 word types
2017-09-27 16:24:22,961 [MainThread  ] [INFO ]  PROGRESS: at sentence #34480000, processed 681489268 words, keeping 2553623 word types
2017-09-27 16:24:23,201 [MainThread  ] [INFO ]  494: ../data/documents/396.json.gz
2017-09-27 16:24:25,561 [

2017-09-27 16:26:06,172 [MainThread  ] [INFO ]  PROGRESS: at sentence #34970000, processed 691501373 words, keeping 2571623 word types
2017-09-27 16:26:07,818 [MainThread  ] [INFO ]  PROGRESS: at sentence #34980000, processed 691703811 words, keeping 2571827 word types
2017-09-27 16:26:09,308 [MainThread  ] [INFO ]  PROGRESS: at sentence #34990000, processed 691893623 words, keeping 2572036 word types
2017-09-27 16:26:10,815 [MainThread  ] [INFO ]  PROGRESS: at sentence #35000000, processed 692081915 words, keeping 2572245 word types
2017-09-27 16:26:12,420 [MainThread  ] [INFO ]  PROGRESS: at sentence #35010000, processed 692279031 words, keeping 2572424 word types
2017-09-27 16:26:14,105 [MainThread  ] [INFO ]  PROGRESS: at sentence #35020000, processed 692500348 words, keeping 2572625 word types
2017-09-27 16:26:15,801 [MainThread  ] [INFO ]  PROGRESS: at sentence #35030000, processed 692707288 words, keeping 2572874 word types
2017-09-27 16:26:16,736 [MainThread  ] [INFO ]  504: ..

2017-09-27 16:28:00,983 [MainThread  ] [INFO ]  PROGRESS: at sentence #35550000, processed 702718190 words, keeping 2587625 word types
2017-09-27 16:28:02,633 [MainThread  ] [INFO ]  PROGRESS: at sentence #35560000, processed 702933756 words, keeping 2587809 word types
2017-09-27 16:28:04,397 [MainThread  ] [INFO ]  PROGRESS: at sentence #35570000, processed 703169044 words, keeping 2588169 word types
2017-09-27 16:28:06,205 [MainThread  ] [INFO ]  PROGRESS: at sentence #35580000, processed 703411284 words, keeping 2588439 word types
2017-09-27 16:28:07,825 [MainThread  ] [INFO ]  PROGRESS: at sentence #35590000, processed 703630306 words, keeping 2588614 word types
2017-09-27 16:28:09,226 [MainThread  ] [INFO ]  PROGRESS: at sentence #35600000, processed 703814243 words, keeping 2588812 word types
2017-09-27 16:28:10,910 [MainThread  ] [INFO ]  PROGRESS: at sentence #35610000, processed 704038260 words, keeping 2589073 word types
2017-09-27 16:28:12,779 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:29:57,607 [MainThread  ] [INFO ]  PROGRESS: at sentence #36120000, processed 714324167 words, keeping 2602706 word types
2017-09-27 16:29:59,015 [MainThread  ] [INFO ]  PROGRESS: at sentence #36130000, processed 714511774 words, keeping 2603316 word types
2017-09-27 16:30:00,702 [MainThread  ] [INFO ]  PROGRESS: at sentence #36140000, processed 714730689 words, keeping 2603539 word types
2017-09-27 16:30:02,189 [MainThread  ] [INFO ]  PROGRESS: at sentence #36150000, processed 714922345 words, keeping 2603788 word types
2017-09-27 16:30:03,704 [MainThread  ] [INFO ]  PROGRESS: at sentence #36160000, processed 715125560 words, keeping 2604221 word types
2017-09-27 16:30:05,111 [MainThread  ] [INFO ]  PROGRESS: at sentence #36170000, processed 715308241 words, keeping 2604313 word types
2017-09-27 16:30:06,646 [MainThread  ] [INFO ]  PROGRESS: at sentence #36180000, processed 715503189 words, keeping 2604587 word types
2017-09-27 16:30:08,155 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:31:42,616 [MainThread  ] [INFO ]  PROGRESS: at sentence #36690000, processed 725052378 words, keeping 2621088 word types
2017-09-27 16:31:44,093 [MainThread  ] [INFO ]  PROGRESS: at sentence #36700000, processed 725245278 words, keeping 2621230 word types
2017-09-27 16:31:45,482 [MainThread  ] [INFO ]  PROGRESS: at sentence #36710000, processed 725426494 words, keeping 2621425 word types
2017-09-27 16:31:47,100 [MainThread  ] [INFO ]  PROGRESS: at sentence #36720000, processed 725633312 words, keeping 2621833 word types
2017-09-27 16:31:48,664 [MainThread  ] [INFO ]  PROGRESS: at sentence #36730000, processed 725840045 words, keeping 2621976 word types
2017-09-27 16:31:50,150 [MainThread  ] [INFO ]  PROGRESS: at sentence #36740000, processed 726041077 words, keeping 2622149 word types
2017-09-27 16:31:51,696 [MainThread  ] [INFO ]  PROGRESS: at sentence #36750000, processed 726243534 words, keeping 2622322 word types
2017-09-27 16:31:53,164 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:33:30,929 [MainThread  ] [INFO ]  PROGRESS: at sentence #37260000, processed 736070235 words, keeping 2641631 word types
2017-09-27 16:33:32,542 [MainThread  ] [INFO ]  PROGRESS: at sentence #37270000, processed 736280866 words, keeping 2641899 word types
2017-09-27 16:33:34,187 [MainThread  ] [INFO ]  PROGRESS: at sentence #37280000, processed 736487513 words, keeping 2642103 word types
2017-09-27 16:33:35,665 [MainThread  ] [INFO ]  PROGRESS: at sentence #37290000, processed 736680343 words, keeping 2642391 word types
2017-09-27 16:33:35,883 [MainThread  ] [INFO ]  528: ../data/documents/604.json.gz
2017-09-27 16:33:43,786 [MainThread  ] [INFO ]  PROGRESS: at sentence #37300000, processed 736889144 words, keeping 2642700 word types
2017-09-27 16:33:45,205 [MainThread  ] [INFO ]  PROGRESS: at sentence #37310000, processed 737076464 words, keeping 2642939 word types
2017-09-27 16:33:46,709 [MainThread  ] [INFO ]  PROGRESS: at sentence #37320000, processed 737267832 words,

2017-09-27 16:35:22,908 [MainThread  ] [INFO ]  PROGRESS: at sentence #37820000, processed 746893384 words, keeping 2658860 word types
2017-09-27 16:35:24,243 [MainThread  ] [INFO ]  PROGRESS: at sentence #37830000, processed 747057702 words, keeping 2659661 word types
2017-09-27 16:35:25,638 [MainThread  ] [INFO ]  PROGRESS: at sentence #37840000, processed 747241278 words, keeping 2660250 word types
2017-09-27 16:35:26,991 [MainThread  ] [INFO ]  PROGRESS: at sentence #37850000, processed 747413885 words, keeping 2660570 word types
2017-09-27 16:35:28,401 [MainThread  ] [INFO ]  PROGRESS: at sentence #37860000, processed 747596518 words, keeping 2660900 word types
2017-09-27 16:35:29,855 [MainThread  ] [INFO ]  PROGRESS: at sentence #37870000, processed 747783061 words, keeping 2661313 word types
2017-09-27 16:35:31,257 [MainThread  ] [INFO ]  PROGRESS: at sentence #37880000, processed 747958536 words, keeping 2661686 word types
2017-09-27 16:35:32,665 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:37:10,979 [MainThread  ] [INFO ]  PROGRESS: at sentence #38380000, processed 757622003 words, keeping 2672904 word types
2017-09-27 16:37:12,632 [MainThread  ] [INFO ]  PROGRESS: at sentence #38390000, processed 757821895 words, keeping 2673144 word types
2017-09-27 16:37:14,083 [MainThread  ] [INFO ]  PROGRESS: at sentence #38400000, processed 758007452 words, keeping 2673433 word types
2017-09-27 16:37:15,558 [MainThread  ] [INFO ]  PROGRESS: at sentence #38410000, processed 758200229 words, keeping 2673615 word types
2017-09-27 16:37:17,054 [MainThread  ] [INFO ]  PROGRESS: at sentence #38420000, processed 758387062 words, keeping 2673844 word types
2017-09-27 16:37:18,552 [MainThread  ] [INFO ]  PROGRESS: at sentence #38430000, processed 758573008 words, keeping 2674094 word types
2017-09-27 16:37:19,073 [MainThread  ] [INFO ]  544: ../data/documents/465.json.gz
2017-09-27 16:37:26,178 [MainThread  ] [INFO ]  PROGRESS: at sentence #38440000, processed 758764892 words,

2017-09-27 16:39:01,362 [MainThread  ] [INFO ]  PROGRESS: at sentence #38950000, processed 768404285 words, keeping 2689225 word types
2017-09-27 16:39:02,728 [MainThread  ] [INFO ]  PROGRESS: at sentence #38960000, processed 768579887 words, keeping 2689533 word types
2017-09-27 16:39:04,183 [MainThread  ] [INFO ]  PROGRESS: at sentence #38970000, processed 768765461 words, keeping 2689776 word types
2017-09-27 16:39:05,587 [MainThread  ] [INFO ]  PROGRESS: at sentence #38980000, processed 768941111 words, keeping 2690076 word types
2017-09-27 16:39:07,019 [MainThread  ] [INFO ]  PROGRESS: at sentence #38990000, processed 769129683 words, keeping 2690244 word types
2017-09-27 16:39:08,578 [MainThread  ] [INFO ]  PROGRESS: at sentence #39000000, processed 769331403 words, keeping 2690651 word types
2017-09-27 16:39:10,054 [MainThread  ] [INFO ]  PROGRESS: at sentence #39010000, processed 769520166 words, keeping 2690820 word types
2017-09-27 16:39:11,427 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:40:48,395 [MainThread  ] [INFO ]  PROGRESS: at sentence #39530000, processed 779036833 words, keeping 2717202 word types
2017-09-27 16:40:49,854 [MainThread  ] [INFO ]  PROGRESS: at sentence #39540000, processed 779226946 words, keeping 2717366 word types
2017-09-27 16:40:51,281 [MainThread  ] [INFO ]  PROGRESS: at sentence #39550000, processed 779409634 words, keeping 2717569 word types
2017-09-27 16:40:52,890 [MainThread  ] [INFO ]  PROGRESS: at sentence #39560000, processed 779619209 words, keeping 2717714 word types
2017-09-27 16:40:54,410 [MainThread  ] [INFO ]  PROGRESS: at sentence #39570000, processed 779809737 words, keeping 2717912 word types
2017-09-27 16:40:55,982 [MainThread  ] [INFO ]  PROGRESS: at sentence #39580000, processed 780008875 words, keeping 2718033 word types
2017-09-27 16:40:57,454 [MainThread  ] [INFO ]  PROGRESS: at sentence #39590000, processed 780197333 words, keeping 2718176 word types
2017-09-27 16:40:57,488 [MainThread  ] [INFO ]  557: ..

2017-09-27 16:42:34,102 [MainThread  ] [INFO ]  PROGRESS: at sentence #40090000, processed 789613822 words, keeping 2740991 word types
2017-09-27 16:42:35,455 [MainThread  ] [INFO ]  PROGRESS: at sentence #40100000, processed 789788407 words, keeping 2741240 word types
2017-09-27 16:42:35,572 [MainThread  ] [INFO ]  566: ../data/documents/259.json.gz
2017-09-27 16:42:38,257 [MainThread  ] [INFO ]  PROGRESS: at sentence #40110000, processed 789976622 words, keeping 2747083 word types
2017-09-27 16:42:39,786 [MainThread  ] [INFO ]  PROGRESS: at sentence #40120000, processed 790181580 words, keeping 2752601 word types
2017-09-27 16:42:41,191 [MainThread  ] [INFO ]  PROGRESS: at sentence #40130000, processed 790367846 words, keeping 2758025 word types
2017-09-27 16:42:42,656 [MainThread  ] [INFO ]  PROGRESS: at sentence #40140000, processed 790566736 words, keeping 2766031 word types
2017-09-27 16:42:44,137 [MainThread  ] [INFO ]  PROGRESS: at sentence #40150000, processed 790773425 words,

2017-09-27 16:44:30,326 [MainThread  ] [INFO ]  PROGRESS: at sentence #40650000, processed 800873187 words, keeping 2783911 word types
2017-09-27 16:44:31,719 [MainThread  ] [INFO ]  PROGRESS: at sentence #40660000, processed 801046703 words, keeping 2784307 word types
2017-09-27 16:44:33,185 [MainThread  ] [INFO ]  PROGRESS: at sentence #40670000, processed 801236325 words, keeping 2784480 word types
2017-09-27 16:44:34,698 [MainThread  ] [INFO ]  PROGRESS: at sentence #40680000, processed 801421118 words, keeping 2784723 word types
2017-09-27 16:44:36,149 [MainThread  ] [INFO ]  PROGRESS: at sentence #40690000, processed 801614018 words, keeping 2784978 word types
2017-09-27 16:44:37,612 [MainThread  ] [INFO ]  PROGRESS: at sentence #40700000, processed 801804703 words, keeping 2785314 word types
2017-09-27 16:44:39,106 [MainThread  ] [INFO ]  PROGRESS: at sentence #40710000, processed 802000406 words, keeping 2785509 word types
2017-09-27 16:44:40,640 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:46:21,315 [MainThread  ] [INFO ]  PROGRESS: at sentence #41240000, processed 812114946 words, keeping 2801405 word types
2017-09-27 16:46:22,747 [MainThread  ] [INFO ]  PROGRESS: at sentence #41250000, processed 812297227 words, keeping 2801578 word types
2017-09-27 16:46:24,253 [MainThread  ] [INFO ]  PROGRESS: at sentence #41260000, processed 812496050 words, keeping 2802199 word types
2017-09-27 16:46:25,666 [MainThread  ] [INFO ]  PROGRESS: at sentence #41270000, processed 812676143 words, keeping 2802361 word types
2017-09-27 16:46:27,093 [MainThread  ] [INFO ]  PROGRESS: at sentence #41280000, processed 812861661 words, keeping 2802478 word types
2017-09-27 16:46:28,667 [MainThread  ] [INFO ]  PROGRESS: at sentence #41290000, processed 813058703 words, keeping 2802604 word types
2017-09-27 16:46:30,163 [MainThread  ] [INFO ]  PROGRESS: at sentence #41300000, processed 813253634 words, keeping 2802702 word types
2017-09-27 16:46:30,637 [MainThread  ] [INFO ]  578: ..

2017-09-27 16:48:06,949 [MainThread  ] [INFO ]  PROGRESS: at sentence #41800000, processed 822694580 words, keeping 2815394 word types
2017-09-27 16:48:08,018 [MainThread  ] [INFO ]  586: ../data/documents/664.json.gz
2017-09-27 16:48:16,100 [MainThread  ] [INFO ]  PROGRESS: at sentence #41810000, processed 822914060 words, keeping 2815759 word types
2017-09-27 16:48:17,535 [MainThread  ] [INFO ]  PROGRESS: at sentence #41820000, processed 823098482 words, keeping 2815947 word types
2017-09-27 16:48:19,067 [MainThread  ] [INFO ]  PROGRESS: at sentence #41830000, processed 823293103 words, keeping 2816192 word types
2017-09-27 16:48:20,585 [MainThread  ] [INFO ]  PROGRESS: at sentence #41840000, processed 823486500 words, keeping 2816314 word types
2017-09-27 16:48:22,081 [MainThread  ] [INFO ]  PROGRESS: at sentence #41850000, processed 823673338 words, keeping 2816540 word types
2017-09-27 16:48:23,417 [MainThread  ] [INFO ]  PROGRESS: at sentence #41860000, processed 823838976 words,

2017-09-27 16:50:00,754 [MainThread  ] [INFO ]  PROGRESS: at sentence #42380000, processed 833776684 words, keeping 2832466 word types
2017-09-27 16:50:02,183 [MainThread  ] [INFO ]  PROGRESS: at sentence #42390000, processed 833956265 words, keeping 2832682 word types
2017-09-27 16:50:03,633 [MainThread  ] [INFO ]  PROGRESS: at sentence #42400000, processed 834141702 words, keeping 2832903 word types
2017-09-27 16:50:05,163 [MainThread  ] [INFO ]  PROGRESS: at sentence #42410000, processed 834338999 words, keeping 2833109 word types
2017-09-27 16:50:05,650 [MainThread  ] [INFO ]  592: ../data/documents/703.json.gz
2017-09-27 16:50:07,707 [MainThread  ] [INFO ]  PROGRESS: at sentence #42420000, processed 834579098 words, keeping 2833342 word types
2017-09-27 16:50:09,735 [MainThread  ] [INFO ]  PROGRESS: at sentence #42430000, processed 834857541 words, keeping 2833624 word types
2017-09-27 16:50:10,141 [MainThread  ] [INFO ]  593: ../data/documents/951.json.gz
2017-09-27 16:50:12,526 

2017-09-27 16:51:54,964 [MainThread  ] [INFO ]  PROGRESS: at sentence #42940000, processed 845010706 words, keeping 2853500 word types
2017-09-27 16:51:56,403 [MainThread  ] [INFO ]  PROGRESS: at sentence #42950000, processed 845202542 words, keeping 2853690 word types
2017-09-27 16:51:57,884 [MainThread  ] [INFO ]  PROGRESS: at sentence #42960000, processed 845397134 words, keeping 2853940 word types
2017-09-27 16:51:59,477 [MainThread  ] [INFO ]  PROGRESS: at sentence #42970000, processed 845597960 words, keeping 2854164 word types
2017-09-27 16:52:00,989 [MainThread  ] [INFO ]  PROGRESS: at sentence #42980000, processed 845789410 words, keeping 2854299 word types
2017-09-27 16:52:01,903 [MainThread  ] [INFO ]  601: ../data/documents/914.json.gz
2017-09-27 16:52:03,946 [MainThread  ] [INFO ]  PROGRESS: at sentence #42990000, processed 846001858 words, keeping 2854550 word types
2017-09-27 16:52:05,468 [MainThread  ] [INFO ]  PROGRESS: at sentence #43000000, processed 846196285 words,

2017-09-27 16:53:47,855 [MainThread  ] [INFO ]  PROGRESS: at sentence #43510000, processed 856263084 words, keeping 2866455 word types
2017-09-27 16:53:48,772 [MainThread  ] [INFO ]  608: ../data/documents/273.json.gz
2017-09-27 16:53:50,817 [MainThread  ] [INFO ]  PROGRESS: at sentence #43520000, processed 856462839 words, keeping 2866629 word types
2017-09-27 16:53:52,394 [MainThread  ] [INFO ]  PROGRESS: at sentence #43530000, processed 856661300 words, keeping 2866863 word types
2017-09-27 16:53:53,922 [MainThread  ] [INFO ]  PROGRESS: at sentence #43540000, processed 856862203 words, keeping 2867132 word types
2017-09-27 16:53:55,429 [MainThread  ] [INFO ]  PROGRESS: at sentence #43550000, processed 857059807 words, keeping 2867292 word types
2017-09-27 16:53:56,621 [MainThread  ] [INFO ]  609: ../data/documents/421.json.gz
2017-09-27 16:54:04,413 [MainThread  ] [INFO ]  PROGRESS: at sentence #43560000, processed 857246225 words, keeping 2867517 word types
2017-09-27 16:54:05,868 

2017-09-27 16:55:38,592 [MainThread  ] [INFO ]  PROGRESS: at sentence #44070000, processed 867004798 words, keeping 2881158 word types
2017-09-27 16:55:40,077 [MainThread  ] [INFO ]  PROGRESS: at sentence #44080000, processed 867188472 words, keeping 2881381 word types
2017-09-27 16:55:41,521 [MainThread  ] [INFO ]  PROGRESS: at sentence #44090000, processed 867370837 words, keeping 2881612 word types
2017-09-27 16:55:42,948 [MainThread  ] [INFO ]  PROGRESS: at sentence #44100000, processed 867553663 words, keeping 2881798 word types
2017-09-27 16:55:43,260 [MainThread  ] [INFO ]  617: ../data/documents/753.json.gz
2017-09-27 16:55:47,676 [MainThread  ] [INFO ]  PROGRESS: at sentence #44110000, processed 867799822 words, keeping 2882047 word types
2017-09-27 16:55:49,610 [MainThread  ] [INFO ]  PROGRESS: at sentence #44120000, processed 868069122 words, keeping 2882258 word types
2017-09-27 16:55:49,712 [MainThread  ] [INFO ]  618: ../data/documents/713.json.gz
2017-09-27 16:55:52,265 

2017-09-27 16:57:37,633 [MainThread  ] [INFO ]  PROGRESS: at sentence #44600000, processed 878082634 words, keeping 2892612 word types
2017-09-27 16:57:39,175 [MainThread  ] [INFO ]  PROGRESS: at sentence #44610000, processed 878276250 words, keeping 2892820 word types
2017-09-27 16:57:40,632 [MainThread  ] [INFO ]  PROGRESS: at sentence #44620000, processed 878463135 words, keeping 2893048 word types
2017-09-27 16:57:42,196 [MainThread  ] [INFO ]  PROGRESS: at sentence #44630000, processed 878656816 words, keeping 2893258 word types
2017-09-27 16:57:43,732 [MainThread  ] [INFO ]  PROGRESS: at sentence #44640000, processed 878855197 words, keeping 2893533 word types
2017-09-27 16:57:45,205 [MainThread  ] [INFO ]  PROGRESS: at sentence #44650000, processed 879043899 words, keeping 2893723 word types
2017-09-27 16:57:46,712 [MainThread  ] [INFO ]  PROGRESS: at sentence #44660000, processed 879240096 words, keeping 2893934 word types
2017-09-27 16:57:48,214 [MainThread  ] [INFO ]  PROGRES

2017-09-27 16:59:25,728 [MainThread  ] [INFO ]  PROGRESS: at sentence #45170000, processed 889247196 words, keeping 2905899 word types
2017-09-27 16:59:27,284 [MainThread  ] [INFO ]  PROGRESS: at sentence #45180000, processed 889449108 words, keeping 2906038 word types
2017-09-27 16:59:28,828 [MainThread  ] [INFO ]  PROGRESS: at sentence #45190000, processed 889642782 words, keeping 2906140 word types
2017-09-27 16:59:30,387 [MainThread  ] [INFO ]  PROGRESS: at sentence #45200000, processed 889841108 words, keeping 2906364 word types
2017-09-27 16:59:31,024 [MainThread  ] [INFO ]  637: ../data/documents/598.json.gz
2017-09-27 16:59:34,039 [MainThread  ] [INFO ]  PROGRESS: at sentence #45210000, processed 890026475 words, keeping 2906491 word types
2017-09-27 16:59:35,583 [MainThread  ] [INFO ]  PROGRESS: at sentence #45220000, processed 890222839 words, keeping 2906659 word types
2017-09-27 16:59:37,029 [MainThread  ] [INFO ]  PROGRESS: at sentence #45230000, processed 890414114 words,

2017-09-27 17:01:23,298 [MainThread  ] [INFO ]  PROGRESS: at sentence #45730000, processed 900259859 words, keeping 2918595 word types
2017-09-27 17:01:24,844 [MainThread  ] [INFO ]  PROGRESS: at sentence #45740000, processed 900465325 words, keeping 2918925 word types
2017-09-27 17:01:26,301 [MainThread  ] [INFO ]  PROGRESS: at sentence #45750000, processed 900651489 words, keeping 2919123 word types
2017-09-27 17:01:27,802 [MainThread  ] [INFO ]  PROGRESS: at sentence #45760000, processed 900846725 words, keeping 2919353 word types
2017-09-27 17:01:29,316 [MainThread  ] [INFO ]  PROGRESS: at sentence #45770000, processed 901031097 words, keeping 2919566 word types
2017-09-27 17:01:30,801 [MainThread  ] [INFO ]  PROGRESS: at sentence #45780000, processed 901224979 words, keeping 2919736 word types
2017-09-27 17:01:32,332 [MainThread  ] [INFO ]  PROGRESS: at sentence #45790000, processed 901421818 words, keeping 2919873 word types
2017-09-27 17:01:33,747 [MainThread  ] [INFO ]  PROGRES

2017-09-27 17:03:13,774 [MainThread  ] [INFO ]  PROGRESS: at sentence #46320000, processed 911388051 words, keeping 2932052 word types
2017-09-27 17:03:15,219 [MainThread  ] [INFO ]  PROGRESS: at sentence #46330000, processed 911573530 words, keeping 2932296 word types
2017-09-27 17:03:16,709 [MainThread  ] [INFO ]  PROGRESS: at sentence #46340000, processed 911759875 words, keeping 2932587 word types
2017-09-27 17:03:18,354 [MainThread  ] [INFO ]  PROGRESS: at sentence #46350000, processed 911957956 words, keeping 2933056 word types
2017-09-27 17:03:19,897 [MainThread  ] [INFO ]  PROGRESS: at sentence #46360000, processed 912147532 words, keeping 2933311 word types
2017-09-27 17:03:21,312 [MainThread  ] [INFO ]  PROGRESS: at sentence #46370000, processed 912329849 words, keeping 2933680 word types
2017-09-27 17:03:22,819 [MainThread  ] [INFO ]  PROGRESS: at sentence #46380000, processed 912525274 words, keeping 2933861 word types
2017-09-27 17:03:23,646 [MainThread  ] [INFO ]  650: ..

2017-09-27 17:05:03,308 [MainThread  ] [INFO ]  PROGRESS: at sentence #46860000, processed 922271334 words, keeping 2957664 word types
2017-09-27 17:05:05,054 [MainThread  ] [INFO ]  661: ../data/documents/715.json.gz
2017-09-27 17:05:06,392 [MainThread  ] [INFO ]  PROGRESS: at sentence #46870000, processed 922546687 words, keeping 2957879 word types
2017-09-27 17:05:08,280 [MainThread  ] [INFO ]  PROGRESS: at sentence #46880000, processed 922797393 words, keeping 2958095 word types
2017-09-27 17:05:09,969 [MainThread  ] [INFO ]  PROGRESS: at sentence #46890000, processed 923025724 words, keeping 2958241 word types
2017-09-27 17:05:11,723 [MainThread  ] [INFO ]  PROGRESS: at sentence #46900000, processed 923251353 words, keeping 2958432 word types
2017-09-27 17:05:11,908 [MainThread  ] [INFO ]  662: ../data/documents/222.json.gz
2017-09-27 17:05:18,095 [MainThread  ] [INFO ]  PROGRESS: at sentence #46910000, processed 923424789 words, keeping 2958836 word types
2017-09-27 17:05:19,653 

2017-09-27 17:06:55,956 [MainThread  ] [INFO ]  PROGRESS: at sentence #47420000, processed 933234556 words, keeping 2972406 word types
2017-09-27 17:06:57,424 [MainThread  ] [INFO ]  PROGRESS: at sentence #47430000, processed 933409150 words, keeping 2972654 word types
2017-09-27 17:06:58,812 [MainThread  ] [INFO ]  PROGRESS: at sentence #47440000, processed 933584752 words, keeping 2972953 word types
2017-09-27 17:07:00,274 [MainThread  ] [INFO ]  PROGRESS: at sentence #47450000, processed 933765723 words, keeping 2973211 word types
2017-09-27 17:07:01,730 [MainThread  ] [INFO ]  PROGRESS: at sentence #47460000, processed 933948394 words, keeping 2973550 word types
2017-09-27 17:07:03,199 [MainThread  ] [INFO ]  PROGRESS: at sentence #47470000, processed 934136133 words, keeping 2973699 word types
2017-09-27 17:07:03,456 [MainThread  ] [INFO ]  669: ../data/documents/605.json.gz
2017-09-27 17:07:13,204 [MainThread  ] [INFO ]  PROGRESS: at sentence #47480000, processed 934323718 words,

2017-09-27 17:08:48,601 [MainThread  ] [INFO ]  PROGRESS: at sentence #47990000, processed 944376201 words, keeping 2984995 word types
2017-09-27 17:08:50,158 [MainThread  ] [INFO ]  PROGRESS: at sentence #48000000, processed 944576586 words, keeping 2985283 word types
2017-09-27 17:08:50,679 [MainThread  ] [INFO ]  676: ../data/documents/593.json.gz
2017-09-27 17:08:56,112 [MainThread  ] [INFO ]  PROGRESS: at sentence #48010000, processed 944769580 words, keeping 2985517 word types
2017-09-27 17:08:57,478 [MainThread  ] [INFO ]  PROGRESS: at sentence #48020000, processed 944940449 words, keeping 2985678 word types
2017-09-27 17:08:58,911 [MainThread  ] [INFO ]  PROGRESS: at sentence #48030000, processed 945122881 words, keeping 2985827 word types
2017-09-27 17:09:00,412 [MainThread  ] [INFO ]  PROGRESS: at sentence #48040000, processed 945306761 words, keeping 2986017 word types
2017-09-27 17:09:01,803 [MainThread  ] [INFO ]  PROGRESS: at sentence #48050000, processed 945483154 words,

2017-09-27 17:10:38,934 [MainThread  ] [INFO ]  PROGRESS: at sentence #48560000, processed 955079604 words, keeping 2999440 word types
2017-09-27 17:10:40,454 [MainThread  ] [INFO ]  PROGRESS: at sentence #48570000, processed 955270899 words, keeping 2999611 word types
2017-09-27 17:10:41,025 [MainThread  ] [INFO ]  682: ../data/documents/744.json.gz
2017-09-27 17:10:48,327 [MainThread  ] [INFO ]  PROGRESS: at sentence #48580000, processed 955442757 words, keeping 2999868 word types
2017-09-27 17:10:49,807 [MainThread  ] [INFO ]  PROGRESS: at sentence #48590000, processed 955635603 words, keeping 2999994 word types
2017-09-27 17:10:51,348 [MainThread  ] [INFO ]  PROGRESS: at sentence #48600000, processed 955839245 words, keeping 3000211 word types
2017-09-27 17:10:52,880 [MainThread  ] [INFO ]  PROGRESS: at sentence #48610000, processed 956036526 words, keeping 3000338 word types
2017-09-27 17:10:54,472 [MainThread  ] [INFO ]  PROGRESS: at sentence #48620000, processed 956238605 words,

2017-09-27 17:12:32,006 [MainThread  ] [INFO ]  PROGRESS: at sentence #49120000, processed 965835381 words, keeping 3020721 word types
2017-09-27 17:12:33,547 [MainThread  ] [INFO ]  PROGRESS: at sentence #49130000, processed 966038329 words, keeping 3020931 word types
2017-09-27 17:12:35,125 [MainThread  ] [INFO ]  PROGRESS: at sentence #49140000, processed 966244240 words, keeping 3021360 word types
2017-09-27 17:12:36,616 [MainThread  ] [INFO ]  PROGRESS: at sentence #49150000, processed 966436629 words, keeping 3021493 word types
2017-09-27 17:12:38,130 [MainThread  ] [INFO ]  PROGRESS: at sentence #49160000, processed 966626008 words, keeping 3021892 word types
2017-09-27 17:12:39,416 [MainThread  ] [INFO ]  691: ../data/documents/733.json.gz
2017-09-27 17:12:48,261 [MainThread  ] [INFO ]  PROGRESS: at sentence #49170000, processed 966821620 words, keeping 3022030 word types
2017-09-27 17:12:49,754 [MainThread  ] [INFO ]  PROGRESS: at sentence #49180000, processed 967014600 words,

2017-09-27 17:14:28,376 [MainThread  ] [INFO ]  PROGRESS: at sentence #49710000, processed 977453071 words, keeping 3041164 word types
2017-09-27 17:14:29,812 [MainThread  ] [INFO ]  PROGRESS: at sentence #49720000, processed 977629160 words, keeping 3043137 word types
2017-09-27 17:14:31,342 [MainThread  ] [INFO ]  PROGRESS: at sentence #49730000, processed 977810519 words, keeping 3045298 word types
2017-09-27 17:14:32,839 [MainThread  ] [INFO ]  PROGRESS: at sentence #49740000, processed 977997259 words, keeping 3047900 word types
2017-09-27 17:14:33,596 [MainThread  ] [INFO ]  695: ../data/documents/641.json.gz
2017-09-27 17:14:35,248 [MainThread  ] [INFO ]  PROGRESS: at sentence #49750000, processed 978190283 words, keeping 3048665 word types
2017-09-27 17:14:36,980 [MainThread  ] [INFO ]  PROGRESS: at sentence #49760000, processed 978410533 words, keeping 3048817 word types
2017-09-27 17:14:38,798 [MainThread  ] [INFO ]  PROGRESS: at sentence #49770000, processed 978649962 words,

2017-09-27 17:16:17,879 [MainThread  ] [INFO ]  PROGRESS: at sentence #50280000, processed 988173393 words, keeping 3104673 word types
2017-09-27 17:16:17,893 [MainThread  ] [INFO ]  701: ../data/documents/436.json.gz
2017-09-27 17:16:19,435 [MainThread  ] [INFO ]  702: ../data/documents/462.json.gz
2017-09-27 17:16:24,973 [MainThread  ] [INFO ]  PROGRESS: at sentence #50290000, processed 988417356 words, keeping 3104930 word types
2017-09-27 17:16:26,444 [MainThread  ] [INFO ]  PROGRESS: at sentence #50300000, processed 988609677 words, keeping 3105090 word types
2017-09-27 17:16:28,055 [MainThread  ] [INFO ]  PROGRESS: at sentence #50310000, processed 988821279 words, keeping 3105310 word types
2017-09-27 17:16:29,494 [MainThread  ] [INFO ]  PROGRESS: at sentence #50320000, processed 989010592 words, keeping 3105468 word types
2017-09-27 17:16:30,919 [MainThread  ] [INFO ]  PROGRESS: at sentence #50330000, processed 989191045 words, keeping 3105705 word types
2017-09-27 17:16:32,336 

2017-09-27 17:18:13,674 [MainThread  ] [INFO ]  PROGRESS: at sentence #50850000, processed 999020903 words, keeping 3119097 word types
2017-09-27 17:18:15,212 [MainThread  ] [INFO ]  PROGRESS: at sentence #50860000, processed 999218134 words, keeping 3119423 word types
2017-09-27 17:18:16,746 [MainThread  ] [INFO ]  PROGRESS: at sentence #50870000, processed 999413446 words, keeping 3119598 word types
2017-09-27 17:18:18,153 [MainThread  ] [INFO ]  PROGRESS: at sentence #50880000, processed 999593501 words, keeping 3119902 word types
2017-09-27 17:18:19,730 [MainThread  ] [INFO ]  PROGRESS: at sentence #50890000, processed 999793862 words, keeping 3120161 word types
2017-09-27 17:18:21,332 [MainThread  ] [INFO ]  PROGRESS: at sentence #50900000, processed 1000001532 words, keeping 3120347 word types
2017-09-27 17:18:22,736 [MainThread  ] [INFO ]  PROGRESS: at sentence #50910000, processed 1000178379 words, keeping 3120537 word types
2017-09-27 17:18:24,169 [MainThread  ] [INFO ]  PROGR

2017-09-27 17:20:02,477 [MainThread  ] [INFO ]  PROGRESS: at sentence #51410000, processed 1009963940 words, keeping 3142426 word types
2017-09-27 17:20:04,286 [MainThread  ] [INFO ]  PROGRESS: at sentence #51420000, processed 1010200477 words, keeping 3142535 word types
2017-09-27 17:20:06,018 [MainThread  ] [INFO ]  PROGRESS: at sentence #51430000, processed 1010428249 words, keeping 3142661 word types
2017-09-27 17:20:07,807 [MainThread  ] [INFO ]  PROGRESS: at sentence #51440000, processed 1010654984 words, keeping 3142754 word types
2017-09-27 17:20:09,191 [MainThread  ] [INFO ]  716: ../data/documents/886.json.gz
2017-09-27 17:20:14,072 [MainThread  ] [INFO ]  PROGRESS: at sentence #51450000, processed 1010868306 words, keeping 3142868 word types
2017-09-27 17:20:15,668 [MainThread  ] [INFO ]  PROGRESS: at sentence #51460000, processed 1011075180 words, keeping 3142998 word types
2017-09-27 17:20:17,328 [MainThread  ] [INFO ]  PROGRESS: at sentence #51470000, processed 1011283294

2017-09-27 17:21:55,015 [MainThread  ] [INFO ]  PROGRESS: at sentence #51970000, processed 1020900056 words, keeping 3150944 word types
2017-09-27 17:21:56,457 [MainThread  ] [INFO ]  PROGRESS: at sentence #51980000, processed 1021089007 words, keeping 3151104 word types
2017-09-27 17:21:57,958 [MainThread  ] [INFO ]  PROGRESS: at sentence #51990000, processed 1021281534 words, keeping 3151319 word types
2017-09-27 17:21:59,427 [MainThread  ] [INFO ]  PROGRESS: at sentence #52000000, processed 1021468209 words, keeping 3151563 word types
2017-09-27 17:22:00,957 [MainThread  ] [INFO ]  PROGRESS: at sentence #52010000, processed 1021665195 words, keeping 3151722 word types
2017-09-27 17:22:02,458 [MainThread  ] [INFO ]  PROGRESS: at sentence #52020000, processed 1021858713 words, keeping 3151933 word types
2017-09-27 17:22:03,384 [MainThread  ] [INFO ]  723: ../data/documents/7.json.gz
2017-09-27 17:22:07,733 [MainThread  ] [INFO ]  PROGRESS: at sentence #52030000, processed 1022040066 w

2017-09-27 17:23:38,947 [MainThread  ] [INFO ]  PROGRESS: at sentence #52510000, processed 1031072018 words, keeping 3184006 word types
2017-09-27 17:23:40,154 [MainThread  ] [INFO ]  734: ../data/documents/531.json.gz
2017-09-27 17:23:41,194 [MainThread  ] [INFO ]  PROGRESS: at sentence #52520000, processed 1031279641 words, keeping 3184136 word types
2017-09-27 17:23:43,407 [MainThread  ] [INFO ]  PROGRESS: at sentence #52530000, processed 1031566460 words, keeping 3184381 word types
2017-09-27 17:23:44,225 [MainThread  ] [INFO ]  735: ../data/documents/876.json.gz
2017-09-27 17:23:50,158 [MainThread  ] [INFO ]  PROGRESS: at sentence #52540000, processed 1031788359 words, keeping 3184557 word types
2017-09-27 17:23:51,793 [MainThread  ] [INFO ]  PROGRESS: at sentence #52550000, processed 1031993222 words, keeping 3184720 word types
2017-09-27 17:23:53,404 [MainThread  ] [INFO ]  PROGRESS: at sentence #52560000, processed 1032201890 words, keeping 3184926 word types
2017-09-27 17:23:5

2017-09-27 17:25:36,523 [MainThread  ] [INFO ]  PROGRESS: at sentence #53050000, processed 1042308412 words, keeping 3196230 word types
2017-09-27 17:25:37,949 [MainThread  ] [INFO ]  PROGRESS: at sentence #53060000, processed 1042490521 words, keeping 3196587 word types
2017-09-27 17:25:39,488 [MainThread  ] [INFO ]  PROGRESS: at sentence #53070000, processed 1042688825 words, keeping 3196744 word types
2017-09-27 17:25:41,006 [MainThread  ] [INFO ]  PROGRESS: at sentence #53080000, processed 1042879005 words, keeping 3196863 word types
2017-09-27 17:25:42,569 [MainThread  ] [INFO ]  PROGRESS: at sentence #53090000, processed 1043077047 words, keeping 3197128 word types
2017-09-27 17:25:43,938 [MainThread  ] [INFO ]  PROGRESS: at sentence #53100000, processed 1043250328 words, keeping 3197285 word types
2017-09-27 17:25:45,541 [MainThread  ] [INFO ]  PROGRESS: at sentence #53110000, processed 1043459887 words, keeping 3197432 word types
2017-09-27 17:25:47,074 [MainThread  ] [INFO ]  

2017-09-27 17:27:29,459 [MainThread  ] [INFO ]  PROGRESS: at sentence #53630000, processed 1053657354 words, keeping 3208348 word types
2017-09-27 17:27:30,855 [MainThread  ] [INFO ]  PROGRESS: at sentence #53640000, processed 1053842067 words, keeping 3208944 word types
2017-09-27 17:27:32,386 [MainThread  ] [INFO ]  PROGRESS: at sentence #53650000, processed 1054041163 words, keeping 3209065 word types
2017-09-27 17:27:33,845 [MainThread  ] [INFO ]  PROGRESS: at sentence #53660000, processed 1054232714 words, keeping 3209268 word types
2017-09-27 17:27:34,963 [MainThread  ] [INFO ]  749: ../data/documents/799.json.gz
2017-09-27 17:27:37,617 [MainThread  ] [INFO ]  PROGRESS: at sentence #53670000, processed 1054417780 words, keeping 3209367 word types
2017-09-27 17:27:39,098 [MainThread  ] [INFO ]  PROGRESS: at sentence #53680000, processed 1054610988 words, keeping 3209604 word types
2017-09-27 17:27:40,462 [MainThread  ] [INFO ]  PROGRESS: at sentence #53690000, processed 1054786030

2017-09-27 17:29:21,146 [MainThread  ] [INFO ]  PROGRESS: at sentence #54190000, processed 1064256979 words, keeping 3222615 word types
2017-09-27 17:29:22,609 [MainThread  ] [INFO ]  PROGRESS: at sentence #54200000, processed 1064444248 words, keeping 3222797 word types
2017-09-27 17:29:24,178 [MainThread  ] [INFO ]  PROGRESS: at sentence #54210000, processed 1064645358 words, keeping 3222929 word types
2017-09-27 17:29:25,573 [MainThread  ] [INFO ]  PROGRESS: at sentence #54220000, processed 1064825713 words, keeping 3223165 word types
2017-09-27 17:29:27,131 [MainThread  ] [INFO ]  PROGRESS: at sentence #54230000, processed 1065027193 words, keeping 3223367 word types
2017-09-27 17:29:28,607 [MainThread  ] [INFO ]  PROGRESS: at sentence #54240000, processed 1065216442 words, keeping 3223550 word types
2017-09-27 17:29:30,126 [MainThread  ] [INFO ]  PROGRESS: at sentence #54250000, processed 1065412560 words, keeping 3223718 word types
2017-09-27 17:29:31,589 [MainThread  ] [INFO ]  

2017-09-27 17:31:08,232 [MainThread  ] [INFO ]  763: ../data/documents/582.json.gz
2017-09-27 17:31:09,207 [MainThread  ] [INFO ]  PROGRESS: at sentence #54750000, processed 1075339172 words, keeping 3234094 word types
2017-09-27 17:31:11,311 [MainThread  ] [INFO ]  PROGRESS: at sentence #54760000, processed 1075623735 words, keeping 3234310 word types
2017-09-27 17:31:12,107 [MainThread  ] [INFO ]  764: ../data/documents/523.json.gz
2017-09-27 17:31:13,957 [MainThread  ] [INFO ]  PROGRESS: at sentence #54770000, processed 1075906020 words, keeping 3234553 word types
2017-09-27 17:31:15,860 [MainThread  ] [INFO ]  765: ../data/documents/20.json.gz
2017-09-27 17:31:19,505 [MainThread  ] [INFO ]  PROGRESS: at sentence #54780000, processed 1076177402 words, keeping 3234797 word types
2017-09-27 17:31:20,803 [MainThread  ] [INFO ]  PROGRESS: at sentence #54790000, processed 1076343354 words, keeping 3235965 word types
2017-09-27 17:31:22,239 [MainThread  ] [INFO ]  PROGRESS: at sentence #5

2017-09-27 17:32:59,152 [MainThread  ] [INFO ]  PROGRESS: at sentence #55300000, processed 1085881473 words, keeping 3252397 word types
2017-09-27 17:33:00,662 [MainThread  ] [INFO ]  PROGRESS: at sentence #55310000, processed 1086074178 words, keeping 3252574 word types
2017-09-27 17:33:02,276 [MainThread  ] [INFO ]  PROGRESS: at sentence #55320000, processed 1086276557 words, keeping 3252715 word types
2017-09-27 17:33:03,947 [MainThread  ] [INFO ]  PROGRESS: at sentence #55330000, processed 1086479273 words, keeping 3252858 word types
2017-09-27 17:33:04,921 [MainThread  ] [INFO ]  772: ../data/documents/485.json.gz
2017-09-27 17:33:06,304 [MainThread  ] [INFO ]  PROGRESS: at sentence #55340000, processed 1086708989 words, keeping 3253050 word types
2017-09-27 17:33:07,855 [MainThread  ] [INFO ]  773: ../data/documents/226.json.gz
2017-09-27 17:33:15,412 [MainThread  ] [INFO ]  PROGRESS: at sentence #55350000, processed 1086964691 words, keeping 3253237 word types
2017-09-27 17:33:1

2017-09-27 17:34:51,318 [MainThread  ] [INFO ]  PROGRESS: at sentence #55860000, processed 1096484682 words, keeping 3265790 word types
2017-09-27 17:34:52,646 [MainThread  ] [INFO ]  PROGRESS: at sentence #55870000, processed 1096655793 words, keeping 3266119 word types
2017-09-27 17:34:54,141 [MainThread  ] [INFO ]  PROGRESS: at sentence #55880000, processed 1096839171 words, keeping 3266314 word types
2017-09-27 17:34:55,591 [MainThread  ] [INFO ]  PROGRESS: at sentence #55890000, processed 1097021444 words, keeping 3266522 word types
2017-09-27 17:34:57,050 [MainThread  ] [INFO ]  PROGRESS: at sentence #55900000, processed 1097209105 words, keeping 3266709 word types
2017-09-27 17:34:57,794 [MainThread  ] [INFO ]  780: ../data/documents/915.json.gz
2017-09-27 17:35:00,769 [MainThread  ] [INFO ]  PROGRESS: at sentence #55910000, processed 1097393074 words, keeping 3267043 word types
2017-09-27 17:35:02,449 [MainThread  ] [INFO ]  PROGRESS: at sentence #55920000, processed 1097607904

2017-09-27 17:36:42,152 [MainThread  ] [INFO ]  PROGRESS: at sentence #56420000, processed 1107202401 words, keeping 3290556 word types
2017-09-27 17:36:43,546 [MainThread  ] [INFO ]  PROGRESS: at sentence #56430000, processed 1107378775 words, keeping 3290800 word types
2017-09-27 17:36:45,100 [MainThread  ] [INFO ]  PROGRESS: at sentence #56440000, processed 1107575861 words, keeping 3291049 word types
2017-09-27 17:36:46,536 [MainThread  ] [INFO ]  PROGRESS: at sentence #56450000, processed 1107756376 words, keeping 3291197 word types
2017-09-27 17:36:48,015 [MainThread  ] [INFO ]  PROGRESS: at sentence #56460000, processed 1107942360 words, keeping 3291356 word types
2017-09-27 17:36:49,479 [MainThread  ] [INFO ]  PROGRESS: at sentence #56470000, processed 1108132077 words, keeping 3291497 word types
2017-09-27 17:36:51,025 [MainThread  ] [INFO ]  PROGRESS: at sentence #56480000, processed 1108329915 words, keeping 3291659 word types
2017-09-27 17:36:51,330 [MainThread  ] [INFO ]  

2017-09-27 17:38:34,052 [MainThread  ] [INFO ]  PROGRESS: at sentence #56980000, processed 1118171937 words, keeping 3300517 word types
2017-09-27 17:38:35,721 [MainThread  ] [INFO ]  PROGRESS: at sentence #56990000, processed 1118387340 words, keeping 3300661 word types
2017-09-27 17:38:37,351 [MainThread  ] [INFO ]  PROGRESS: at sentence #57000000, processed 1118589771 words, keeping 3300854 word types
2017-09-27 17:38:38,936 [MainThread  ] [INFO ]  PROGRESS: at sentence #57010000, processed 1118792941 words, keeping 3301004 word types
2017-09-27 17:38:39,304 [MainThread  ] [INFO ]  794: ../data/documents/334.json.gz
2017-09-27 17:38:44,240 [MainThread  ] [INFO ]  PROGRESS: at sentence #57020000, processed 1118981637 words, keeping 3303435 word types
2017-09-27 17:38:45,771 [MainThread  ] [INFO ]  PROGRESS: at sentence #57030000, processed 1119185239 words, keeping 3304773 word types
2017-09-27 17:38:47,193 [MainThread  ] [INFO ]  PROGRESS: at sentence #57040000, processed 1119375137

2017-09-27 17:40:22,522 [MainThread  ] [INFO ]  PROGRESS: at sentence #57540000, processed 1128787615 words, keeping 3334418 word types
2017-09-27 17:40:23,571 [MainThread  ] [INFO ]  802: ../data/documents/625.json.gz
2017-09-27 17:40:25,103 [MainThread  ] [INFO ]  PROGRESS: at sentence #57550000, processed 1128996037 words, keeping 3336022 word types
2017-09-27 17:40:26,930 [MainThread  ] [INFO ]  PROGRESS: at sentence #57560000, processed 1129231047 words, keeping 3336198 word types
2017-09-27 17:40:28,680 [MainThread  ] [INFO ]  PROGRESS: at sentence #57570000, processed 1129457712 words, keeping 3336317 word types
2017-09-27 17:40:29,906 [MainThread  ] [INFO ]  803: ../data/documents/804.json.gz
2017-09-27 17:40:35,211 [MainThread  ] [INFO ]  PROGRESS: at sentence #57580000, processed 1129674797 words, keeping 3336453 word types
2017-09-27 17:40:36,797 [MainThread  ] [INFO ]  PROGRESS: at sentence #57590000, processed 1129880344 words, keeping 3336615 word types
2017-09-27 17:40:3

2017-09-27 17:42:19,196 [MainThread  ] [INFO ]  PROGRESS: at sentence #58100000, processed 1139717788 words, keeping 3347110 word types
2017-09-27 17:42:20,659 [MainThread  ] [INFO ]  PROGRESS: at sentence #58110000, processed 1139903597 words, keeping 3347321 word types
2017-09-27 17:42:22,077 [MainThread  ] [INFO ]  PROGRESS: at sentence #58120000, processed 1140077510 words, keeping 3347523 word types
2017-09-27 17:42:23,474 [MainThread  ] [INFO ]  PROGRESS: at sentence #58130000, processed 1140246440 words, keeping 3347737 word types
2017-09-27 17:42:24,964 [MainThread  ] [INFO ]  PROGRESS: at sentence #58140000, processed 1140433600 words, keeping 3348135 word types
2017-09-27 17:42:26,442 [MainThread  ] [INFO ]  PROGRESS: at sentence #58150000, processed 1140628821 words, keeping 3348341 word types
2017-09-27 17:42:27,898 [MainThread  ] [INFO ]  PROGRESS: at sentence #58160000, processed 1140814508 words, keeping 3348608 word types
2017-09-27 17:42:29,417 [MainThread  ] [INFO ]  

2017-09-27 17:44:08,149 [MainThread  ] [INFO ]  PROGRESS: at sentence #58660000, processed 1150463741 words, keeping 3362185 word types
2017-09-27 17:44:09,625 [MainThread  ] [INFO ]  PROGRESS: at sentence #58670000, processed 1150649947 words, keeping 3362474 word types
2017-09-27 17:44:11,376 [MainThread  ] [INFO ]  PROGRESS: at sentence #58680000, processed 1150868733 words, keeping 3362718 word types
2017-09-27 17:44:12,814 [MainThread  ] [INFO ]  PROGRESS: at sentence #58690000, processed 1151046420 words, keeping 3362993 word types
2017-09-27 17:44:14,289 [MainThread  ] [INFO ]  PROGRESS: at sentence #58700000, processed 1151237108 words, keeping 3363112 word types
2017-09-27 17:44:15,843 [MainThread  ] [INFO ]  PROGRESS: at sentence #58710000, processed 1151436420 words, keeping 3363304 word types
2017-09-27 17:44:17,289 [MainThread  ] [INFO ]  PROGRESS: at sentence #58720000, processed 1151627384 words, keeping 3363490 word types
2017-09-27 17:44:18,889 [MainThread  ] [INFO ]  

2017-09-27 17:45:54,510 [MainThread  ] [INFO ]  PROGRESS: at sentence #59230000, processed 1161154934 words, keeping 3375842 word types
2017-09-27 17:45:55,084 [MainThread  ] [INFO ]  822: ../data/documents/470.json.gz
2017-09-27 17:46:04,855 [MainThread  ] [INFO ]  PROGRESS: at sentence #59240000, processed 1161349390 words, keeping 3376084 word types
2017-09-27 17:46:06,354 [MainThread  ] [INFO ]  PROGRESS: at sentence #59250000, processed 1161536642 words, keeping 3376407 word types
2017-09-27 17:46:07,862 [MainThread  ] [INFO ]  PROGRESS: at sentence #59260000, processed 1161726127 words, keeping 3376769 word types
2017-09-27 17:46:09,210 [MainThread  ] [INFO ]  PROGRESS: at sentence #59270000, processed 1161899225 words, keeping 3376990 word types
2017-09-27 17:46:10,656 [MainThread  ] [INFO ]  PROGRESS: at sentence #59280000, processed 1162084234 words, keeping 3377151 word types
2017-09-27 17:46:12,141 [MainThread  ] [INFO ]  PROGRESS: at sentence #59290000, processed 1162268317

2017-09-27 17:47:44,029 [MainThread  ] [INFO ]  830: ../data/documents/506.json.gz
2017-09-27 17:47:53,709 [MainThread  ] [INFO ]  PROGRESS: at sentence #59790000, processed 1171797528 words, keeping 3388149 word types
2017-09-27 17:47:55,090 [MainThread  ] [INFO ]  PROGRESS: at sentence #59800000, processed 1171969901 words, keeping 3388345 word types
2017-09-27 17:47:56,485 [MainThread  ] [INFO ]  PROGRESS: at sentence #59810000, processed 1172147000 words, keeping 3388745 word types
2017-09-27 17:47:57,977 [MainThread  ] [INFO ]  PROGRESS: at sentence #59820000, processed 1172332784 words, keeping 3388900 word types
2017-09-27 17:47:59,438 [MainThread  ] [INFO ]  PROGRESS: at sentence #59830000, processed 1172517242 words, keeping 3389190 word types
2017-09-27 17:48:00,835 [MainThread  ] [INFO ]  PROGRESS: at sentence #59840000, processed 1172689225 words, keeping 3389427 word types
2017-09-27 17:48:02,400 [MainThread  ] [INFO ]  PROGRESS: at sentence #59850000, processed 1172876953

2017-09-27 17:49:41,441 [MainThread  ] [INFO ]  PROGRESS: at sentence #60370000, processed 1182925292 words, keeping 3402299 word types
2017-09-27 17:49:43,001 [MainThread  ] [INFO ]  PROGRESS: at sentence #60380000, processed 1183113809 words, keeping 3402472 word types
2017-09-27 17:49:44,664 [MainThread  ] [INFO ]  PROGRESS: at sentence #60390000, processed 1183321907 words, keeping 3402572 word types
2017-09-27 17:49:46,298 [MainThread  ] [INFO ]  PROGRESS: at sentence #60400000, processed 1183526968 words, keeping 3402715 word types
2017-09-27 17:49:47,563 [MainThread  ] [INFO ]  834: ../data/documents/425.json.gz
2017-09-27 17:49:53,361 [MainThread  ] [INFO ]  PROGRESS: at sentence #60410000, processed 1183712722 words, keeping 3402830 word types
2017-09-27 17:49:54,790 [MainThread  ] [INFO ]  PROGRESS: at sentence #60420000, processed 1183893186 words, keeping 3402978 word types
2017-09-27 17:49:56,302 [MainThread  ] [INFO ]  PROGRESS: at sentence #60430000, processed 1184082021

2017-09-27 17:51:35,294 [MainThread  ] [INFO ]  PROGRESS: at sentence #60950000, processed 1193893826 words, keeping 3414948 word types
2017-09-27 17:51:36,867 [MainThread  ] [INFO ]  PROGRESS: at sentence #60960000, processed 1194098591 words, keeping 3415268 word types
2017-09-27 17:51:38,348 [MainThread  ] [INFO ]  PROGRESS: at sentence #60970000, processed 1194275933 words, keeping 3415418 word types
2017-09-27 17:51:39,876 [MainThread  ] [INFO ]  PROGRESS: at sentence #60980000, processed 1194460181 words, keeping 3416048 word types
2017-09-27 17:51:41,601 [MainThread  ] [INFO ]  PROGRESS: at sentence #60990000, processed 1194681291 words, keeping 3416234 word types
2017-09-27 17:51:43,035 [MainThread  ] [INFO ]  PROGRESS: at sentence #61000000, processed 1194863378 words, keeping 3416426 word types
2017-09-27 17:51:44,292 [MainThread  ] [INFO ]  839: ../data/documents/372.json.gz
2017-09-27 17:51:47,135 [MainThread  ] [INFO ]  PROGRESS: at sentence #61010000, processed 1195056639

2017-09-27 17:53:25,622 [MainThread  ] [INFO ]  PROGRESS: at sentence #61530000, processed 1204797708 words, keeping 3427790 word types
2017-09-27 17:53:27,171 [MainThread  ] [INFO ]  PROGRESS: at sentence #61540000, processed 1204988371 words, keeping 3428068 word types
2017-09-27 17:53:28,658 [MainThread  ] [INFO ]  PROGRESS: at sentence #61550000, processed 1205177952 words, keeping 3428255 word types
2017-09-27 17:53:29,077 [MainThread  ] [INFO ]  844: ../data/documents/243.json.gz
2017-09-27 17:53:31,944 [MainThread  ] [INFO ]  PROGRESS: at sentence #61560000, processed 1205362416 words, keeping 3428459 word types
2017-09-27 17:53:33,386 [MainThread  ] [INFO ]  PROGRESS: at sentence #61570000, processed 1205547340 words, keeping 3428699 word types
2017-09-27 17:53:34,784 [MainThread  ] [INFO ]  PROGRESS: at sentence #61580000, processed 1205726530 words, keeping 3428894 word types
2017-09-27 17:53:36,224 [MainThread  ] [INFO ]  PROGRESS: at sentence #61590000, processed 1205907742

2017-09-27 17:55:25,867 [MainThread  ] [INFO ]  PROGRESS: at sentence #62090000, processed 1215954846 words, keeping 3437941 word types
2017-09-27 17:55:27,470 [MainThread  ] [INFO ]  PROGRESS: at sentence #62100000, processed 1216156164 words, keeping 3438092 word types
2017-09-27 17:55:29,020 [MainThread  ] [INFO ]  PROGRESS: at sentence #62110000, processed 1216353832 words, keeping 3438204 word types
2017-09-27 17:55:30,576 [MainThread  ] [INFO ]  PROGRESS: at sentence #62120000, processed 1216553515 words, keeping 3438368 word types
2017-09-27 17:55:32,100 [MainThread  ] [INFO ]  PROGRESS: at sentence #62130000, processed 1216747823 words, keeping 3438502 word types
2017-09-27 17:55:33,647 [MainThread  ] [INFO ]  PROGRESS: at sentence #62140000, processed 1216943794 words, keeping 3438718 word types
2017-09-27 17:55:35,215 [MainThread  ] [INFO ]  PROGRESS: at sentence #62150000, processed 1217147400 words, keeping 3438881 word types
2017-09-27 17:55:36,737 [MainThread  ] [INFO ]  

2017-09-27 17:57:11,476 [MainThread  ] [INFO ]  PROGRESS: at sentence #62660000, processed 1227086440 words, keeping 3447773 word types
2017-09-27 17:57:12,961 [MainThread  ] [INFO ]  PROGRESS: at sentence #62670000, processed 1227268980 words, keeping 3447934 word types
2017-09-27 17:57:14,531 [MainThread  ] [INFO ]  PROGRESS: at sentence #62680000, processed 1227459580 words, keeping 3448065 word types
2017-09-27 17:57:15,631 [MainThread  ] [INFO ]  857: ../data/documents/454.json.gz
2017-09-27 17:57:20,719 [MainThread  ] [INFO ]  PROGRESS: at sentence #62690000, processed 1227657239 words, keeping 3448259 word types
2017-09-27 17:57:22,142 [MainThread  ] [INFO ]  PROGRESS: at sentence #62700000, processed 1227840828 words, keeping 3448438 word types
2017-09-27 17:57:23,558 [MainThread  ] [INFO ]  PROGRESS: at sentence #62710000, processed 1228019771 words, keeping 3448609 word types
2017-09-27 17:57:25,062 [MainThread  ] [INFO ]  PROGRESS: at sentence #62720000, processed 1228210380

2017-09-27 17:59:05,973 [MainThread  ] [INFO ]  PROGRESS: at sentence #63220000, processed 1237964861 words, keeping 3457143 word types
2017-09-27 17:59:07,485 [MainThread  ] [INFO ]  PROGRESS: at sentence #63230000, processed 1238154907 words, keeping 3457224 word types
2017-09-27 17:59:09,089 [MainThread  ] [INFO ]  PROGRESS: at sentence #63240000, processed 1238354609 words, keeping 3457351 word types
2017-09-27 17:59:09,958 [MainThread  ] [INFO ]  865: ../data/documents/410.json.gz
2017-09-27 17:59:12,808 [MainThread  ] [INFO ]  PROGRESS: at sentence #63250000, processed 1238560330 words, keeping 3457493 word types
2017-09-27 17:59:14,336 [MainThread  ] [INFO ]  PROGRESS: at sentence #63260000, processed 1238748334 words, keeping 3457660 word types
2017-09-27 17:59:15,834 [MainThread  ] [INFO ]  PROGRESS: at sentence #63270000, processed 1238936093 words, keeping 3457912 word types
2017-09-27 17:59:17,438 [MainThread  ] [INFO ]  PROGRESS: at sentence #63280000, processed 1239140069

2017-09-27 18:00:59,874 [MainThread  ] [INFO ]  PROGRESS: at sentence #63800000, processed 1249024895 words, keeping 3468133 word types
2017-09-27 18:01:01,405 [MainThread  ] [INFO ]  PROGRESS: at sentence #63810000, processed 1249221464 words, keeping 3468236 word types
2017-09-27 18:01:02,905 [MainThread  ] [INFO ]  PROGRESS: at sentence #63820000, processed 1249409377 words, keeping 3468392 word types
2017-09-27 18:01:03,689 [MainThread  ] [INFO ]  870: ../data/documents/870.json.gz
2017-09-27 18:01:13,177 [MainThread  ] [INFO ]  PROGRESS: at sentence #63830000, processed 1249604538 words, keeping 3468599 word types
2017-09-27 18:01:14,621 [MainThread  ] [INFO ]  PROGRESS: at sentence #63840000, processed 1249789251 words, keeping 3468705 word types
2017-09-27 18:01:16,201 [MainThread  ] [INFO ]  PROGRESS: at sentence #63850000, processed 1249988987 words, keeping 3468780 word types
2017-09-27 18:01:17,755 [MainThread  ] [INFO ]  PROGRESS: at sentence #63860000, processed 1250184259

2017-09-27 18:02:53,043 [MainThread  ] [INFO ]  PROGRESS: at sentence #64360000, processed 1260290467 words, keeping 3478855 word types
2017-09-27 18:02:54,509 [MainThread  ] [INFO ]  PROGRESS: at sentence #64370000, processed 1260480465 words, keeping 3479149 word types
2017-09-27 18:02:55,950 [MainThread  ] [INFO ]  PROGRESS: at sentence #64380000, processed 1260664553 words, keeping 3479463 word types
2017-09-27 18:02:57,339 [MainThread  ] [INFO ]  PROGRESS: at sentence #64390000, processed 1260840333 words, keeping 3479722 word types
2017-09-27 18:02:58,195 [MainThread  ] [INFO ]  878: ../data/documents/422.json.gz
2017-09-27 18:03:04,646 [MainThread  ] [INFO ]  PROGRESS: at sentence #64400000, processed 1261026065 words, keeping 3479924 word types
2017-09-27 18:03:06,134 [MainThread  ] [INFO ]  PROGRESS: at sentence #64410000, processed 1261218290 words, keeping 3480177 word types
2017-09-27 18:03:07,684 [MainThread  ] [INFO ]  PROGRESS: at sentence #64420000, processed 1261416908

2017-09-27 18:04:46,763 [MainThread  ] [INFO ]  PROGRESS: at sentence #64930000, processed 1271405360 words, keeping 3490615 word types
2017-09-27 18:04:48,249 [MainThread  ] [INFO ]  PROGRESS: at sentence #64940000, processed 1271594227 words, keeping 3490791 word types
2017-09-27 18:04:49,777 [MainThread  ] [INFO ]  PROGRESS: at sentence #64950000, processed 1271792042 words, keeping 3491037 word types
2017-09-27 18:04:51,283 [MainThread  ] [INFO ]  PROGRESS: at sentence #64960000, processed 1271984657 words, keeping 3491230 word types
2017-09-27 18:04:52,403 [MainThread  ] [INFO ]  884: ../data/documents/252.json.gz
2017-09-27 18:04:57,142 [MainThread  ] [INFO ]  PROGRESS: at sentence #64970000, processed 1272170198 words, keeping 3491423 word types
2017-09-27 18:04:58,599 [MainThread  ] [INFO ]  PROGRESS: at sentence #64980000, processed 1272350472 words, keeping 3491616 word types
2017-09-27 18:05:00,082 [MainThread  ] [INFO ]  PROGRESS: at sentence #64990000, processed 1272533680

2017-09-27 18:06:37,135 [MainThread  ] [INFO ]  PROGRESS: at sentence #65500000, processed 1282059714 words, keeping 3521754 word types
2017-09-27 18:06:38,547 [MainThread  ] [INFO ]  PROGRESS: at sentence #65510000, processed 1282236964 words, keeping 3522015 word types
2017-09-27 18:06:39,669 [MainThread  ] [INFO ]  890: ../data/documents/742.json.gz
2017-09-27 18:06:44,618 [MainThread  ] [INFO ]  PROGRESS: at sentence #65520000, processed 1282401847 words, keeping 3522297 word types
2017-09-27 18:06:46,160 [MainThread  ] [INFO ]  PROGRESS: at sentence #65530000, processed 1282601281 words, keeping 3522448 word types
2017-09-27 18:06:47,651 [MainThread  ] [INFO ]  PROGRESS: at sentence #65540000, processed 1282782765 words, keeping 3522618 word types
2017-09-27 18:06:49,168 [MainThread  ] [INFO ]  PROGRESS: at sentence #65550000, processed 1282978184 words, keeping 3522754 word types
2017-09-27 18:06:50,729 [MainThread  ] [INFO ]  PROGRESS: at sentence #65560000, processed 1283179687

2017-09-27 18:08:34,566 [MainThread  ] [INFO ]  PROGRESS: at sentence #66050000, processed 1293201562 words, keeping 3530461 word types
2017-09-27 18:08:36,130 [MainThread  ] [INFO ]  PROGRESS: at sentence #66060000, processed 1293392580 words, keeping 3530580 word types
2017-09-27 18:08:37,552 [MainThread  ] [INFO ]  PROGRESS: at sentence #66070000, processed 1293568928 words, keeping 3530730 word types
2017-09-27 18:08:39,084 [MainThread  ] [INFO ]  PROGRESS: at sentence #66080000, processed 1293759504 words, keeping 3530864 word types
2017-09-27 18:08:39,697 [MainThread  ] [INFO ]  899: ../data/documents/286.json.gz
2017-09-27 18:08:42,372 [MainThread  ] [INFO ]  PROGRESS: at sentence #66090000, processed 1293950127 words, keeping 3532611 word types
2017-09-27 18:08:43,893 [MainThread  ] [INFO ]  PROGRESS: at sentence #66100000, processed 1294141719 words, keeping 3536125 word types
2017-09-27 18:08:45,393 [MainThread  ] [INFO ]  PROGRESS: at sentence #66110000, processed 1294336657

2017-09-27 18:10:24,548 [MainThread  ] [INFO ]  PROGRESS: at sentence #66600000, processed 1303913540 words, keeping 3558438 word types
2017-09-27 18:10:26,022 [MainThread  ] [INFO ]  PROGRESS: at sentence #66610000, processed 1304101179 words, keeping 3558643 word types
2017-09-27 18:10:27,689 [MainThread  ] [INFO ]  PROGRESS: at sentence #66620000, processed 1304309475 words, keeping 3558956 word types
2017-09-27 18:10:28,817 [MainThread  ] [INFO ]  908: ../data/documents/944.json.gz
2017-09-27 18:10:35,583 [MainThread  ] [INFO ]  PROGRESS: at sentence #66630000, processed 1304493054 words, keeping 3559085 word types
2017-09-27 18:10:36,989 [MainThread  ] [INFO ]  PROGRESS: at sentence #66640000, processed 1304674169 words, keeping 3559182 word types
2017-09-27 18:10:38,485 [MainThread  ] [INFO ]  PROGRESS: at sentence #66650000, processed 1304862614 words, keeping 3559314 word types
2017-09-27 18:10:40,039 [MainThread  ] [INFO ]  PROGRESS: at sentence #66660000, processed 1305064369

2017-09-27 18:12:16,335 [MainThread  ] [INFO ]  PROGRESS: at sentence #67150000, processed 1315016581 words, keeping 3575457 word types
2017-09-27 18:12:17,786 [MainThread  ] [INFO ]  PROGRESS: at sentence #67160000, processed 1315200571 words, keeping 3575602 word types
2017-09-27 18:12:18,701 [MainThread  ] [INFO ]  918: ../data/documents/945.json.gz
2017-09-27 18:12:23,613 [MainThread  ] [INFO ]  PROGRESS: at sentence #67170000, processed 1315386230 words, keeping 3575790 word types
2017-09-27 18:12:25,135 [MainThread  ] [INFO ]  PROGRESS: at sentence #67180000, processed 1315583541 words, keeping 3575930 word types
2017-09-27 18:12:26,666 [MainThread  ] [INFO ]  PROGRESS: at sentence #67190000, processed 1315777425 words, keeping 3576082 word types
2017-09-27 18:12:28,118 [MainThread  ] [INFO ]  PROGRESS: at sentence #67200000, processed 1315967013 words, keeping 3576238 word types
2017-09-27 18:12:29,626 [MainThread  ] [INFO ]  PROGRESS: at sentence #67210000, processed 1316158690

2017-09-27 18:14:12,274 [MainThread  ] [INFO ]  PROGRESS: at sentence #67700000, processed 1325837562 words, keeping 3584819 word types
2017-09-27 18:14:13,776 [MainThread  ] [INFO ]  PROGRESS: at sentence #67710000, processed 1326027793 words, keeping 3585026 word types
2017-09-27 18:14:15,238 [MainThread  ] [INFO ]  PROGRESS: at sentence #67720000, processed 1326215299 words, keeping 3585159 word types
2017-09-27 18:14:16,711 [MainThread  ] [INFO ]  PROGRESS: at sentence #67730000, processed 1326403390 words, keeping 3585260 word types
2017-09-27 18:14:18,267 [MainThread  ] [INFO ]  PROGRESS: at sentence #67740000, processed 1326603899 words, keeping 3585408 word types
2017-09-27 18:14:19,778 [MainThread  ] [INFO ]  PROGRESS: at sentence #67750000, processed 1326801472 words, keeping 3585518 word types
2017-09-27 18:14:21,321 [MainThread  ] [INFO ]  PROGRESS: at sentence #67760000, processed 1326992142 words, keeping 3585654 word types
2017-09-27 18:14:22,791 [MainThread  ] [INFO ]  

2017-09-27 18:16:00,715 [MainThread  ] [INFO ]  PROGRESS: at sentence #68260000, processed 1336757490 words, keeping 3594865 word types
2017-09-27 18:16:02,093 [MainThread  ] [INFO ]  PROGRESS: at sentence #68270000, processed 1336930312 words, keeping 3595186 word types
2017-09-27 18:16:03,420 [MainThread  ] [INFO ]  PROGRESS: at sentence #68280000, processed 1337097833 words, keeping 3596027 word types
2017-09-27 18:16:04,897 [MainThread  ] [INFO ]  PROGRESS: at sentence #68290000, processed 1337273884 words, keeping 3596772 word types
2017-09-27 18:16:06,396 [MainThread  ] [INFO ]  PROGRESS: at sentence #68300000, processed 1337453226 words, keeping 3597709 word types
2017-09-27 18:16:06,644 [MainThread  ] [INFO ]  936: ../data/documents/766.json.gz
2017-09-27 18:16:11,042 [MainThread  ] [INFO ]  PROGRESS: at sentence #68310000, processed 1337693508 words, keeping 3597872 word types
2017-09-27 18:16:12,689 [MainThread  ] [INFO ]  937: ../data/documents/501.json.gz
2017-09-27 18:16:1

2017-09-27 18:17:53,663 [MainThread  ] [INFO ]  PROGRESS: at sentence #68820000, processed 1347554477 words, keeping 3606970 word types
2017-09-27 18:17:55,204 [MainThread  ] [INFO ]  PROGRESS: at sentence #68830000, processed 1347758747 words, keeping 3607085 word types
2017-09-27 18:17:56,709 [MainThread  ] [INFO ]  PROGRESS: at sentence #68840000, processed 1347949650 words, keeping 3607182 word types
2017-09-27 18:17:58,184 [MainThread  ] [INFO ]  PROGRESS: at sentence #68850000, processed 1348136998 words, keeping 3607358 word types
2017-09-27 18:17:59,717 [MainThread  ] [INFO ]  PROGRESS: at sentence #68860000, processed 1348337750 words, keeping 3607517 word types
2017-09-27 18:18:01,295 [MainThread  ] [INFO ]  PROGRESS: at sentence #68870000, processed 1348540798 words, keeping 3607646 word types
2017-09-27 18:18:02,775 [MainThread  ] [INFO ]  PROGRESS: at sentence #68880000, processed 1348734312 words, keeping 3607731 word types
2017-09-27 18:18:03,517 [MainThread  ] [INFO ]  

2017-09-27 18:19:51,763 [MainThread  ] [INFO ]  PROGRESS: at sentence #69380000, processed 1359178180 words, keeping 3615736 word types
2017-09-27 18:19:53,286 [MainThread  ] [INFO ]  PROGRESS: at sentence #69390000, processed 1359375178 words, keeping 3615909 word types
2017-09-27 18:19:54,796 [MainThread  ] [INFO ]  PROGRESS: at sentence #69400000, processed 1359567118 words, keeping 3616019 word types
2017-09-27 18:19:56,307 [MainThread  ] [INFO ]  PROGRESS: at sentence #69410000, processed 1359764710 words, keeping 3616160 word types
2017-09-27 18:19:57,902 [MainThread  ] [INFO ]  PROGRESS: at sentence #69420000, processed 1359965213 words, keeping 3616289 word types
2017-09-27 18:19:59,388 [MainThread  ] [INFO ]  PROGRESS: at sentence #69430000, processed 1360154212 words, keeping 3616447 word types
2017-09-27 18:20:00,878 [MainThread  ] [INFO ]  PROGRESS: at sentence #69440000, processed 1360335950 words, keeping 3616643 word types
2017-09-27 18:20:02,359 [MainThread  ] [INFO ]  

2017-09-27 18:21:40,808 [MainThread  ] [INFO ]  PROGRESS: at sentence #69920000, processed 1370049277 words, keeping 3676429 word types
2017-09-27 18:21:41,347 [MainThread  ] [INFO ]  961: ../data/documents/239.json.gz
2017-09-27 18:21:43,074 [MainThread  ] [INFO ]  PROGRESS: at sentence #69930000, processed 1370277462 words, keeping 3676635 word types
2017-09-27 18:21:44,404 [MainThread  ] [INFO ]  962: ../data/documents/690.json.gz
2017-09-27 18:21:51,966 [MainThread  ] [INFO ]  PROGRESS: at sentence #69940000, processed 1370501527 words, keeping 3676790 word types
2017-09-27 18:21:53,511 [MainThread  ] [INFO ]  PROGRESS: at sentence #69950000, processed 1370703746 words, keeping 3676904 word types
2017-09-27 18:21:55,132 [MainThread  ] [INFO ]  PROGRESS: at sentence #69960000, processed 1370919339 words, keeping 3676990 word types
2017-09-27 18:21:56,791 [MainThread  ] [INFO ]  PROGRESS: at sentence #69970000, processed 1371133826 words, keeping 3677099 word types
2017-09-27 18:21:5

2017-09-27 18:23:35,918 [MainThread  ] [INFO ]  PROGRESS: at sentence #70480000, processed 1380759771 words, keeping 3709906 word types
2017-09-27 18:23:37,449 [MainThread  ] [INFO ]  PROGRESS: at sentence #70490000, processed 1380948130 words, keeping 3710006 word types
2017-09-27 18:23:39,035 [MainThread  ] [INFO ]  PROGRESS: at sentence #70500000, processed 1381149261 words, keeping 3710161 word types
2017-09-27 18:23:40,626 [MainThread  ] [INFO ]  PROGRESS: at sentence #70510000, processed 1381345422 words, keeping 3710238 word types
2017-09-27 18:23:42,158 [MainThread  ] [INFO ]  PROGRESS: at sentence #70520000, processed 1381534581 words, keeping 3710345 word types
2017-09-27 18:23:42,782 [MainThread  ] [INFO ]  968: ../data/documents/694.json.gz
2017-09-27 18:23:54,269 [MainThread  ] [INFO ]  PROGRESS: at sentence #70530000, processed 1381728984 words, keeping 3710447 word types
2017-09-27 18:23:55,822 [MainThread  ] [INFO ]  PROGRESS: at sentence #70540000, processed 1381921840

2017-09-27 18:25:25,793 [MainThread  ] [INFO ]  972: ../data/documents/302.json.gz
2017-09-27 18:25:31,460 [MainThread  ] [INFO ]  PROGRESS: at sentence #71060000, processed 1391762645 words, keeping 3719709 word types
2017-09-27 18:25:32,868 [MainThread  ] [INFO ]  PROGRESS: at sentence #71070000, processed 1391935534 words, keeping 3719867 word types
2017-09-27 18:25:34,244 [MainThread  ] [INFO ]  PROGRESS: at sentence #71080000, processed 1392108613 words, keeping 3720034 word types
2017-09-27 18:25:35,557 [MainThread  ] [INFO ]  PROGRESS: at sentence #71090000, processed 1392271762 words, keeping 3720203 word types
2017-09-27 18:25:37,077 [MainThread  ] [INFO ]  PROGRESS: at sentence #71100000, processed 1392454181 words, keeping 3720358 word types
2017-09-27 18:25:38,417 [MainThread  ] [INFO ]  PROGRESS: at sentence #71110000, processed 1392621191 words, keeping 3720524 word types
2017-09-27 18:25:39,892 [MainThread  ] [INFO ]  PROGRESS: at sentence #71120000, processed 1392804447

2017-09-27 18:27:17,627 [MainThread  ] [INFO ]  PROGRESS: at sentence #71600000, processed 1402329138 words, keeping 3756010 word types
2017-09-27 18:27:19,241 [MainThread  ] [INFO ]  PROGRESS: at sentence #71610000, processed 1402532974 words, keeping 3760537 word types
2017-09-27 18:27:20,794 [MainThread  ] [INFO ]  PROGRESS: at sentence #71620000, processed 1402730550 words, keeping 3763050 word types
2017-09-27 18:27:22,487 [MainThread  ] [INFO ]  PROGRESS: at sentence #71630000, processed 1402937766 words, keeping 3766834 word types
2017-09-27 18:27:24,064 [MainThread  ] [INFO ]  PROGRESS: at sentence #71640000, processed 1403129883 words, keeping 3769865 word types
2017-09-27 18:27:24,956 [MainThread  ] [INFO ]  983: ../data/documents/748.json.gz
2017-09-27 18:27:36,432 [MainThread  ] [INFO ]  PROGRESS: at sentence #71650000, processed 1403333918 words, keeping 3771408 word types
2017-09-27 18:27:37,892 [MainThread  ] [INFO ]  PROGRESS: at sentence #71660000, processed 1403518050

2017-09-27 18:29:11,258 [MainThread  ] [INFO ]  PROGRESS: at sentence #72160000, processed 1413331283 words, keeping 3780203 word types
2017-09-27 18:29:12,776 [MainThread  ] [INFO ]  PROGRESS: at sentence #72170000, processed 1413520555 words, keeping 3780366 word types
2017-09-27 18:29:14,295 [MainThread  ] [INFO ]  PROGRESS: at sentence #72180000, processed 1413712841 words, keeping 3780596 word types
2017-09-27 18:29:15,851 [MainThread  ] [INFO ]  PROGRESS: at sentence #72190000, processed 1413909661 words, keeping 3780771 word types
2017-09-27 18:29:17,048 [MainThread  ] [INFO ]  990: ../data/documents/321.json.gz
2017-09-27 18:29:22,651 [MainThread  ] [INFO ]  PROGRESS: at sentence #72200000, processed 1414095876 words, keeping 3780913 word types
2017-09-27 18:29:24,076 [MainThread  ] [INFO ]  PROGRESS: at sentence #72210000, processed 1414271902 words, keeping 3781083 word types
2017-09-27 18:29:25,553 [MainThread  ] [INFO ]  PROGRESS: at sentence #72220000, processed 1414455028

2017-09-27 18:31:03,561 [MainThread  ] [INFO ]  PROGRESS: at sentence #72720000, processed 1423981810 words, keeping 3791976 word types
2017-09-27 18:31:05,005 [MainThread  ] [INFO ]  PROGRESS: at sentence #72730000, processed 1424163234 words, keeping 3792160 word types
2017-09-27 18:31:06,494 [MainThread  ] [INFO ]  PROGRESS: at sentence #72740000, processed 1424350361 words, keeping 3792324 word types
2017-09-27 18:31:07,944 [MainThread  ] [INFO ]  PROGRESS: at sentence #72750000, processed 1424533628 words, keeping 3792550 word types
2017-09-27 18:31:09,489 [MainThread  ] [INFO ]  PROGRESS: at sentence #72760000, processed 1424727811 words, keeping 3792829 word types
2017-09-27 18:31:11,015 [MainThread  ] [INFO ]  PROGRESS: at sentence #72770000, processed 1424919654 words, keeping 3793005 word types
2017-09-27 18:31:12,502 [MainThread  ] [INFO ]  PROGRESS: at sentence #72780000, processed 1425107403 words, keeping 3793214 word types
2017-09-27 18:31:13,951 [MainThread  ] [INFO ]  

2017-09-27 18:33:07,598 [MainThread  ] [INFO ]  training on 0 raw words (0 effective words) took 0.0s, 0 effective words/s
2017-09-27 18:33:07,600 [MainThread  ] [WARNI]  under 10 jobs per worker: consider setting a smaller `batch_words' for smoother alpha decay
2017-09-27 18:33:07,601 [MainThread  ] [WARNI]  supplied example count (0) did not equal expected count (364894570)


In [72]:
model_name = 'vectors/w2v_model_%s_w10_bigram' % dim
model.save(join(DATA_FOLDER, model_name))

2017-09-27 18:54:14,896 [MainThread  ] [INFO ]  saving Word2Vec object under ../data/vectors/w2v_model_300_w10_bigram, separately None
2017-09-27 18:54:14,898 [MainThread  ] [INFO ]  not storing attribute syn0norm
2017-09-27 18:54:14,900 [MainThread  ] [INFO ]  storing np array 'syn0' to ../data/vectors/w2v_model_300_w10_bigram.wv.syn0.npy
2017-09-27 18:54:16,045 [MainThread  ] [INFO ]  storing np array 'syn1neg' to ../data/vectors/w2v_model_300_w10_bigram.syn1neg.npy
2017-09-27 18:54:18,742 [MainThread  ] [INFO ]  not storing attribute cum_table
2017-09-27 18:54:45,268 [MainThread  ] [INFO ]  saved ../data/vectors/w2v_model_300_w10_bigram


## Trigram

In [None]:
sentences = Sentences(join(DATA_FOLDER, 'documents/'))
trigram = gensim.models.Phrases(bigram[sentences])

2017-09-27 18:55:54,836 [MainThread  ] [INFO ]  0: ../data/documents/72.json.gz
2017-09-27 18:55:54,989 [MainThread  ] [INFO ]  collecting all words and their counts
2017-09-27 18:55:54,991 [MainThread  ] [INFO ]  PROGRESS: at sentence #0, processed 0 words and 0 word types
2017-09-27 18:55:56,122 [MainThread  ] [INFO ]  1: ../data/documents/228.json.gz
2017-09-27 18:55:58,374 [MainThread  ] [INFO ]  PROGRESS: at sentence #10000, processed 172754 words and 120247 word types
2017-09-27 18:56:00,070 [MainThread  ] [INFO ]  PROGRESS: at sentence #20000, processed 353297 words and 217217 word types
2017-09-27 18:56:01,735 [MainThread  ] [INFO ]  PROGRESS: at sentence #30000, processed 536780 words and 308526 word types
2017-09-27 18:56:03,433 [MainThread  ] [INFO ]  PROGRESS: at sentence #40000, processed 728442 words and 397106 word types
2017-09-27 18:56:05,070 [MainThread  ] [INFO ]  PROGRESS: at sentence #50000, processed 912530 words and 482165 word types
2017-09-27 18:56:06,785 [Main

2017-09-27 18:57:50,523 [MainThread  ] [INFO ]  PROGRESS: at sentence #540000, processed 10569837 words and 2874875 word types
2017-09-27 18:57:52,961 [MainThread  ] [INFO ]  PROGRESS: at sentence #550000, processed 10848931 words and 2918526 word types
2017-09-27 18:57:53,875 [MainThread  ] [INFO ]  17: ../data/documents/253.json.gz
2017-09-27 18:57:57,664 [MainThread  ] [INFO ]  PROGRESS: at sentence #560000, processed 11067783 words and 2961872 word types
2017-09-27 18:57:59,241 [MainThread  ] [INFO ]  PROGRESS: at sentence #570000, processed 11239984 words and 3004084 word types
2017-09-27 18:58:00,983 [MainThread  ] [INFO ]  PROGRESS: at sentence #580000, processed 11430038 words and 3043587 word types
2017-09-27 18:58:02,588 [MainThread  ] [INFO ]  PROGRESS: at sentence #590000, processed 11610839 words and 3084236 word types
2017-09-27 18:58:04,315 [MainThread  ] [INFO ]  PROGRESS: at sentence #600000, processed 11800070 words and 3122363 word types
2017-09-27 18:58:05,982 [Main

2017-09-27 18:59:55,958 [MainThread  ] [INFO ]  26: ../data/documents/702.json.gz
2017-09-27 18:59:58,255 [MainThread  ] [INFO ]  PROGRESS: at sentence #1130000, processed 22364827 words and 4907465 word types
2017-09-27 19:00:00,450 [MainThread  ] [INFO ]  PROGRESS: at sentence #1140000, processed 22613879 words and 4938246 word types
2017-09-27 19:00:01,450 [MainThread  ] [INFO ]  27: ../data/documents/865.json.gz
2017-09-27 19:00:05,939 [MainThread  ] [INFO ]  PROGRESS: at sentence #1150000, processed 22841015 words and 4970435 word types
2017-09-27 19:00:07,784 [MainThread  ] [INFO ]  PROGRESS: at sentence #1160000, processed 23043939 words and 5000617 word types
2017-09-27 19:00:09,561 [MainThread  ] [INFO ]  PROGRESS: at sentence #1170000, processed 23243499 words and 5031051 word types
2017-09-27 19:00:11,481 [MainThread  ] [INFO ]  PROGRESS: at sentence #1180000, processed 23448210 words and 5062659 word types
2017-09-27 19:00:13,305 [MainThread  ] [INFO ]  PROGRESS: at sentenc

2017-09-27 19:02:08,170 [MainThread  ] [INFO ]  PROGRESS: at sentence #1710000, processed 33766475 words and 6653074 word types
2017-09-27 19:02:09,764 [MainThread  ] [INFO ]  PROGRESS: at sentence #1720000, processed 33941258 words and 6684931 word types
2017-09-27 19:02:11,460 [MainThread  ] [INFO ]  PROGRESS: at sentence #1730000, processed 34131838 words and 6716268 word types
2017-09-27 19:02:13,228 [MainThread  ] [INFO ]  PROGRESS: at sentence #1740000, processed 34321292 words and 6750948 word types
2017-09-27 19:02:14,817 [MainThread  ] [INFO ]  PROGRESS: at sentence #1750000, processed 34497051 words and 6778359 word types
2017-09-27 19:02:16,498 [MainThread  ] [INFO ]  PROGRESS: at sentence #1760000, processed 34684654 words and 6807795 word types
2017-09-27 19:02:18,204 [MainThread  ] [INFO ]  PROGRESS: at sentence #1770000, processed 34872794 words and 6837883 word types
2017-09-27 19:02:20,065 [MainThread  ] [INFO ]  PROGRESS: at sentence #1780000, processed 35080284 words

2017-09-27 19:04:13,091 [MainThread  ] [INFO ]  PROGRESS: at sentence #2310000, processed 45171221 words and 8351966 word types
2017-09-27 19:04:14,872 [MainThread  ] [INFO ]  PROGRESS: at sentence #2320000, processed 45363309 words and 8378990 word types
2017-09-27 19:04:16,699 [MainThread  ] [INFO ]  PROGRESS: at sentence #2330000, processed 45563441 words and 8404566 word types
2017-09-27 19:04:18,416 [MainThread  ] [INFO ]  PROGRESS: at sentence #2340000, processed 45748379 words and 8429310 word types
2017-09-27 19:04:20,180 [MainThread  ] [INFO ]  PROGRESS: at sentence #2350000, processed 45942899 words and 8453325 word types
2017-09-27 19:04:22,026 [MainThread  ] [INFO ]  PROGRESS: at sentence #2360000, processed 46143460 words and 8477530 word types
2017-09-27 19:04:23,865 [MainThread  ] [INFO ]  PROGRESS: at sentence #2370000, processed 46350501 words and 8503393 word types
2017-09-27 19:04:25,796 [MainThread  ] [INFO ]  PROGRESS: at sentence #2380000, processed 46566285 words

2017-09-27 19:06:21,676 [MainThread  ] [INFO ]  48: ../data/documents/303.json.gz
2017-09-27 19:06:25,079 [MainThread  ] [INFO ]  PROGRESS: at sentence #2920000, processed 56955232 words and 9833562 word types
2017-09-27 19:06:26,791 [MainThread  ] [INFO ]  PROGRESS: at sentence #2930000, processed 57129108 words and 9858817 word types
2017-09-27 19:06:28,499 [MainThread  ] [INFO ]  PROGRESS: at sentence #2940000, processed 57308411 words and 9882618 word types
2017-09-27 19:06:30,101 [MainThread  ] [INFO ]  PROGRESS: at sentence #2950000, processed 57476759 words and 9905814 word types
2017-09-27 19:06:31,664 [MainThread  ] [INFO ]  PROGRESS: at sentence #2960000, processed 57642227 words and 9930452 word types
2017-09-27 19:06:33,272 [MainThread  ] [INFO ]  PROGRESS: at sentence #2970000, processed 57820984 words and 9951577 word types
2017-09-27 19:06:35,040 [MainThread  ] [INFO ]  PROGRESS: at sentence #2980000, processed 58008085 words and 9974960 word types
2017-09-27 19:06:36,81

2017-09-27 19:08:52,101 [MainThread  ] [INFO ]  PROGRESS: at sentence #3520000, processed 69799911 words and 11146562 word types
2017-09-27 19:08:55,879 [MainThread  ] [INFO ]  PROGRESS: at sentence #3530000, processed 70228683 words and 11175864 word types
2017-09-27 19:09:00,543 [MainThread  ] [INFO ]  PROGRESS: at sentence #3540000, processed 70603272 words and 11195237 word types
2017-09-27 19:09:03,649 [MainThread  ] [INFO ]  PROGRESS: at sentence #3550000, processed 70957124 words and 11219190 word types
2017-09-27 19:09:06,754 [MainThread  ] [INFO ]  PROGRESS: at sentence #3560000, processed 71298862 words and 11238099 word types
2017-09-27 19:09:10,629 [MainThread  ] [INFO ]  PROGRESS: at sentence #3570000, processed 71712416 words and 11260595 word types
2017-09-27 19:09:13,318 [MainThread  ] [INFO ]  55: ../data/documents/486.json.gz
2017-09-27 19:09:14,608 [MainThread  ] [INFO ]  PROGRESS: at sentence #3580000, processed 72058599 words and 11282583 word types
2017-09-27 19:0

2017-09-27 19:11:13,226 [MainThread  ] [INFO ]  PROGRESS: at sentence #4120000, processed 82695667 words and 12374702 word types
2017-09-27 19:11:14,760 [MainThread  ] [INFO ]  PROGRESS: at sentence #4130000, processed 82858767 words and 12396137 word types
2017-09-27 19:11:16,402 [MainThread  ] [INFO ]  PROGRESS: at sentence #4140000, processed 83027850 words and 12420096 word types
2017-09-27 19:11:18,017 [MainThread  ] [INFO ]  PROGRESS: at sentence #4150000, processed 83198027 words and 12443122 word types
2017-09-27 19:11:19,565 [MainThread  ] [INFO ]  PROGRESS: at sentence #4160000, processed 83367956 words and 12466335 word types
2017-09-27 19:11:21,196 [MainThread  ] [INFO ]  PROGRESS: at sentence #4170000, processed 83543664 words and 12488532 word types
2017-09-27 19:11:21,816 [MainThread  ] [INFO ]  61: ../data/documents/853.json.gz
2017-09-27 19:11:24,128 [MainThread  ] [INFO ]  PROGRESS: at sentence #4180000, processed 83792571 words and 12511266 word types
2017-09-27 19:1

2017-09-27 19:13:15,228 [MainThread  ] [INFO ]  PROGRESS: at sentence #4710000, processed 93616920 words and 13648825 word types
2017-09-27 19:13:16,928 [MainThread  ] [INFO ]  PROGRESS: at sentence #4720000, processed 93803669 words and 13670601 word types
2017-09-27 19:13:18,650 [MainThread  ] [INFO ]  PROGRESS: at sentence #4730000, processed 93991761 words and 13692083 word types
2017-09-27 19:13:20,295 [MainThread  ] [INFO ]  PROGRESS: at sentence #4740000, processed 94171474 words and 13712927 word types
2017-09-27 19:13:21,985 [MainThread  ] [INFO ]  PROGRESS: at sentence #4750000, processed 94356463 words and 13735973 word types
2017-09-27 19:13:23,709 [MainThread  ] [INFO ]  PROGRESS: at sentence #4760000, processed 94540370 words and 13759784 word types
2017-09-27 19:13:25,414 [MainThread  ] [INFO ]  PROGRESS: at sentence #4770000, processed 94726064 words and 13780896 word types
2017-09-27 19:13:26,011 [MainThread  ] [INFO ]  69: ../data/documents/74.json.gz
2017-09-27 19:13

2017-09-27 19:15:13,910 [MainThread  ] [INFO ]  85: ../data/documents/297.json.gz
2017-09-27 19:15:14,793 [MainThread  ] [INFO ]  PROGRESS: at sentence #5250000, processed 104629799 words and 14814200 word types
2017-09-27 19:15:16,512 [MainThread  ] [INFO ]  PROGRESS: at sentence #5260000, processed 104819711 words and 14830656 word types
2017-09-27 19:15:17,191 [MainThread  ] [INFO ]  86: ../data/documents/675.json.gz
2017-09-27 19:15:20,373 [MainThread  ] [INFO ]  PROGRESS: at sentence #5270000, processed 104984433 words and 14847446 word types
2017-09-27 19:15:22,125 [MainThread  ] [INFO ]  PROGRESS: at sentence #5280000, processed 105171545 words and 14866372 word types
2017-09-27 19:15:23,867 [MainThread  ] [INFO ]  PROGRESS: at sentence #5290000, processed 105363598 words and 14882991 word types
2017-09-27 19:15:25,646 [MainThread  ] [INFO ]  PROGRESS: at sentence #5300000, processed 105557445 words and 14899496 word types
2017-09-27 19:15:27,560 [MainThread  ] [INFO ]  PROGRESS

2017-09-27 19:17:32,381 [MainThread  ] [INFO ]  PROGRESS: at sentence #5840000, processed 116615434 words and 15911039 word types
2017-09-27 19:17:34,096 [MainThread  ] [INFO ]  PROGRESS: at sentence #5850000, processed 116799970 words and 15929921 word types
2017-09-27 19:17:35,731 [MainThread  ] [INFO ]  PROGRESS: at sentence #5860000, processed 116978479 words and 15949561 word types
2017-09-27 19:17:37,327 [MainThread  ] [INFO ]  PROGRESS: at sentence #5870000, processed 117148685 words and 15969423 word types
2017-09-27 19:17:38,971 [MainThread  ] [INFO ]  PROGRESS: at sentence #5880000, processed 117325499 words and 15990899 word types
2017-09-27 19:17:40,673 [MainThread  ] [INFO ]  PROGRESS: at sentence #5890000, processed 117507304 words and 16010830 word types
2017-09-27 19:17:42,432 [MainThread  ] [INFO ]  PROGRESS: at sentence #5900000, processed 117697093 words and 16032718 word types
2017-09-27 19:17:44,033 [MainThread  ] [INFO ]  92: ../data/documents/348.json.gz
2017-09-

2017-09-27 19:19:35,334 [MainThread  ] [INFO ]  102: ../data/documents/328.json.gz
2017-09-27 19:19:38,425 [MainThread  ] [INFO ]  PROGRESS: at sentence #6410000, processed 127839036 words and 17003806 word types
2017-09-27 19:19:40,330 [MainThread  ] [INFO ]  PROGRESS: at sentence #6420000, processed 128038877 words and 17020273 word types
2017-09-27 19:19:42,025 [MainThread  ] [INFO ]  PROGRESS: at sentence #6430000, processed 128224038 words and 17039232 word types
2017-09-27 19:19:43,716 [MainThread  ] [INFO ]  PROGRESS: at sentence #6440000, processed 128407211 words and 17057127 word types
2017-09-27 19:19:45,526 [MainThread  ] [INFO ]  PROGRESS: at sentence #6450000, processed 128604171 words and 17074768 word types
2017-09-27 19:19:47,195 [MainThread  ] [INFO ]  PROGRESS: at sentence #6460000, processed 128783553 words and 17093308 word types
2017-09-27 19:19:48,888 [MainThread  ] [INFO ]  PROGRESS: at sentence #6470000, processed 128966888 words and 17112148 word types
2017-09

2017-09-27 19:21:44,988 [MainThread  ] [INFO ]  PROGRESS: at sentence #6990000, processed 139281033 words and 18015098 word types
2017-09-27 19:21:46,727 [MainThread  ] [INFO ]  PROGRESS: at sentence #7000000, processed 139469133 words and 18031554 word types
2017-09-27 19:21:48,490 [MainThread  ] [INFO ]  PROGRESS: at sentence #7010000, processed 139660835 words and 18049263 word types
2017-09-27 19:21:50,249 [MainThread  ] [INFO ]  PROGRESS: at sentence #7020000, processed 139852062 words and 18069001 word types
2017-09-27 19:21:52,088 [MainThread  ] [INFO ]  PROGRESS: at sentence #7030000, processed 140054491 words and 18088284 word types
2017-09-27 19:21:53,749 [MainThread  ] [INFO ]  PROGRESS: at sentence #7040000, processed 140233996 words and 18107818 word types
2017-09-27 19:21:55,458 [MainThread  ] [INFO ]  PROGRESS: at sentence #7050000, processed 140419040 words and 18128185 word types
2017-09-27 19:21:57,226 [MainThread  ] [INFO ]  PROGRESS: at sentence #7060000, processed 

2017-09-27 19:23:44,477 [MainThread  ] [INFO ]  PROGRESS: at sentence #7550000, processed 150253713 words and 19126277 word types
2017-09-27 19:23:46,043 [MainThread  ] [INFO ]  PROGRESS: at sentence #7560000, processed 150415733 words and 19144567 word types
2017-09-27 19:23:46,803 [MainThread  ] [INFO ]  122: ../data/documents/152.json.gz
2017-09-27 19:23:54,526 [MainThread  ] [INFO ]  PROGRESS: at sentence #7570000, processed 150602304 words and 19162915 word types
2017-09-27 19:23:56,260 [MainThread  ] [INFO ]  PROGRESS: at sentence #7580000, processed 150794917 words and 19181251 word types
2017-09-27 19:23:58,025 [MainThread  ] [INFO ]  PROGRESS: at sentence #7590000, processed 150993148 words and 19199929 word types
2017-09-27 19:23:59,682 [MainThread  ] [INFO ]  PROGRESS: at sentence #7600000, processed 151177205 words and 19217196 word types
2017-09-27 19:24:01,498 [MainThread  ] [INFO ]  PROGRESS: at sentence #7610000, processed 151377919 words and 19234801 word types
2017-09

2017-09-27 19:25:55,111 [MainThread  ] [INFO ]  PROGRESS: at sentence #8110000, processed 161572569 words and 20050343 word types
2017-09-27 19:25:56,869 [MainThread  ] [INFO ]  PROGRESS: at sentence #8120000, processed 161761126 words and 20066114 word types
2017-09-27 19:25:57,185 [MainThread  ] [INFO ]  133: ../data/documents/769.json.gz
2017-09-27 19:26:00,724 [MainThread  ] [INFO ]  PROGRESS: at sentence #8130000, processed 161981427 words and 20084238 word types
2017-09-27 19:26:02,773 [MainThread  ] [INFO ]  PROGRESS: at sentence #8140000, processed 162208382 words and 20099791 word types
2017-09-27 19:26:04,704 [MainThread  ] [INFO ]  PROGRESS: at sentence #8150000, processed 162422139 words and 20114490 word types
2017-09-27 19:26:06,536 [MainThread  ] [INFO ]  PROGRESS: at sentence #8160000, processed 162627206 words and 20131013 word types
2017-09-27 19:26:08,577 [MainThread  ] [INFO ]  PROGRESS: at sentence #8170000, processed 162848074 words and 20146969 word types
2017-09

2017-09-27 19:27:59,091 [MainThread  ] [INFO ]  PROGRESS: at sentence #8680000, processed 172639266 words and 21040150 word types
2017-09-27 19:28:00,634 [MainThread  ] [INFO ]  143: ../data/documents/928.json.gz
2017-09-27 19:28:13,965 [MainThread  ] [INFO ]  PROGRESS: at sentence #8690000, processed 172832949 words and 21071665 word types
2017-09-27 19:28:15,737 [MainThread  ] [INFO ]  PROGRESS: at sentence #8700000, processed 173021549 words and 21087398 word types
2017-09-27 19:28:17,194 [MainThread  ] [INFO ]  PROGRESS: at sentence #8710000, processed 173169513 words and 21101687 word types
2017-09-27 19:28:18,939 [MainThread  ] [INFO ]  PROGRESS: at sentence #8720000, processed 173340971 words and 21120526 word types
2017-09-27 19:28:20,793 [MainThread  ] [INFO ]  PROGRESS: at sentence #8730000, processed 173538455 words and 21135064 word types
2017-09-27 19:28:22,513 [MainThread  ] [INFO ]  PROGRESS: at sentence #8740000, processed 173720880 words and 21145760 word types
2017-09

2017-09-27 19:30:15,788 [MainThread  ] [INFO ]  PROGRESS: at sentence #9280000, processed 184729828 words and 22017724 word types
2017-09-27 19:30:17,621 [MainThread  ] [INFO ]  PROGRESS: at sentence #9290000, processed 184924981 words and 22034557 word types
2017-09-27 19:30:18,741 [MainThread  ] [INFO ]  149: ../data/documents/172.json.gz
2017-09-27 19:30:20,103 [MainThread  ] [INFO ]  PROGRESS: at sentence #9300000, processed 185127613 words and 22050636 word types
2017-09-27 19:30:21,555 [MainThread  ] [INFO ]  150: ../data/documents/608.json.gz
2017-09-27 19:30:31,928 [MainThread  ] [INFO ]  PROGRESS: at sentence #9310000, processed 185350421 words and 22066960 word types
2017-09-27 19:30:33,653 [MainThread  ] [INFO ]  PROGRESS: at sentence #9320000, processed 185527337 words and 22082274 word types
2017-09-27 19:30:35,418 [MainThread  ] [INFO ]  PROGRESS: at sentence #9330000, processed 185717987 words and 22098012 word types
2017-09-27 19:30:37,238 [MainThread  ] [INFO ]  PROGRE

2017-09-27 19:32:38,769 [MainThread  ] [INFO ]  PROGRESS: at sentence #9880000, processed 196488597 words and 22958461 word types
2017-09-27 19:32:40,424 [MainThread  ] [INFO ]  PROGRESS: at sentence #9890000, processed 196664236 words and 22973873 word types
2017-09-27 19:32:42,136 [MainThread  ] [INFO ]  PROGRESS: at sentence #9900000, processed 196847789 words and 22990974 word types
2017-09-27 19:32:43,831 [MainThread  ] [INFO ]  PROGRESS: at sentence #9910000, processed 197032533 words and 23007584 word types
2017-09-27 19:32:45,453 [MainThread  ] [INFO ]  PROGRESS: at sentence #9920000, processed 197205339 words and 23024696 word types
2017-09-27 19:32:47,152 [MainThread  ] [INFO ]  PROGRESS: at sentence #9930000, processed 197387074 words and 23041126 word types
2017-09-27 19:32:47,475 [MainThread  ] [INFO ]  155: ../data/documents/357.json.gz
2017-09-27 19:32:49,671 [MainThread  ] [INFO ]  156: ../data/documents/634.json.gz
2017-09-27 19:32:50,611 [MainThread  ] [INFO ]  PROGRE

2017-09-27 19:34:51,557 [MainThread  ] [INFO ]  PROGRESS: at sentence #10470000, processed 208006801 words and 23844451 word types
2017-09-27 19:34:53,408 [MainThread  ] [INFO ]  PROGRESS: at sentence #10480000, processed 208205287 words and 23861239 word types
2017-09-27 19:34:55,156 [MainThread  ] [INFO ]  PROGRESS: at sentence #10490000, processed 208395433 words and 23880676 word types
2017-09-27 19:34:56,958 [MainThread  ] [INFO ]  PROGRESS: at sentence #10500000, processed 208591723 words and 23896424 word types
2017-09-27 19:34:58,767 [MainThread  ] [INFO ]  PROGRESS: at sentence #10510000, processed 208791981 words and 23910560 word types
2017-09-27 19:35:00,333 [MainThread  ] [INFO ]  PROGRESS: at sentence #10520000, processed 208956303 words and 23920987 word types
2017-09-27 19:35:02,140 [MainThread  ] [INFO ]  PROGRESS: at sentence #10530000, processed 209145977 words and 23940219 word types
2017-09-27 19:35:03,879 [MainThread  ] [INFO ]  PROGRESS: at sentence #10540000, pr

2017-09-27 19:37:01,840 [MainThread  ] [INFO ]  PROGRESS: at sentence #11050000, processed 219305596 words and 24655948 word types
2017-09-27 19:37:03,648 [MainThread  ] [INFO ]  PROGRESS: at sentence #11060000, processed 219498934 words and 24670521 word types
2017-09-27 19:37:05,425 [MainThread  ] [INFO ]  PROGRESS: at sentence #11070000, processed 219688513 words and 24686198 word types


In [None]:
trigram.save('../data/saved/trigram')

In [None]:
trigram = gensim.models.phrases.Phrases.load(join(DATA_FOLDER, '../data/saved/trigram'))

In [None]:
sentences = Sentences(join(DATA_FOLDER, 'documents/'))
for phrase, score in trigram.export_phrases(sentences):
    print(u'{0}   {1}'.format(phrase, score))

In [None]:
sentences = Sentences(join(DATA_FOLDER, 'documents/'))
model = Word2Vec(trigram[sentences], size=dim, sg=1, min_count=5, window=10, workers=cpu_count)

In [None]:
model_name = 'vectors/w2v_model_%s_w10_trigram' % dim
model.save(join(DATA_FOLDER, model_name))