In [7]:
import gensim.models as g
from gensim.corpora import WikiCorpus
import logging
from _utils import u_constant
from _utils.nlp.ZHConverter import langconv
# Route INFO-level log records (timestamp : level : message) to the notebook
# output so long-running steps report their progress.
logging.basicConfig(format="%(asctime)s : %(levelname)s : %(message)s", level=logging.INFO)
# Chapter working directory. Built by plain string concatenation, so this
# assumes u_constant.PATH_ROOT already ends with a path separator -- TODO confirm.
root_path = u_constant.PATH_ROOT + "for learn/Python/NLP_in_Action/chapter-7/"
# Sub-directory that holds the doc2vec artifacts.
path = root_path + "doc2vec/"
# Chinese Wikipedia articles dump (bz2-compressed XML) used as training input.
ZHWIKI_INPUT_PATH = root_path + "data/zhwiki-latest-pages-articles.xml.bz2"
# Destination file for the trained model.
MODEL_PATH = path + "zhwiki.doc2vec"

In [5]:
class TaggedWikiDocument:
    """Re-iterable stream of ``TaggedDocument`` objects built from a wiki corpus.

    Each article yielded by ``wiki.get_texts()`` becomes one tagged document:
    every token is passed through ``langconv.cht_to_chs`` and the article
    title is used as the document's only tag.
    """

    def __init__(self, wiki):
        """Keep a reference to ``wiki`` and switch its ``metadata`` flag on.

        Note that the flag is set on the caller's object, not on a copy.
        ``__iter__`` relies on ``get_texts()`` yielding
        ``(tokens, (page_id, title))`` pairs.
        """
        self.wiki = wiki
        wiki.metadata = True

    def __iter__(self):
        """Yield one ``TaggedDocument`` per article, tagged with its title."""
        for tokens, meta in self.wiki.get_texts():
            # meta must be a 2-item (page_id, title) pair; only the title is used.
            _page_id, article_title = meta
            converted_tokens = [langconv.cht_to_chs(token) for token in tokens]
            yield g.doc2vec.TaggedDocument(converted_tokens, [article_title])

In [6]:
def train(input_path, model_save_path):
    """Train a Doc2Vec model on a Wikipedia dump and save it to disk.

    Args:
        input_path: Path to the Wikipedia articles dump; passed to ``WikiCorpus``.
        model_save_path: Destination path; passed to ``model.save``.

    Returns:
        None. The trained model is written to ``model_save_path``.
    """
    # An explicit (empty) dictionary is supplied so that, per the gensim docs,
    # WikiCorpus does not build its own Dictionary by scanning the whole dump.
    wiki = WikiCorpus(input_path, lemmatize=False, dictionary={})
    documents = TaggedWikiDocument(wiki)

    # dm=0 selects PV-DBOW; dbow_words=1 additionally trains word vectors
    # alongside the document vectors (see the gensim Doc2Vec documentation).
    model = g.Doc2Vec(documents, dm=0, dbow_words=1, vector_size=200,
                      window=8, min_count=19, epochs=10, workers=8)

    # Fixed: this line was misspelled `mdoel`, which raised NameError only
    # after the whole training run had finished, discarding the model.
    model.save(model_save_path)

In [8]:
# Run the full training job. This is long-running: in the recorded output
# below, the vocabulary scan started at 17:52 and epoch 1 had only reached
# ~49% by 19:28, when the run was interrupted.
train(ZHWIKI_INPUT_PATH, MODEL_PATH)

2018-12-17 17:52:40,243 : INFO : collecting all words and their counts
2018-12-17 17:52:42,133 : INFO : PROGRESS: at example #0, processed 0 words (0/s), 0 word types, 0 tags
2018-12-17 17:56:24,040 : INFO : PROGRESS: at example #10000, processed 4239827 words (19106/s), 2492195 word types, 10000 tags
2018-12-17 17:59:09,504 : INFO : PROGRESS: at example #20000, processed 7421842 words (19231/s), 4130449 word types, 20000 tags
2018-12-17 18:01:35,848 : INFO : PROGRESS: at example #30000, processed 10343940 words (19967/s), 5494395 word types, 30000 tags
2018-12-17 18:03:53,991 : INFO : PROGRESS: at example #40000, processed 13089493 words (19875/s), 6727537 word types, 40000 tags
2018-12-17 18:05:58,443 : INFO : PROGRESS: at example #50000, processed 15673288 words (20761/s), 7839939 word types, 50000 tags
2018-12-17 18:08:02,238 : INFO : PROGRESS: at example #60000, processed 18226547 words (20625/s), 8859024 word types, 60000 tags
2018-12-17 18:10:15,788 : INFO : PROGRESS: at example

2018-12-17 18:59:11,955 : INFO : EPOCH 1 - PROGRESS: at 0.34% examples, 8545 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:13,095 : INFO : EPOCH 1 - PROGRESS: at 0.35% examples, 8573 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:14,320 : INFO : EPOCH 1 - PROGRESS: at 0.37% examples, 8591 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:15,481 : INFO : EPOCH 1 - PROGRESS: at 0.39% examples, 8575 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:16,517 : INFO : EPOCH 1 - PROGRESS: at 0.40% examples, 8601 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:17,581 : INFO : EPOCH 1 - PROGRESS: at 0.42% examples, 8572 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:18,898 : INFO : EPOCH 1 - PROGRESS: at 0.44% examples, 8696 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:20,342 : INFO : EPOCH 1 - PROGRESS: at 0.46% examples, 8626 words/s, in_qsize 0, out_qsize 0
2018-12-17 18:59:21,541 : INFO : EPOCH 1 - PROGRESS: at 0.49% examples, 8620 words/s, in_qsize 0, out_qsize 0
2018-12-17

2018-12-17 19:00:42,672 : INFO : EPOCH 1 - PROGRESS: at 1.87% examples, 8719 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:44,036 : INFO : EPOCH 1 - PROGRESS: at 1.89% examples, 8712 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:45,378 : INFO : EPOCH 1 - PROGRESS: at 1.92% examples, 8704 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:46,517 : INFO : EPOCH 1 - PROGRESS: at 1.94% examples, 8721 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:47,617 : INFO : EPOCH 1 - PROGRESS: at 1.96% examples, 8720 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:48,799 : INFO : EPOCH 1 - PROGRESS: at 1.98% examples, 8731 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:49,960 : INFO : EPOCH 1 - PROGRESS: at 2.00% examples, 8740 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:51,067 : INFO : EPOCH 1 - PROGRESS: at 2.02% examples, 8739 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:00:52,175 : INFO : EPOCH 1 - PROGRESS: at 2.04% examples, 8715 words/s, in_qsize 0, out_qsize 0
2018-12-17

2018-12-17 19:02:15,843 : INFO : EPOCH 1 - PROGRESS: at 3.58% examples, 8582 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:17,110 : INFO : EPOCH 1 - PROGRESS: at 3.61% examples, 8583 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:18,641 : INFO : EPOCH 1 - PROGRESS: at 3.64% examples, 8577 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:19,756 : INFO : EPOCH 1 - PROGRESS: at 3.65% examples, 8586 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:21,104 : INFO : EPOCH 1 - PROGRESS: at 3.69% examples, 8581 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:22,382 : INFO : EPOCH 1 - PROGRESS: at 3.72% examples, 8580 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:23,638 : INFO : EPOCH 1 - PROGRESS: at 3.75% examples, 8578 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:24,642 : INFO : EPOCH 1 - PROGRESS: at 3.78% examples, 8570 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:02:25,818 : INFO : EPOCH 1 - PROGRESS: at 3.81% examples, 8568 words/s, in_qsize 0, out_qsize 0
2018-12-17

2018-12-17 19:03:48,414 : INFO : EPOCH 1 - PROGRESS: at 5.68% examples, 8817 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:49,743 : INFO : EPOCH 1 - PROGRESS: at 5.71% examples, 8814 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:51,032 : INFO : EPOCH 1 - PROGRESS: at 5.74% examples, 8814 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:52,134 : INFO : EPOCH 1 - PROGRESS: at 5.76% examples, 8812 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:53,330 : INFO : EPOCH 1 - PROGRESS: at 5.80% examples, 8809 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:54,674 : INFO : EPOCH 1 - PROGRESS: at 5.83% examples, 8805 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:55,860 : INFO : EPOCH 1 - PROGRESS: at 5.86% examples, 8811 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:57,281 : INFO : EPOCH 1 - PROGRESS: at 5.89% examples, 8808 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:03:58,516 : INFO : EPOCH 1 - PROGRESS: at 5.91% examples, 8810 words/s, in_qsize 0, out_qsize 0
2018-12-17

2018-12-17 19:05:20,520 : INFO : EPOCH 1 - PROGRESS: at 7.87% examples, 9047 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:21,823 : INFO : EPOCH 1 - PROGRESS: at 7.90% examples, 9046 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:23,175 : INFO : EPOCH 1 - PROGRESS: at 7.94% examples, 9048 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:24,388 : INFO : EPOCH 1 - PROGRESS: at 7.98% examples, 9048 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:25,763 : INFO : EPOCH 1 - PROGRESS: at 8.00% examples, 9065 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:26,934 : INFO : EPOCH 1 - PROGRESS: at 8.03% examples, 9068 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:28,099 : INFO : EPOCH 1 - PROGRESS: at 8.06% examples, 9073 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:29,464 : INFO : EPOCH 1 - PROGRESS: at 8.10% examples, 9072 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:05:30,751 : INFO : EPOCH 1 - PROGRESS: at 8.13% examples, 9077 words/s, in_qsize 0, out_qsize 0
2018-12-17

2018-12-17 19:06:54,179 : INFO : EPOCH 1 - PROGRESS: at 10.24% examples, 9278 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:06:55,362 : INFO : EPOCH 1 - PROGRESS: at 10.27% examples, 9282 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:06:56,551 : INFO : EPOCH 1 - PROGRESS: at 10.30% examples, 9282 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:06:58,037 : INFO : EPOCH 1 - PROGRESS: at 10.34% examples, 9293 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:06:59,209 : INFO : EPOCH 1 - PROGRESS: at 10.37% examples, 9295 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:07:00,235 : INFO : EPOCH 1 - PROGRESS: at 10.40% examples, 9291 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:07:01,362 : INFO : EPOCH 1 - PROGRESS: at 10.43% examples, 9298 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:07:02,489 : INFO : EPOCH 1 - PROGRESS: at 10.46% examples, 9298 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:07:03,865 : INFO : EPOCH 1 - PROGRESS: at 10.51% examples, 9299 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:08:24,271 : INFO : EPOCH 1 - PROGRESS: at 12.62% examples, 9407 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:25,646 : INFO : EPOCH 1 - PROGRESS: at 12.67% examples, 9404 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:26,990 : INFO : EPOCH 1 - PROGRESS: at 12.70% examples, 9404 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:28,217 : INFO : EPOCH 1 - PROGRESS: at 12.74% examples, 9402 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:29,486 : INFO : EPOCH 1 - PROGRESS: at 12.77% examples, 9402 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:30,522 : INFO : EPOCH 1 - PROGRESS: at 12.80% examples, 9401 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:31,738 : INFO : EPOCH 1 - PROGRESS: at 12.84% examples, 9404 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:33,020 : INFO : EPOCH 1 - PROGRESS: at 12.87% examples, 9404 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:08:34,247 : INFO : EPOCH 1 - PROGRESS: at 12.90% examples, 9405 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:09:56,499 : INFO : EPOCH 1 - PROGRESS: at 15.15% examples, 9537 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:09:57,727 : INFO : EPOCH 1 - PROGRESS: at 15.18% examples, 9538 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:09:59,024 : INFO : EPOCH 1 - PROGRESS: at 15.21% examples, 9538 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:10:00,262 : INFO : EPOCH 1 - PROGRESS: at 15.25% examples, 9545 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:10:01,438 : INFO : EPOCH 1 - PROGRESS: at 15.28% examples, 9547 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:10:02,564 : INFO : EPOCH 1 - PROGRESS: at 15.30% examples, 9556 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:10:03,624 : INFO : EPOCH 1 - PROGRESS: at 15.33% examples, 9562 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:10:04,725 : INFO : EPOCH 1 - PROGRESS: at 15.34% examples, 9570 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:10:06,137 : INFO : EPOCH 1 - PROGRESS: at 15.38% examples, 9570 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:11:27,992 : INFO : EPOCH 1 - PROGRESS: at 17.69% examples, 9677 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:29,248 : INFO : EPOCH 1 - PROGRESS: at 17.72% examples, 9679 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:30,502 : INFO : EPOCH 1 - PROGRESS: at 17.76% examples, 9683 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:31,878 : INFO : EPOCH 1 - PROGRESS: at 17.79% examples, 9683 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:33,313 : INFO : EPOCH 1 - PROGRESS: at 17.83% examples, 9682 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:34,346 : INFO : EPOCH 1 - PROGRESS: at 17.84% examples, 9680 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:35,778 : INFO : EPOCH 1 - PROGRESS: at 17.87% examples, 9674 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:36,907 : INFO : EPOCH 1 - PROGRESS: at 17.89% examples, 9670 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:11:37,911 : INFO : EPOCH 1 - PROGRESS: at 17.91% examples, 9663 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:13:03,342 : INFO : EPOCH 1 - PROGRESS: at 20.27% examples, 9741 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:04,759 : INFO : EPOCH 1 - PROGRESS: at 20.34% examples, 9740 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:05,987 : INFO : EPOCH 1 - PROGRESS: at 20.38% examples, 9742 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:07,293 : INFO : EPOCH 1 - PROGRESS: at 20.42% examples, 9743 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:08,707 : INFO : EPOCH 1 - PROGRESS: at 20.46% examples, 9743 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:09,858 : INFO : EPOCH 1 - PROGRESS: at 20.50% examples, 9740 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:10,967 : INFO : EPOCH 1 - PROGRESS: at 20.54% examples, 9740 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:12,179 : INFO : EPOCH 1 - PROGRESS: at 20.58% examples, 9744 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:13:13,287 : INFO : EPOCH 1 - PROGRESS: at 20.62% examples, 9748 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:14:35,875 : INFO : EPOCH 1 - PROGRESS: at 23.07% examples, 9810 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:37,209 : INFO : EPOCH 1 - PROGRESS: at 23.11% examples, 9810 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:38,388 : INFO : EPOCH 1 - PROGRESS: at 23.13% examples, 9813 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:39,820 : INFO : EPOCH 1 - PROGRESS: at 23.17% examples, 9812 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:41,112 : INFO : EPOCH 1 - PROGRESS: at 23.22% examples, 9815 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:42,469 : INFO : EPOCH 1 - PROGRESS: at 23.25% examples, 9815 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:43,754 : INFO : EPOCH 1 - PROGRESS: at 23.30% examples, 9816 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:45,179 : INFO : EPOCH 1 - PROGRESS: at 23.35% examples, 9815 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:14:46,487 : INFO : EPOCH 1 - PROGRESS: at 23.39% examples, 9814 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:16:08,193 : INFO : EPOCH 1 - PROGRESS: at 25.85% examples, 9852 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:09,487 : INFO : EPOCH 1 - PROGRESS: at 25.89% examples, 9853 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:10,693 : INFO : EPOCH 1 - PROGRESS: at 25.94% examples, 9855 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:11,993 : INFO : EPOCH 1 - PROGRESS: at 25.98% examples, 9855 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:13,378 : INFO : EPOCH 1 - PROGRESS: at 26.02% examples, 9856 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:14,613 : INFO : EPOCH 1 - PROGRESS: at 26.06% examples, 9856 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:16,046 : INFO : EPOCH 1 - PROGRESS: at 26.11% examples, 9856 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:17,345 : INFO : EPOCH 1 - PROGRESS: at 26.14% examples, 9855 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:16:18,533 : INFO : EPOCH 1 - PROGRESS: at 26.17% examples, 9856 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:17:40,454 : INFO : EPOCH 1 - PROGRESS: at 28.76% examples, 9956 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:41,749 : INFO : EPOCH 1 - PROGRESS: at 28.80% examples, 9955 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:42,986 : INFO : EPOCH 1 - PROGRESS: at 28.84% examples, 9954 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:44,290 : INFO : EPOCH 1 - PROGRESS: at 28.87% examples, 9955 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:45,557 : INFO : EPOCH 1 - PROGRESS: at 28.91% examples, 9956 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:46,828 : INFO : EPOCH 1 - PROGRESS: at 28.95% examples, 9958 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:48,158 : INFO : EPOCH 1 - PROGRESS: at 29.00% examples, 9959 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:49,374 : INFO : EPOCH 1 - PROGRESS: at 29.05% examples, 9961 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:17:50,518 : INFO : EPOCH 1 - PROGRESS: at 29.08% examples, 9966 words/s, in_qsize 0, out_qsize 0
2

2018-12-17 19:19:12,187 : INFO : EPOCH 1 - PROGRESS: at 31.47% examples, 10092 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:13,423 : INFO : EPOCH 1 - PROGRESS: at 31.50% examples, 10095 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:14,759 : INFO : EPOCH 1 - PROGRESS: at 31.54% examples, 10095 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:16,159 : INFO : EPOCH 1 - PROGRESS: at 31.59% examples, 10095 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:17,441 : INFO : EPOCH 1 - PROGRESS: at 31.63% examples, 10097 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:18,636 : INFO : EPOCH 1 - PROGRESS: at 31.67% examples, 10099 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:19,994 : INFO : EPOCH 1 - PROGRESS: at 31.70% examples, 10098 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:21,132 : INFO : EPOCH 1 - PROGRESS: at 31.74% examples, 10101 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:19:22,377 : INFO : EPOCH 1 - PROGRESS: at 31.78% examples, 10101 words/s, in_qsize 0, out_

2018-12-17 19:20:47,445 : INFO : EPOCH 1 - PROGRESS: at 34.22% examples, 10095 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:48,753 : INFO : EPOCH 1 - PROGRESS: at 34.27% examples, 10097 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:49,938 : INFO : EPOCH 1 - PROGRESS: at 34.30% examples, 10098 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:51,279 : INFO : EPOCH 1 - PROGRESS: at 34.34% examples, 10099 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:52,327 : INFO : EPOCH 1 - PROGRESS: at 34.37% examples, 10100 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:53,769 : INFO : EPOCH 1 - PROGRESS: at 34.43% examples, 10099 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:55,056 : INFO : EPOCH 1 - PROGRESS: at 34.47% examples, 10099 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:56,478 : INFO : EPOCH 1 - PROGRESS: at 34.52% examples, 10098 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:20:57,684 : INFO : EPOCH 1 - PROGRESS: at 34.55% examples, 10099 words/s, in_qsize 0, out_

2018-12-17 19:22:21,280 : INFO : EPOCH 1 - PROGRESS: at 37.23% examples, 10093 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:22,395 : INFO : EPOCH 1 - PROGRESS: at 37.27% examples, 10095 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:23,808 : INFO : EPOCH 1 - PROGRESS: at 37.32% examples, 10094 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:25,163 : INFO : EPOCH 1 - PROGRESS: at 37.37% examples, 10094 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:26,480 : INFO : EPOCH 1 - PROGRESS: at 37.40% examples, 10094 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:27,818 : INFO : EPOCH 1 - PROGRESS: at 37.44% examples, 10094 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:29,012 : INFO : EPOCH 1 - PROGRESS: at 37.47% examples, 10092 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:30,482 : INFO : EPOCH 1 - PROGRESS: at 37.51% examples, 10092 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:22:31,854 : INFO : EPOCH 1 - PROGRESS: at 37.56% examples, 10091 words/s, in_qsize 0, out_

2018-12-17 19:23:56,729 : INFO : EPOCH 1 - PROGRESS: at 40.06% examples, 10122 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:23:58,110 : INFO : EPOCH 1 - PROGRESS: at 40.11% examples, 10121 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:23:59,161 : INFO : EPOCH 1 - PROGRESS: at 40.14% examples, 10121 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:24:00,176 : INFO : EPOCH 1 - PROGRESS: at 40.15% examples, 10118 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:24:01,206 : INFO : EPOCH 1 - PROGRESS: at 40.19% examples, 10121 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:24:02,420 : INFO : EPOCH 1 - PROGRESS: at 40.22% examples, 10122 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:24:03,792 : INFO : EPOCH 1 - PROGRESS: at 40.27% examples, 10122 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:24:05,132 : INFO : EPOCH 1 - PROGRESS: at 40.31% examples, 10124 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:24:06,296 : INFO : EPOCH 1 - PROGRESS: at 40.34% examples, 10127 words/s, in_qsize 0, out_

2018-12-17 19:25:31,112 : INFO : EPOCH 1 - PROGRESS: at 42.99% examples, 10181 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:32,418 : INFO : EPOCH 1 - PROGRESS: at 43.02% examples, 10181 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:33,734 : INFO : EPOCH 1 - PROGRESS: at 43.06% examples, 10183 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:34,982 : INFO : EPOCH 1 - PROGRESS: at 43.09% examples, 10186 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:36,232 : INFO : EPOCH 1 - PROGRESS: at 43.14% examples, 10188 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:37,507 : INFO : EPOCH 1 - PROGRESS: at 43.17% examples, 10190 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:38,552 : INFO : EPOCH 1 - PROGRESS: at 43.19% examples, 10190 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:40,061 : INFO : EPOCH 1 - PROGRESS: at 43.24% examples, 10189 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:25:41,198 : INFO : EPOCH 1 - PROGRESS: at 43.27% examples, 10190 words/s, in_qsize 0, out_

2018-12-17 19:27:04,871 : INFO : EPOCH 1 - PROGRESS: at 45.77% examples, 10231 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:06,191 : INFO : EPOCH 1 - PROGRESS: at 45.81% examples, 10230 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:07,471 : INFO : EPOCH 1 - PROGRESS: at 45.85% examples, 10229 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:08,508 : INFO : EPOCH 1 - PROGRESS: at 45.89% examples, 10228 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:10,017 : INFO : EPOCH 1 - PROGRESS: at 45.94% examples, 10227 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:11,383 : INFO : EPOCH 1 - PROGRESS: at 45.98% examples, 10226 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:12,711 : INFO : EPOCH 1 - PROGRESS: at 46.02% examples, 10226 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:14,038 : INFO : EPOCH 1 - PROGRESS: at 46.06% examples, 10227 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:27:15,103 : INFO : EPOCH 1 - PROGRESS: at 46.10% examples, 10226 words/s, in_qsize 0, out_

2018-12-17 19:28:40,434 : INFO : EPOCH 1 - PROGRESS: at 48.81% examples, 10238 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:41,667 : INFO : EPOCH 1 - PROGRESS: at 48.84% examples, 10238 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:43,222 : INFO : EPOCH 1 - PROGRESS: at 48.89% examples, 10238 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:44,265 : INFO : EPOCH 1 - PROGRESS: at 48.92% examples, 10237 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:45,358 : INFO : EPOCH 1 - PROGRESS: at 48.95% examples, 10236 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:46,657 : INFO : EPOCH 1 - PROGRESS: at 48.99% examples, 10233 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:48,119 : INFO : EPOCH 1 - PROGRESS: at 49.03% examples, 10232 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:49,678 : INFO : EPOCH 1 - PROGRESS: at 49.06% examples, 10231 words/s, in_qsize 0, out_qsize 0
2018-12-17 19:28:51,179 : INFO : EPOCH 1 - PROGRESS: at 49.11% examples, 10230 words/s, in_qsize 0, out_

KeyboardInterrupt: 