In [1]:
import sys
import json
import datetime
import pickle
import gc
import time

from operator import itemgetter
from collections import defaultdict

import pandas as pd
import numpy as np

import gensim
from gensim import corpora, models
from sklearn.feature_extraction.text import CountVectorizer
from gensim import corpora, models, similarities, matutils
from gensim.models.ldamodel import LdaModel
from gensim.models.ldamulticore import LdaMulticore

# Plotting tools
import pyLDAvis
import pyLDAvis.gensim  # don't skip this
import matplotlib.pyplot as plt
%matplotlib inline

import pprint
pp = pprint.PrettyPrinter(indent=4)

import logging
logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.INFO)

In [6]:
with open('clean_data_full.pickle', 'rb') as file:
    art = pickle.load(file)
# List of Extra Stop words
stopwords = [
    'week','another','thing','month','day','come',
    'york','away','left','wrote','came','tell','asked',
    'left','right','hand','point','often','talk','head','point','ago','whether',
    'hour','group','became','become','becomes','often','sometimes','usually','page','sequence','doi','p'
    ]
# Remove Extra Stop Words
art['article_text_nostop_extra'] = [[word for word in x if not word in stopwords and len(word)>2] for x in art['tokenized_nopunc_lower_nostop_extra_lemmatized']]


In [7]:
art['string'] = [' '.join(x) for x in art['article_text_nostop_extra']]

In [15]:
atype='book-review'
years = [ #range (1982,1985),
          range(1985,1990),
          range(1990,1995),
          range(1995,2000), 
          range(2000,2005), 
          range(2005,2010),
          range(2010,2015)
        ]
art=art[art['type']==atype]

In [9]:

art.head()

Unnamed: 0,index,id,type,title,auth1,year,lang,citations,text,text_noent,tokenized_text,tokenized_nopunc,tokenized_nopunc_lower,tokenized_nopunc_lower_nostop,tokenized_nopunc_lower_nostop_extra,tokenized_nopunc_lower_nostop_extra_lemmatized,article_text_nostop_extra,string
12,17,[C:\Users\msatlow\Dropbox\AJSProject\data\jsto...,book-review,\n,Stuart S. Miller,1986,eng,[],page sequence 1 Martin Goodman State and Soci...,page sequence 1 Martin Goodman and in Roman G...,"[page, sequence, 1, Martin, Goodman, and, in, ...","[page, sequence, Martin, Goodman, and, in, Rom...","[page, sequence, martin, goodman, and, in, rom...","[martin, goodman, roman, galilee, centre, post...","[martin, goodman, roman, galilee, centre, post...","[martin, goodman, roman, galilee, centre, post...","[martin, goodman, roman, galilee, centre, post...",martin goodman roman galilee centre postgradua...
13,18,[C:\Users\msatlow\Dropbox\AJSProject\data\jsto...,book-review,\n,Anthony J. Saldarini,1986,eng,[],page sequence 1 Jack N Lightstone The Commerc...,page sequence 1 Jack N Lightstone The Commerc...,"[page, sequence, 1, Jack, N, Lightstone, The, ...","[page, sequence, Jack, N, Lightstone, The, Com...","[page, sequence, jack, n, lightstone, the, com...","[jack, lightstone, commerce, sacred, mediation...","[jack, lightstone, commerce, sacred, mediation...","[jack, lightstone, commerce, sacred, mediation...","[jack, lightstone, commerce, sacred, mediation...",jack lightstone commerce sacred mediation divi...
14,19,[C:\Users\msatlow\Dropbox\AJSProject\data\jsto...,book-review,\n,David Stern,1986,eng,[],page sequence 1 Judith R Baskin Pharaoh s Cou...,page sequence 1 Judith Baskin Pharaoh s Couns...,"[page, sequence, 1, Judith, Baskin, Pharaoh, s...","[page, sequence, Judith, Baskin, Pharaoh, s, C...","[page, sequence, judith, baskin, pharaoh, s, c...","[judith, baskin, pharaoh, counsellors, job, je...","[judith, baskin, pharaoh, counsellors, job, je...","[judith, baskin, pharaoh, counsellor, job, jet...","[judith, baskin, pharaoh, counsellor, job, jet...",judith baskin pharaoh counsellor job jethro ba...
15,20,[C:\Users\msatlow\Dropbox\AJSProject\data\jsto...,book-review,\n,Baruch M. Bokser,1986,eng,[],page sequence 1 Stephen M Passamaneck The Tra...,page sequence 1 Stephen M Passamaneck The Tra...,"[page, sequence, 1, Stephen, M, Passamaneck, T...","[page, sequence, Stephen, M, Passamaneck, The,...","[page, sequence, stephen, m, passamaneck, the,...","[stephen, passamaneck, traditional, law, sale,...","[stephen, passamaneck, traditional, law, sale,...","[stephen, passamaneck, traditional, law, sale,...","[stephen, passamaneck, traditional, law, sale,...",stephen passamaneck traditional law sale shulh...
16,21,[C:\Users\msatlow\Dropbox\AJSProject\data\jsto...,book-review,\n,Marsha L. Rozenblit,1986,eng,[],page sequence 1 Robert S Wistrich Socialism a...,page sequence 1 Robert S Wistrich Socialism a...,"[page, sequence, 1, Robert, S, Wistrich, Socia...","[page, sequence, Robert, S, Wistrich, Socialis...","[page, sequence, robert, s, wistrich, socialis...","[wistrich, socialism, dilemmas, assimilation, ...","[wistrich, socialism, dilemmas, assimilation, ...","[wistrich, socialism, dilemma, assimilation, g...","[wistrich, socialism, dilemma, assimilation, g...",wistrich socialism dilemma assimilation german...


In [16]:
dict_list=[]

for i in years:
    newart=art.copy()
    newart.astype({'year':'int'}).dtypes
    x=int(i[0])-1
    y=int(i[-1])
    newart=newart[newart['year']<y]
    newart=newart[newart['year']>x]
    texts=newart['article_text_nostop_extra'].tolist()
    for a in range(len(texts)):
        for b in range(len (texts[a])):
            dict_list.append(texts[a][b])
    
    res = [sub.split() for sub in dict_list] 
    
    dictionary = corpora.Dictionary(res)
    corpus = [dictionary.doc2bow(text) for text in texts]
   
    corpora.MmCorpus.serialize('corpus_allbooks'+str(i[0])+'.mm', corpus)
    no_of_topics = 17
    ldamodel17 = LdaModel(corpus, num_topics=no_of_topics, id2word=dictionary, passes=50, alpha='auto', eval_every=2000)
    # Save Model (24)
    ldamodel17.save('l2a_17t_50p_autoalpha_books_all_{}_val.model'.format(i[0]))
    vis = pyLDAvis.gensim.prepare(ldamodel17, corpus, dictionary)
    pyLDAvis.save_html(vis,'visualization_research_all'+str(i[0])+'.html')

    
    

2020-08-06 15:16:01,745 : INFO : adding document #0 to Dictionary(0 unique tokens: [])
2020-08-06 15:16:01,811 : INFO : adding document #10000 to Dictionary(3777 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:16:01,869 : INFO : adding document #20000 to Dictionary(5973 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:16:01,882 : INFO : built Dictionary(6397 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...) from 21990 documents (total 21990 corpus positions)
2020-08-06 15:16:01,909 : INFO : storing corpus in Matrix Market format to corpus_allbooks1985.mm
2020-08-06 15:16:01,914 : INFO : saving sparse matrix to corpus_allbooks1985.mm
2020-08-06 15:16:01,919 : INFO : PROGRESS: saving document #0
2020-08-06 15:16:01,961 : INFO : saved 31x6397 matrix, density=6.752% (13390/198307)
2020-08-06 15:16:01,963 : INFO : saving MmCorpus index to corpus_allbooks1985.mm.index
2020-08-06 15:16:01,970 : INFO 

2020-08-06 15:16:02,926 : INFO : topic diff=1.227547, rho=0.447214
2020-08-06 15:16:03,015 : INFO : -8.457 per-word bound, 351.4 perplexity estimate based on a held-out corpus of 31 documents with 21990 words
2020-08-06 15:16:03,016 : INFO : PROGRESS: pass 4, at document #31/31
2020-08-06 15:16:03,040 : INFO : optimized alpha [0.051919613, 0.036703974, 0.045797296, 0.038556024, 0.038747724, 0.067390844, 0.038450018, 0.04702976, 0.041268397, 0.039383516, 0.04260001, 0.03926551, 0.053315163, 0.04224407, 0.041997794, 0.047055643, 0.042509846]
2020-08-06 15:16:03,058 : INFO : topic #1 (0.037): 0.002*"segal" + 0.002*"rabbinic" + 0.001*"god" + 0.001*"belief" + 0.001*"century" + 0.001*"text" + 0.001*"power" + 0.001*"dualism" + 0.001*"review" + 0.001*"political"
2020-08-06 15:16:03,059 : INFO : topic #6 (0.038): 0.024*"diamond" + 0.018*"ratosh" + 0.017*"canaanism" + 0.014*"canaanite" + 0.012*"israeli" + 0.009*"zionism" + 0.009*"diaspora" + 0.008*"political" + 0.008*"secular" + 0.007*"zionist"


2020-08-06 15:16:03,655 : INFO : topic #5 (0.054): 0.009*"goodman" + 0.009*"hazaz" + 0.008*"bargad" + 0.007*"rabbinic" + 0.006*"question" + 0.006*"rabbi" + 0.006*"review" + 0.006*"work" + 0.005*"blumenthal" + 0.005*"hoter"
2020-08-06 15:16:03,657 : INFO : topic diff=0.195978, rho=0.316228
2020-08-06 15:16:03,779 : INFO : -8.185 per-word bound, 291.1 perplexity estimate based on a held-out corpus of 31 documents with 21990 words
2020-08-06 15:16:03,780 : INFO : PROGRESS: pass 9, at document #31/31
2020-08-06 15:16:03,798 : INFO : optimized alpha [0.036236763, 0.023561504, 0.03026201, 0.025795493, 0.025895944, 0.052014418, 0.025773438, 0.03271177, 0.028463604, 0.026140211, 0.029020628, 0.026080692, 0.03705595, 0.028689392, 0.028835109, 0.03257324, 0.028941542]
2020-08-06 15:16:03,817 : INFO : topic #1 (0.024): 0.000*"segal" + 0.000*"rabbinic" + 0.000*"god" + 0.000*"belief" + 0.000*"century" + 0.000*"text" + 0.000*"power" + 0.000*"dualism" + 0.000*"review" + 0.000*"political"
2020-08-06 1

2020-08-06 15:16:04,381 : INFO : topic #12 (0.031): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:04,382 : INFO : topic #5 (0.046): 0.010*"goodman" + 0.009*"hazaz" + 0.008*"bargad" + 0.007*"rabbinic" + 0.006*"question" + 0.006*"rabbi" + 0.006*"review" + 0.005*"work" + 0.005*"blumenthal" + 0.005*"hoter"
2020-08-06 15:16:04,384 : INFO : topic diff=0.039536, rho=0.258199
2020-08-06 15:16:04,475 : INFO : -8.166 per-word bound, 287.2 perplexity estimate based on a held-out corpus of 31 documents with 21990 words
2020-08-06 15:16:04,476 : INFO : PROGRESS: pass 14, at document #31/31
2020-08-06 15:16:04,492 : INFO : optimized alpha [0.029755164, 0.018171629, 0.024012575, 0.020396138, 0.020466099, 0.045037154, 0.020393036, 0.026644906, 0.022955757, 0.020604482, 0.023291614, 0.020563861, 0.03037391, 0.02300362, 0.023210693, 0.02649216, 0.023220

2020-08-06 15:16:05,091 : INFO : topic #0 (0.027): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"authority" + 0.005*"subject"
2020-08-06 15:16:05,095 : INFO : topic #12 (0.027): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:05,097 : INFO : topic #5 (0.042): 0.010*"goodman" + 0.009*"hazaz" + 0.008*"bargad" + 0.007*"rabbinic" + 0.006*"question" + 0.006*"rabbi" + 0.006*"review" + 0.005*"work" + 0.005*"blumenthal" + 0.005*"hoter"
2020-08-06 15:16:05,099 : INFO : topic diff=0.009934, rho=0.223607
2020-08-06 15:16:05,184 : INFO : -8.163 per-word bound, 286.6 perplexity estimate based on a held-out corpus of 31 documents with 21990 words
2020-08-06 15:16:05,185 : INFO : PROGRESS: pass 19, at document #31/31
2020-08-06 15:16:05,204 : INFO :

2020-08-06 15:16:05,905 : INFO : topic #0 (0.024): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"authority" + 0.005*"subject"
2020-08-06 15:16:05,906 : INFO : topic #12 (0.024): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:05,909 : INFO : topic #5 (0.038): 0.010*"goodman" + 0.009*"hazaz" + 0.008*"bargad" + 0.007*"rabbinic" + 0.006*"question" + 0.006*"rabbi" + 0.006*"review" + 0.005*"work" + 0.005*"blumenthal" + 0.005*"hoter"
2020-08-06 15:16:05,912 : INFO : topic diff=0.003001, rho=0.200000
2020-08-06 15:16:06,013 : INFO : -8.162 per-word bound, 286.4 perplexity estimate based on a held-out corpus of 31 documents with 21990 words
2020-08-06 15:16:06,015 : INFO : PROGRESS: pass 24, at document #31/31
2020-08-06 15:16:06,039 : INFO :

2020-08-06 15:16:06,662 : INFO : topic #3 (0.014): 0.014*"economic" + 0.014*"pollins" + 0.013*"trade" + 0.010*"history" + 0.009*"immigrant" + 0.008*"century" + 0.007*"area" + 0.007*"england" + 0.005*"work" + 0.005*"community"
2020-08-06 15:16:06,663 : INFO : topic #0 (0.022): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"authority" + 0.005*"subject"
2020-08-06 15:16:06,664 : INFO : topic #12 (0.022): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:06,665 : INFO : topic #5 (0.036): 0.010*"goodman" + 0.009*"hazaz" + 0.008*"bargad" + 0.007*"rabbinic" + 0.006*"question" + 0.006*"rabbi" + 0.006*"review" + 0.005*"work" + 0.005*"blumenthal" + 0.005*"hoter"
2020-08-06 15:16:06,667 : INFO : topic diff=0.001068, rho=0.182574
2020-08-06 15:16:06

2020-08-06 15:16:07,568 : INFO : topic #1 (0.011): 0.000*"segal" + 0.000*"rabbinic" + 0.000*"god" + 0.000*"belief" + 0.000*"century" + 0.000*"text" + 0.000*"power" + 0.000*"dualism" + 0.000*"review" + 0.000*"political"
2020-08-06 15:16:07,569 : INFO : topic #11 (0.013): 0.041*"caspi" + 0.024*"kesef" + 0.021*"herring" + 0.015*"miracle" + 0.011*"gevia" + 0.009*"question" + 0.008*"impossible" + 0.006*"god" + 0.006*"medieval" + 0.006*"category"
2020-08-06 15:16:07,570 : INFO : topic #0 (0.021): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"authority" + 0.005*"subject"
2020-08-06 15:16:07,571 : INFO : topic #12 (0.021): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:07,572 : INFO : topic #5 (0.034): 0.010*"goodman" + 0.009*"hazaz" + 0.008

2020-08-06 15:16:08,432 : INFO : topic #1 (0.010): 0.000*"segal" + 0.000*"rabbinic" + 0.000*"god" + 0.000*"belief" + 0.000*"century" + 0.000*"text" + 0.000*"power" + 0.000*"dualism" + 0.000*"review" + 0.000*"political"
2020-08-06 15:16:08,434 : INFO : topic #4 (0.012): 0.026*"hartman" + 0.021*"god" + 0.015*"love" + 0.009*"covenantal" + 0.008*"theology" + 0.008*"human" + 0.008*"covenant" + 0.007*"rabbinic" + 0.007*"model" + 0.007*"terror"
2020-08-06 15:16:08,435 : INFO : topic #0 (0.019): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"subject" + 0.005*"authority"
2020-08-06 15:16:08,436 : INFO : topic #12 (0.020): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:08,438 : INFO : topic #5 (0.033): 0.010*"goodman" + 0.009*"hazaz" + 0.008*"b

2020-08-06 15:16:09,289 : INFO : topic #1 (0.009): 0.000*"segal" + 0.000*"rabbinic" + 0.000*"god" + 0.000*"belief" + 0.000*"century" + 0.000*"text" + 0.000*"power" + 0.000*"dualism" + 0.000*"review" + 0.000*"political"
2020-08-06 15:16:09,292 : INFO : topic #3 (0.011): 0.014*"economic" + 0.014*"pollins" + 0.013*"trade" + 0.010*"history" + 0.009*"immigrant" + 0.008*"century" + 0.007*"area" + 0.007*"england" + 0.005*"work" + 0.005*"community"
2020-08-06 15:16:09,295 : INFO : topic #0 (0.018): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"subject" + 0.005*"authority"
2020-08-06 15:16:09,298 : INFO : topic #12 (0.019): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"canonization" + 0.007*"geonim" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:09,301 : INFO : topic #5 (0.032): 0.010*"goodman" + 0.009*"hazaz" + 0.008

2020-08-06 15:16:10,180 : INFO : topic #1 (0.008): 0.000*"segal" + 0.000*"rabbinic" + 0.000*"god" + 0.000*"belief" + 0.000*"century" + 0.000*"text" + 0.000*"power" + 0.000*"dualism" + 0.000*"review" + 0.000*"political"
2020-08-06 15:16:10,181 : INFO : topic #3 (0.010): 0.014*"economic" + 0.014*"pollins" + 0.013*"trade" + 0.010*"history" + 0.009*"immigrant" + 0.008*"century" + 0.007*"area" + 0.007*"england" + 0.005*"work" + 0.005*"community"
2020-08-06 15:16:10,182 : INFO : topic #0 (0.018): 0.020*"blidstein" + 0.012*"maimonides" + 0.009*"buber" + 0.009*"politics" + 0.006*"source" + 0.006*"political" + 0.006*"power" + 0.006*"king" + 0.005*"subject" + 0.005*"authority"
2020-08-06 15:16:10,183 : INFO : topic #12 (0.018): 0.012*"hoffman" + 0.010*"geonic" + 0.010*"liturgical" + 0.008*"period" + 0.007*"study" + 0.007*"geonim" + 0.007*"canonization" + 0.006*"evidence" + 0.006*"source" + 0.006*"analysis"
2020-08-06 15:16:10,185 : INFO : topic #5 (0.031): 0.010*"goodman" + 0.009*"hazaz" + 0.008

2020-08-06 15:17:56,153 : INFO : topic diff=7.280720, rho=1.000000
2020-08-06 15:17:56,826 : INFO : -10.852 per-word bound, 1847.9 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:17:56,828 : INFO : PROGRESS: pass 1, at document #114/114
2020-08-06 15:17:57,048 : INFO : optimized alpha [0.08648018, 0.086284876, 0.061938975, 0.06484779, 0.08888531, 0.07246604, 0.071626134, 0.069882244, 0.069157675, 0.0721534, 0.07341676, 0.069325104, 0.082328364, 0.065092176, 0.079045884, 0.078543514, 0.07420741]
2020-08-06 15:17:57,094 : INFO : topic #2 (0.062): 0.009*"ezra" + 0.007*"vision" + 0.007*"stone" + 0.005*"author" + 0.003*"idel" + 0.003*"religious" + 0.003*"experience" + 0.003*"literary" + 0.003*"study" + 0.003*"work"
2020-08-06 15:17:57,096 : INFO : topic #3 (0.065): 0.005*"kabbalah" + 0.004*"review" + 0.003*"century" + 0.003*"newby" + 0.003*"history" + 0.003*"idel" + 0.003*"arabia" + 0.003*"god" + 0.002*"scholem" + 0.002*"arabian"
2020-08-06 15:

2020-08-06 15:17:59,165 : INFO : topic diff=0.492252, rho=0.377964
2020-08-06 15:17:59,485 : INFO : -8.899 per-word bound, 477.2 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:17:59,486 : INFO : PROGRESS: pass 6, at document #114/114
2020-08-06 15:17:59,565 : INFO : optimized alpha [0.04461773, 0.044272486, 0.029894317, 0.030439368, 0.052081127, 0.03548923, 0.03558152, 0.036082026, 0.03317242, 0.037071284, 0.03610204, 0.034064453, 0.045394067, 0.03179848, 0.041274987, 0.04149743, 0.04025327]
2020-08-06 15:17:59,609 : INFO : topic #2 (0.030): 0.018*"ezra" + 0.014*"vision" + 0.014*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.003*"work" + 0.003*"commentary"
2020-08-06 15:17:59,611 : INFO : topic #3 (0.030): 0.008*"newby" + 0.007*"arabia" + 0.005*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.003*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002*"god"
2

2020-08-06 15:18:01,336 : INFO : topic diff=0.092618, rho=0.288675
2020-08-06 15:18:01,611 : INFO : -8.825 per-word bound, 453.7 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:01,612 : INFO : PROGRESS: pass 11, at document #114/114
2020-08-06 15:18:01,697 : INFO : optimized alpha [0.034407683, 0.033377822, 0.02169282, 0.021964656, 0.041657977, 0.026221927, 0.027127998, 0.027236715, 0.024325863, 0.028100537, 0.026892927, 0.025144437, 0.03583051, 0.02331304, 0.031486083, 0.03248487, 0.031295035]
2020-08-06 15:18:01,730 : INFO : topic #2 (0.022): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:01,731 : INFO : topic #3 (0.022): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.003*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002*"g

2020-08-06 15:18:03,588 : INFO : topic diff=0.022823, rho=0.242536
2020-08-06 15:18:03,854 : INFO : -8.814 per-word bound, 450.0 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:03,855 : INFO : PROGRESS: pass 16, at document #114/114
2020-08-06 15:18:03,915 : INFO : optimized alpha [0.029323312, 0.028084403, 0.017587474, 0.017760348, 0.036345847, 0.021631539, 0.02298477, 0.022769162, 0.019929763, 0.023573013, 0.02230677, 0.020699063, 0.03121154, 0.019063724, 0.026596608, 0.027854979, 0.026709788]
2020-08-06 15:18:03,953 : INFO : topic #2 (0.018): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:03,954 : INFO : topic #3 (0.018): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002*"

2020-08-06 15:18:05,685 : INFO : topic diff=0.007277, rho=0.213201
2020-08-06 15:18:06,033 : INFO : -8.810 per-word bound, 448.7 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:06,033 : INFO : PROGRESS: pass 21, at document #114/114
2020-08-06 15:18:06,137 : INFO : optimized alpha [0.026164848, 0.02483758, 0.0150397355, 0.015163036, 0.032999083, 0.0187932, 0.020351145, 0.01997783, 0.01720857, 0.020744434, 0.019462496, 0.017942619, 0.02826846, 0.016424056, 0.023556756, 0.02492819, 0.023821712]
2020-08-06 15:18:06,167 : INFO : topic #2 (0.015): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:06,168 : INFO : topic #3 (0.015): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002*"god

2020-08-06 15:18:08,121 : INFO : topic diff=0.003049, rho=0.192450
2020-08-06 15:18:08,435 : INFO : -8.807 per-word bound, 448.0 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:08,436 : INFO : PROGRESS: pass 26, at document #114/114
2020-08-06 15:18:08,563 : INFO : optimized alpha [0.02396854, 0.022598322, 0.013273256, 0.013367328, 0.030647034, 0.016827784, 0.018618548, 0.018031629, 0.015323611, 0.01877212, 0.017488929, 0.016030846, 0.026184328, 0.01459186, 0.021442862, 0.02287002, 0.021796385]
2020-08-06 15:18:08,606 : INFO : topic #2 (0.013): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:08,608 : INFO : topic #3 (0.013): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002*"g

2020-08-06 15:18:10,538 : INFO : topic diff=0.001676, rho=0.176777
2020-08-06 15:18:10,880 : INFO : -8.805 per-word bound, 447.4 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:10,880 : INFO : PROGRESS: pass 31, at document #114/114
2020-08-06 15:18:10,993 : INFO : optimized alpha [0.022331413, 0.02093924, 0.011961614, 0.012036648, 0.028877975, 0.015368699, 0.017328843, 0.016579472, 0.013924241, 0.017300254, 0.016021492, 0.014610143, 0.024609257, 0.013229928, 0.019867849, 0.021323718, 0.020278186]
2020-08-06 15:18:11,037 : INFO : topic #2 (0.012): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:11,038 : INFO : topic #3 (0.012): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002

2020-08-06 15:18:13,595 : INFO : topic diff=0.001100, rho=0.164399
2020-08-06 15:18:13,933 : INFO : -8.804 per-word bound, 447.0 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:13,933 : INFO : PROGRESS: pass 36, at document #114/114
2020-08-06 15:18:14,057 : INFO : optimized alpha [0.021052428, 0.019649202, 0.010941217, 0.011002989, 0.027484858, 0.014233186, 0.016351229, 0.015444848, 0.012835352, 0.016150013, 0.0148780225, 0.013503725, 0.023365002, 0.012169274, 0.018638229, 0.020108515, 0.019087335]
2020-08-06 15:18:14,093 : INFO : topic #2 (0.011): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:14,094 : INFO : topic #3 (0.011): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.0

2020-08-06 15:18:16,209 : INFO : topic diff=0.000772, rho=0.154303
2020-08-06 15:18:16,516 : INFO : -8.803 per-word bound, 446.7 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:16,517 : INFO : PROGRESS: pass 41, at document #114/114
2020-08-06 15:18:16,645 : INFO : optimized alpha [0.020018995, 0.0186108, 0.010120143, 0.010172215, 0.026351165, 0.013318904, 0.015603463, 0.014528345, 0.0119588, 0.015220713, 0.013956363, 0.012612422, 0.022350231, 0.011314941, 0.017645432, 0.019122085, 0.018122211]
2020-08-06 15:18:16,683 : INFO : topic #2 (0.010): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:16,684 : INFO : topic #3 (0.010): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002*"g

2020-08-06 15:18:18,963 : INFO : topic diff=0.000567, rho=0.145865
2020-08-06 15:18:19,419 : INFO : -8.803 per-word bound, 446.5 perplexity estimate based on a held-out corpus of 114 documents with 64741 words
2020-08-06 15:18:19,420 : INFO : PROGRESS: pass 46, at document #114/114
2020-08-06 15:18:19,548 : INFO : optimized alpha [0.019161932, 0.017752424, 0.009442177, 0.009486885, 0.025404617, 0.012563317, 0.014978805, 0.013768866, 0.011234603, 0.014450458, 0.013193982, 0.011875567, 0.021501841, 0.010608811, 0.016822804, 0.01830102, 0.017319987]
2020-08-06 15:18:19,590 : INFO : topic #2 (0.009): 0.018*"ezra" + 0.015*"vision" + 0.015*"stone" + 0.008*"author" + 0.004*"experience" + 0.004*"eschatological" + 0.004*"religious" + 0.004*"literary" + 0.004*"work" + 0.004*"commentary"
2020-08-06 15:18:19,591 : INFO : topic #3 (0.009): 0.009*"newby" + 0.007*"arabia" + 0.006*"arabian" + 0.004*"review" + 0.004*"century" + 0.003*"islam" + 0.002*"history" + 0.002*"arabic" + 0.002*"relation" + 0.002

2020-08-06 15:22:21,297 : INFO : adding document #20000 to Dictionary(5973 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:22:21,350 : INFO : adding document #30000 to Dictionary(7852 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:22:21,404 : INFO : adding document #40000 to Dictionary(9454 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:22:21,461 : INFO : adding document #50000 to Dictionary(10905 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:22:21,521 : INFO : adding document #60000 to Dictionary(12339 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:22:21,592 : INFO : adding document #70000 to Dictionary(13430 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:22:21,647 : INFO : adding document #80000 to Dictionary(14493 unique tokens: ['martin', 'goodman', 'roman',

2020-08-06 15:22:26,279 : INFO : topic #6 (0.052): 0.004*"blood" + 0.004*"woman" + 0.003*"history" + 0.003*"review" + 0.003*"hilberg" + 0.003*"hoffman" + 0.002*"study" + 0.002*"christian" + 0.002*"holocaust" + 0.002*"reading"
2020-08-06 15:22:26,280 : INFO : topic #5 (0.070): 0.007*"study" + 0.005*"review" + 0.005*"history" + 0.005*"christian" + 0.004*"work" + 0.004*"text" + 0.003*"period" + 0.003*"world" + 0.003*"author" + 0.003*"example"
2020-08-06 15:22:26,283 : INFO : topic #3 (0.079): 0.005*"history" + 0.005*"review" + 0.005*"study" + 0.005*"qumran" + 0.004*"scroll" + 0.004*"schiffman" + 0.004*"american" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:22:26,286 : INFO : topic #13 (0.082): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.005*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"rabbi" + 0.003*"century" + 0.003*"source" + 0.003*"tradition"
2020-08-06 15:22:26,289 : INFO : topic diff=1.245366, rho=0.500000
2020-08-06 15:22:26,919 : INFO : -9.3

2020-08-06 15:22:30,845 : INFO : topic #6 (0.030): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"nazi" + 0.003*"review" + 0.003*"destruction" + 0.003*"janus" + 0.003*"circumcision"
2020-08-06 15:22:30,847 : INFO : topic #5 (0.043): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.005*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"period" + 0.003*"author"
2020-08-06 15:22:30,848 : INFO : topic #3 (0.049): 0.006*"history" + 0.005*"qumran" + 0.005*"american" + 0.005*"study" + 0.005*"scroll" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:22:30,850 : INFO : topic #13 (0.054): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.004*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"rabbi" + 0.003*"author"
2020-08-06 15:22:30,854 : INFO : topic diff=0.227847, rho=0.333333
2020-08-06 15:22:31,569 : INFO

2020-08-06 15:22:36,134 : INFO : topic #6 (0.022): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"nazi" + 0.003*"destruction" + 0.003*"herod" + 0.003*"review" + 0.003*"janus"
2020-08-06 15:22:36,136 : INFO : topic #5 (0.034): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"period" + 0.003*"author"
2020-08-06 15:22:36,138 : INFO : topic #3 (0.041): 0.006*"history" + 0.005*"american" + 0.005*"qumran" + 0.005*"scroll" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:22:36,140 : INFO : topic #13 (0.045): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.004*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"rabbi" + 0.003*"author"
2020-08-06 15:22:36,144 : INFO : topic diff=0.051533, rho=0.267261
2020-08-06 15:22:37,058 : INFO : -8.9

2020-08-06 15:22:41,943 : INFO : topic #6 (0.019): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"nazi" + 0.004*"herod" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:22:41,945 : INFO : topic #5 (0.030): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"period" + 0.003*"author"
2020-08-06 15:22:41,947 : INFO : topic #3 (0.036): 0.006*"history" + 0.005*"american" + 0.005*"qumran" + 0.005*"scroll" + 0.005*"schiffman" + 0.005*"study" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:22:41,949 : INFO : topic #13 (0.039): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.004*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"rabbi" + 0.003*"author"
2020-08-06 15:22:41,953 : INFO : topic diff=0.014915, rho=0.229416
2020-08-06 15:22:43,217 : INFO : -8.9

2020-08-06 15:22:50,545 : INFO : topic #6 (0.016): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"nazi" + 0.004*"herod" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:22:50,548 : INFO : topic #5 (0.027): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"period" + 0.003*"rabbinic"
2020-08-06 15:22:50,551 : INFO : topic #3 (0.033): 0.006*"history" + 0.005*"american" + 0.005*"qumran" + 0.005*"scroll" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:22:50,553 : INFO : topic #13 (0.036): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.004*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"rabbi" + 0.003*"author"
2020-08-06 15:22:50,559 : INFO : topic diff=0.005491, rho=0.204124
2020-08-06 15:22:51,654 : INFO : -8

2020-08-06 15:22:59,579 : INFO : topic #6 (0.014): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"herod" + 0.004*"nazi" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:22:59,582 : INFO : topic #5 (0.025): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"rabbinic" + 0.003*"period"
2020-08-06 15:22:59,585 : INFO : topic #3 (0.031): 0.006*"history" + 0.005*"american" + 0.005*"qumran" + 0.005*"scroll" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:22:59,589 : INFO : topic #13 (0.033): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.004*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"rabbi" + 0.003*"author"
2020-08-06 15:22:59,594 : INFO : topic diff=0.002626, rho=0.185695
2020-08-06 15:23:00,990 : INFO : -8

2020-08-06 15:23:10,350 : INFO : topic #6 (0.013): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"herod" + 0.004*"nazi" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:23:10,352 : INFO : topic #5 (0.023): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"rabbinic" + 0.003*"period"
2020-08-06 15:23:10,355 : INFO : topic #3 (0.029): 0.006*"history" + 0.006*"qumran" + 0.005*"american" + 0.005*"scroll" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:23:10,357 : INFO : topic #13 (0.032): 0.006*"rabbinic" + 0.005*"study" + 0.005*"review" + 0.005*"history" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"rabbi" + 0.003*"author"
2020-08-06 15:23:10,362 : INFO : topic diff=0.001608, rho=0.171499
2020-08-06 15:23:11,728 : INFO : -8

2020-08-06 15:23:21,114 : INFO : topic #6 (0.012): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"herod" + 0.004*"nazi" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:23:21,117 : INFO : topic #5 (0.022): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"rabbinic" + 0.003*"period"
2020-08-06 15:23:21,119 : INFO : topic #3 (0.028): 0.006*"history" + 0.006*"qumran" + 0.005*"american" + 0.005*"scroll" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:23:21,123 : INFO : topic #13 (0.030): 0.006*"rabbinic" + 0.005*"study" + 0.005*"history" + 0.005*"review" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"author" + 0.003*"rabbi"
2020-08-06 15:23:21,128 : INFO : topic diff=0.001163, rho=0.160128
2020-08-06 15:23:22,683 : INFO : -8

2020-08-06 15:23:31,501 : INFO : topic #6 (0.011): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"herod" + 0.004*"nazi" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:23:31,503 : INFO : topic #5 (0.021): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"rabbinic" + 0.003*"period"
2020-08-06 15:23:31,505 : INFO : topic #3 (0.027): 0.006*"history" + 0.006*"qumran" + 0.005*"american" + 0.005*"scroll" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:23:31,507 : INFO : topic #13 (0.029): 0.006*"rabbinic" + 0.005*"study" + 0.005*"history" + 0.005*"review" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"author" + 0.003*"rabbi"
2020-08-06 15:23:31,511 : INFO : topic diff=0.000924, rho=0.150756
2020-08-06 15:23:32,633 : INFO : -8

2020-08-06 15:23:39,502 : INFO : topic #6 (0.011): 0.006*"blood" + 0.006*"hilberg" + 0.005*"hoffman" + 0.004*"woman" + 0.004*"holocaust" + 0.004*"herod" + 0.004*"nazi" + 0.003*"destruction" + 0.003*"janus" + 0.003*"review"
2020-08-06 15:23:39,503 : INFO : topic #5 (0.020): 0.007*"study" + 0.005*"review" + 0.005*"christian" + 0.005*"text" + 0.004*"history" + 0.004*"work" + 0.004*"source" + 0.003*"tradition" + 0.003*"rabbinic" + 0.003*"period"
2020-08-06 15:23:39,505 : INFO : topic #3 (0.026): 0.006*"history" + 0.006*"qumran" + 0.005*"scroll" + 0.005*"american" + 0.005*"study" + 0.005*"schiffman" + 0.005*"review" + 0.004*"community" + 0.004*"work" + 0.003*"author"
2020-08-06 15:23:39,508 : INFO : topic #13 (0.028): 0.006*"rabbinic" + 0.005*"study" + 0.005*"history" + 0.005*"review" + 0.004*"work" + 0.003*"historical" + 0.003*"tradition" + 0.003*"century" + 0.003*"author" + 0.003*"rabbi"
2020-08-06 15:23:39,513 : INFO : topic diff=0.000772, rho=0.142857
2020-08-06 15:23:40,477 : INFO : -8

2020-08-06 15:30:27,484 : INFO : adding document #190000 to Dictionary(22483 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:30:27,538 : INFO : adding document #200000 to Dictionary(23100 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:30:27,593 : INFO : adding document #210000 to Dictionary(23663 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:30:27,649 : INFO : adding document #220000 to Dictionary(24161 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:30:27,704 : INFO : adding document #230000 to Dictionary(24687 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:30:27,761 : INFO : adding document #240000 to Dictionary(25397 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:30:27,814 : INFO : adding document #250000 to Dictionary(26204 unique tokens: ['martin', 'goodman'

2020-08-06 15:30:31,385 : INFO : PROGRESS: pass 3, at document #155/155
2020-08-06 15:30:31,564 : INFO : optimized alpha [0.05120441, 0.055231903, 0.09666216, 0.04431195, 0.055781744, 0.043435585, 0.044670567, 0.042563703, 0.04793346, 0.044234052, 0.048831537, 0.042166397, 0.058437884, 0.050650455, 0.056577913, 0.044176534, 0.054729857]
2020-08-06 15:30:31,636 : INFO : topic #11 (0.042): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.002*"american" + 0.002*"identity" + 0.002*"non" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"based"
2020-08-06 15:30:31,638 : INFO : topic #7 (0.043): 0.003*"story" + 0.002*"translation" + 0.002*"reader" + 0.002*"subject" + 0.001*"voice" + 0.001*"poem" + 0.001*"spicehandler" + 0.001*"patterson" + 0.001*"random" + 0.001*"ezra"
2020-08-06 15:30:31,640 : INFO : topic #14 (0.057): 0.004*"american" + 0.004*"slave" + 0.004*"german" + 0.004*"synagogue" + 0.003*"yiddish" + 0.003*"student" + 0.003*"work" + 0.003*"identity" + 0.003*"maimonide

2020-08-06 15:30:35,500 : INFO : -9.149 per-word bound, 567.8 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:30:35,501 : INFO : PROGRESS: pass 8, at document #155/155
2020-08-06 15:30:35,666 : INFO : optimized alpha [0.03208026, 0.03521223, 0.07440955, 0.027847495, 0.03704028, 0.027141936, 0.027650524, 0.025898727, 0.029781677, 0.02781058, 0.031715397, 0.025758106, 0.03858472, 0.032608375, 0.037409734, 0.027191494, 0.035222612]
2020-08-06 15:30:35,768 : INFO : topic #11 (0.026): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:30:35,769 : INFO : topic #7 (0.026): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra"
2020-08-06 15:30:35,771 : INFO : topic #14 (0.037): 0.005*"american" 

2020-08-06 15:30:39,122 : INFO : topic diff=0.035594, rho=0.267261
2020-08-06 15:30:39,659 : INFO : -9.124 per-word bound, 557.8 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:30:39,660 : INFO : PROGRESS: pass 13, at document #155/155
2020-08-06 15:30:39,793 : INFO : optimized alpha [0.02511807, 0.027882703, 0.0651423, 0.021621251, 0.029926868, 0.02099429, 0.021317393, 0.019728685, 0.023126792, 0.021598544, 0.025174312, 0.0196478, 0.031140024, 0.025896307, 0.030408606, 0.020856585, 0.028063731]
2020-08-06 15:30:39,896 : INFO : topic #11 (0.020): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:30:39,897 : INFO : topic #7 (0.020): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra"
2

2020-08-06 15:30:42,997 : INFO : topic diff=0.009193, rho=0.229416
2020-08-06 15:30:43,589 : INFO : -9.119 per-word bound, 555.9 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:30:43,590 : INFO : PROGRESS: pass 18, at document #155/155
2020-08-06 15:30:43,876 : INFO : optimized alpha [0.021296563, 0.023864254, 0.059876803, 0.018160224, 0.02596494, 0.017580362, 0.01781851, 0.016330274, 0.01946706, 0.018144032, 0.021517392, 0.016274976, 0.027017627, 0.022162234, 0.026525691, 0.017366821, 0.024119128]
2020-08-06 15:30:43,954 : INFO : topic #11 (0.016): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:30:43,956 : INFO : topic #7 (0.016): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra

2020-08-06 15:30:47,938 : INFO : topic diff=0.003015, rho=0.204124
2020-08-06 15:30:48,559 : INFO : -9.117 per-word bound, 555.2 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:30:48,560 : INFO : PROGRESS: pass 23, at document #155/155
2020-08-06 15:30:48,794 : INFO : optimized alpha [0.018814392, 0.02125416, 0.056152098, 0.01589811, 0.023367139, 0.015350674, 0.01554002, 0.014122649, 0.01708852, 0.015885595, 0.019117016, 0.014081289, 0.024323191, 0.019717071, 0.023963196, 0.0150984805, 0.02154931]
2020-08-06 15:30:48,887 : INFO : topic #11 (0.014): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:30:48,889 : INFO : topic #7 (0.014): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra"

2020-08-06 15:30:53,081 : INFO : topic diff=0.001268, rho=0.185695
2020-08-06 15:30:53,637 : INFO : -9.116 per-word bound, 554.7 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:30:53,638 : INFO : PROGRESS: pass 28, at document #155/155
2020-08-06 15:30:53,900 : INFO : optimized alpha [0.017043011, 0.019390337, 0.053071484, 0.014278213, 0.021499317, 0.013755022, 0.0139126275, 0.012549335, 0.015391028, 0.014268053, 0.01739175, 0.012516645, 0.02238973, 0.017961966, 0.022111934, 0.013480619, 0.019710332]
2020-08-06 15:30:54,000 : INFO : topic #7 (0.013): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra"
2020-08-06 15:30:54,002 : INFO : topic #11 (0.013): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"bas

2020-08-06 15:30:57,938 : INFO : topic diff=0.000678, rho=0.171499
2020-08-06 15:30:58,562 : INFO : -9.115 per-word bound, 554.4 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:30:58,564 : INFO : PROGRESS: pass 33, at document #155/155
2020-08-06 15:30:58,794 : INFO : optimized alpha [0.015701024, 0.01797737, 0.050645083, 0.013048597, 0.02007578, 0.012544471, 0.012679758, 0.011359756, 0.014105402, 0.013040061, 0.016077993, 0.011332929, 0.020918138, 0.016626632, 0.02069575, 0.012256345, 0.018313933]
2020-08-06 15:30:58,876 : INFO : topic #11 (0.011): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:30:58,878 : INFO : topic #7 (0.011): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra

2020-08-06 15:31:02,970 : INFO : topic diff=0.000440, rho=0.160128
2020-08-06 15:31:03,586 : INFO : -9.114 per-word bound, 554.1 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:31:03,587 : INFO : PROGRESS: pass 38, at document #155/155
2020-08-06 15:31:03,843 : INFO : optimized alpha [0.014641165, 0.01686061, 0.048680786, 0.0120763695, 0.018945765, 0.011587781, 0.011706509, 0.010422335, 0.013090483, 0.0120690195, 0.015036332, 0.010399718, 0.019751072, 0.015568465, 0.019568155, 0.011290794, 0.017208826]
2020-08-06 15:31:03,934 : INFO : topic #11 (0.010): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:31:03,936 : INFO : topic #7 (0.010): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"

2020-08-06 15:31:08,258 : INFO : topic diff=0.000325, rho=0.150756
2020-08-06 15:31:08,844 : INFO : -9.113 per-word bound, 553.9 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:31:08,845 : INFO : PROGRESS: pass 43, at document #155/155
2020-08-06 15:31:09,146 : INFO : optimized alpha [0.013778001, 0.01595034, 0.04704071, 0.011284058, 0.01802125, 0.010808486, 0.010914423, 0.009660651, 0.012264313, 0.011277613, 0.0141852815, 0.009641188, 0.018796898, 0.014704261, 0.018643271, 0.010505616, 0.01630706]
2020-08-06 15:31:09,241 : INFO : topic #11 (0.010): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:31:09,243 : INFO : topic #7 (0.010): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra

2020-08-06 15:31:13,286 : INFO : topic diff=0.000262, rho=0.142857
2020-08-06 15:31:13,945 : INFO : -9.113 per-word bound, 553.7 perplexity estimate based on a held-out corpus of 155 documents with 97126 words
2020-08-06 15:31:13,949 : INFO : PROGRESS: pass 48, at document #155/155
2020-08-06 15:31:14,189 : INFO : optimized alpha [0.013058211, 0.015190601, 0.04563948, 0.010623157, 0.017247053, 0.010158708, 0.010254458, 0.0090269875, 0.011575728, 0.010617422, 0.013473718, 0.009009966, 0.0179983, 0.013981889, 0.0178671, 0.009851885, 0.0155536905]
2020-08-06 15:31:14,276 : INFO : topic #11 (0.009): 0.003*"study" + 0.003*"author" + 0.003*"synagogue" + 0.003*"american" + 0.002*"identity" + 0.002*"percent" + 0.002*"eisen" + 0.002*"observe" + 0.002*"non" + 0.002*"based"
2020-08-06 15:31:14,278 : INFO : topic #7 (0.009): 0.003*"story" + 0.003*"translation" + 0.002*"reader" + 0.002*"patterson" + 0.002*"subject" + 0.002*"voice" + 0.002*"poem" + 0.002*"spicehandler" + 0.002*"random" + 0.002*"ezra

2020-08-06 15:39:56,104 : INFO : adding document #250000 to Dictionary(26204 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:39:56,162 : INFO : adding document #260000 to Dictionary(26830 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:39:56,224 : INFO : adding document #270000 to Dictionary(27488 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:39:56,284 : INFO : adding document #280000 to Dictionary(28006 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:39:56,341 : INFO : adding document #290000 to Dictionary(28616 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:39:56,408 : INFO : adding document #300000 to Dictionary(29247 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:39:56,470 : INFO : adding document #310000 to Dictionary(29822 unique tokens: ['martin', 'goodman'

2020-08-06 15:40:02,485 : INFO : topic #15 (0.075): 0.005*"history" + 0.004*"study" + 0.004*"biblical" + 0.004*"literature" + 0.004*"ritual" + 0.004*"work" + 0.003*"reader" + 0.003*"scholar" + 0.003*"german" + 0.002*"historical"
2020-08-06 15:40:02,487 : INFO : topic #11 (0.075): 0.009*"woman" + 0.006*"history" + 0.004*"study" + 0.004*"literature" + 0.004*"century" + 0.004*"rabbinic" + 0.004*"reader" + 0.003*"work" + 0.003*"early" + 0.003*"source"
2020-08-06 15:40:02,489 : INFO : topic #10 (0.084): 0.004*"klezmer" + 0.004*"study" + 0.004*"music" + 0.004*"world" + 0.004*"levinas" + 0.004*"tradition" + 0.003*"work" + 0.003*"century" + 0.003*"author" + 0.003*"american"
2020-08-06 15:40:02,494 : INFO : topic diff=0.967942, rho=0.500000
2020-08-06 15:40:03,410 : INFO : -9.439 per-word bound, 694.3 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:03,412 : INFO : PROGRESS: pass 3, at document #197/197
2020-08-06 15:40:03,704 : INFO : optimized

2020-08-06 15:40:09,377 : INFO : topic #11 (0.047): 0.011*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"reader" + 0.004*"rabbinic" + 0.004*"work" + 0.003*"century" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:09,379 : INFO : topic #15 (0.048): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"scholar" + 0.003*"german" + 0.003*"historical"
2020-08-06 15:40:09,382 : INFO : topic #10 (0.055): 0.005*"klezmer" + 0.005*"music" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:09,389 : INFO : topic diff=0.161346, rho=0.333333
2020-08-06 15:40:10,411 : INFO : -9.126 per-word bound, 558.6 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:10,413 : INFO : PROGRESS: pass 8, at document #197/197
2020-08-06 15:40:10,740 : INFO : optimized

2020-08-06 15:40:16,326 : INFO : topic #11 (0.039): 0.011*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"reader" + 0.004*"rabbinic" + 0.004*"work" + 0.003*"century" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:16,329 : INFO : topic #15 (0.039): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"scholar" + 0.003*"german" + 0.003*"historical"
2020-08-06 15:40:16,332 : INFO : topic #10 (0.045): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:16,338 : INFO : topic diff=0.034378, rho=0.267261
2020-08-06 15:40:17,258 : INFO : -9.101 per-word bound, 549.0 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:17,260 : INFO : PROGRESS: pass 13, at document #197/197
2020-08-06 15:40:17,500 : INFO : optimize

2020-08-06 15:40:23,406 : INFO : topic #11 (0.034): 0.011*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"reader" + 0.004*"rabbinic" + 0.004*"work" + 0.004*"century" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:23,409 : INFO : topic #15 (0.034): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"scholar" + 0.003*"german" + 0.003*"historical"
2020-08-06 15:40:23,413 : INFO : topic #10 (0.040): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:23,418 : INFO : topic diff=0.009722, rho=0.229416
2020-08-06 15:40:24,687 : INFO : -9.094 per-word bound, 546.6 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:24,688 : INFO : PROGRESS: pass 18, at document #197/197
2020-08-06 15:40:25,148 : INFO : optimize

2020-08-06 15:40:32,550 : INFO : topic #15 (0.031): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"german" + 0.003*"scholar" + 0.003*"historical"
2020-08-06 15:40:32,553 : INFO : topic #11 (0.031): 0.011*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"reader" + 0.004*"rabbinic" + 0.004*"century" + 0.004*"work" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:32,557 : INFO : topic #10 (0.037): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:32,564 : INFO : topic diff=0.003731, rho=0.204124
2020-08-06 15:40:33,788 : INFO : -9.091 per-word bound, 545.4 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:33,790 : INFO : PROGRESS: pass 23, at document #197/197
2020-08-06 15:40:34,242 : INFO : optimize

2020-08-06 15:40:41,443 : INFO : topic #15 (0.029): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"german" + 0.003*"scholar" + 0.003*"historical"
2020-08-06 15:40:41,445 : INFO : topic #11 (0.029): 0.012*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"reader" + 0.004*"rabbinic" + 0.004*"century" + 0.004*"work" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:41,448 : INFO : topic #10 (0.035): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:41,453 : INFO : topic diff=0.001933, rho=0.185695
2020-08-06 15:40:42,773 : INFO : -9.089 per-word bound, 544.6 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:42,775 : INFO : PROGRESS: pass 28, at document #197/197
2020-08-06 15:40:43,290 : INFO : optimize

2020-08-06 15:40:50,520 : INFO : topic #15 (0.027): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"german" + 0.003*"scholar" + 0.003*"historical"
2020-08-06 15:40:50,523 : INFO : topic #11 (0.028): 0.012*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"reader" + 0.004*"rabbinic" + 0.004*"century" + 0.004*"work" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:50,525 : INFO : topic #10 (0.033): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:50,530 : INFO : topic diff=0.001247, rho=0.171499
2020-08-06 15:40:51,630 : INFO : -9.088 per-word bound, 544.1 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:40:51,631 : INFO : PROGRESS: pass 33, at document #197/197
2020-08-06 15:40:52,138 : INFO : optimize

2020-08-06 15:40:59,763 : INFO : topic #15 (0.026): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"german" + 0.003*"scholar" + 0.003*"historical"
2020-08-06 15:40:59,765 : INFO : topic #11 (0.027): 0.012*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"rabbinic" + 0.004*"reader" + 0.004*"century" + 0.004*"work" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:40:59,768 : INFO : topic #10 (0.032): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:40:59,773 : INFO : topic diff=0.000918, rho=0.160128
2020-08-06 15:41:00,939 : INFO : -9.086 per-word bound, 543.6 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:41:00,941 : INFO : PROGRESS: pass 38, at document #197/197
2020-08-06 15:41:01,468 : INFO : optimize

2020-08-06 15:41:08,922 : INFO : topic #15 (0.025): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"german" + 0.003*"scholar" + 0.003*"historical"
2020-08-06 15:41:08,925 : INFO : topic #11 (0.026): 0.012*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"rabbinic" + 0.004*"reader" + 0.004*"century" + 0.004*"work" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:41:08,929 : INFO : topic #10 (0.031): 0.005*"music" + 0.005*"klezmer" + 0.004*"study" + 0.004*"levinas" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:41:08,936 : INFO : topic diff=0.000733, rho=0.150756
2020-08-06 15:41:10,128 : INFO : -9.086 per-word bound, 543.3 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:41:10,131 : INFO : PROGRESS: pass 43, at document #197/197
2020-08-06 15:41:10,700 : INFO : optimize

2020-08-06 15:41:18,251 : INFO : topic #15 (0.024): 0.005*"history" + 0.004*"biblical" + 0.004*"ritual" + 0.004*"study" + 0.004*"literature" + 0.004*"work" + 0.003*"reader" + 0.003*"german" + 0.003*"scholar" + 0.003*"historical"
2020-08-06 15:41:18,254 : INFO : topic #11 (0.025): 0.012*"woman" + 0.006*"history" + 0.005*"study" + 0.004*"literature" + 0.004*"rabbinic" + 0.004*"reader" + 0.004*"century" + 0.004*"work" + 0.003*"christian" + 0.003*"early"
2020-08-06 15:41:18,256 : INFO : topic #10 (0.030): 0.005*"music" + 0.005*"klezmer" + 0.004*"levinas" + 0.004*"study" + 0.004*"world" + 0.004*"tradition" + 0.003*"american" + 0.003*"work" + 0.003*"war" + 0.003*"israeli"
2020-08-06 15:41:18,262 : INFO : topic diff=0.000612, rho=0.142857
2020-08-06 15:41:19,335 : INFO : -9.085 per-word bound, 543.0 perplexity estimate based on a held-out corpus of 197 documents with 127978 words
2020-08-06 15:41:19,338 : INFO : PROGRESS: pass 48, at document #197/197
2020-08-06 15:41:19,753 : INFO : optimize

2020-08-06 15:54:03,549 : INFO : adding document #210000 to Dictionary(23663 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:54:03,606 : INFO : adding document #220000 to Dictionary(24161 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:54:03,671 : INFO : adding document #230000 to Dictionary(24687 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:54:03,726 : INFO : adding document #240000 to Dictionary(25397 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:54:03,794 : INFO : adding document #250000 to Dictionary(26204 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:54:03,860 : INFO : adding document #260000 to Dictionary(26830 unique tokens: ['martin', 'goodman', 'roman', 'galilee', 'centre']...)
2020-08-06 15:54:03,931 : INFO : adding document #270000 to Dictionary(27488 unique tokens: ['martin', 'goodman'

2020-08-06 15:54:08,033 : INFO : topic #12 (0.065): 0.004*"birnbaum" + 0.003*"history" + 0.003*"nahmanides" + 0.003*"rabbinic" + 0.003*"christian" + 0.002*"caputo" + 0.002*"avraham" + 0.002*"cultural" + 0.002*"political" + 0.002*"century"
2020-08-06 15:54:08,036 : INFO : topic #5 (0.066): 0.004*"yiddish" + 0.003*"history" + 0.002*"century" + 0.002*"text" + 0.002*"song" + 0.002*"wallich" + 0.002*"german" + 0.002*"secular" + 0.002*"cultural" + 0.002*"early"
2020-08-06 15:54:08,039 : INFO : topic #14 (0.085): 0.005*"history" + 0.004*"material" + 0.004*"cultural" + 0.004*"study" + 0.004*"culture" + 0.003*"christian" + 0.003*"reuchlin" + 0.003*"work" + 0.003*"text" + 0.003*"author"
2020-08-06 15:54:08,043 : INFO : topic #1 (0.088): 0.008*"yiddish" + 0.006*"literature" + 0.005*"american" + 0.004*"culture" + 0.004*"literary" + 0.004*"study" + 0.003*"century" + 0.003*"practice" + 0.003*"writer" + 0.003*"work"
2020-08-06 15:54:08,046 : INFO : topic #7 (0.105): 0.006*"christian" + 0.006*"rabbini

2020-08-06 15:54:13,408 : INFO : topic #5 (0.030): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-08-06 15:54:13,410 : INFO : topic #12 (0.031): 0.007*"birnbaum" + 0.006*"nahmanides" + 0.005*"caputo" + 0.004*"avraham" + 0.004*"christian" + 0.003*"history" + 0.003*"zionist" + 0.003*"levenson" + 0.002*"leader" + 0.002*"rabbinic"
2020-08-06 15:54:13,412 : INFO : topic #14 (0.042): 0.005*"material" + 0.005*"cultural" + 0.005*"culture" + 0.004*"history" + 0.004*"reuchlin" + 0.004*"community" + 0.003*"casaubon" + 0.003*"question" + 0.003*"work" + 0.003*"world"
2020-08-06 15:54:13,414 : INFO : topic #1 (0.052): 0.010*"yiddish" + 0.007*"literature" + 0.005*"american" + 0.005*"culture" + 0.004*"literary" + 0.004*"study" + 0.004*"practice" + 0.004*"writer" + 0.004*"century" + 0.003*"author"
2020-08-06 15:54:13,417 : INFO : topic #7 (0.070): 0.007*"rabbinic" + 0.007*"chr

2020-08-06 15:54:18,543 : INFO : topic #5 (0.021): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-08-06 15:54:18,546 : INFO : topic #12 (0.022): 0.007*"birnbaum" + 0.006*"nahmanides" + 0.005*"caputo" + 0.004*"avraham" + 0.003*"christian" + 0.003*"history" + 0.003*"zionist" + 0.003*"levenson" + 0.003*"leader" + 0.002*"avram"
2020-08-06 15:54:18,549 : INFO : topic #14 (0.032): 0.005*"material" + 0.005*"cultural" + 0.005*"culture" + 0.004*"history" + 0.004*"reuchlin" + 0.004*"community" + 0.004*"casaubon" + 0.003*"question" + 0.003*"work" + 0.003*"world"
2020-08-06 15:54:18,552 : INFO : topic #1 (0.042): 0.010*"yiddish" + 0.007*"literature" + 0.005*"american" + 0.005*"culture" + 0.005*"literary" + 0.004*"study" + 0.004*"practice" + 0.004*"writer" + 0.004*"century" + 0.003*"author"
2020-08-06 15:54:18,555 : INFO : topic #7 (0.060): 0.007*"rabbinic" + 0.007*"christ

2020-08-06 15:54:23,785 : INFO : topic #5 (0.017): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-08-06 15:54:23,787 : INFO : topic #12 (0.018): 0.007*"birnbaum" + 0.007*"nahmanides" + 0.005*"caputo" + 0.004*"avraham" + 0.003*"christian" + 0.003*"history" + 0.003*"zionist" + 0.003*"levenson" + 0.003*"leader" + 0.002*"avram"
2020-08-06 15:54:23,790 : INFO : topic #14 (0.027): 0.005*"material" + 0.005*"cultural" + 0.005*"culture" + 0.004*"history" + 0.004*"reuchlin" + 0.004*"community" + 0.004*"casaubon" + 0.003*"question" + 0.003*"work" + 0.003*"world"
2020-08-06 15:54:23,792 : INFO : topic #1 (0.037): 0.010*"yiddish" + 0.007*"literature" + 0.005*"american" + 0.005*"culture" + 0.005*"literary" + 0.004*"study" + 0.004*"practice" + 0.004*"writer" + 0.004*"century" + 0.003*"mendelssohn"
2020-08-06 15:54:23,795 : INFO : topic #7 (0.054): 0.007*"christian" + 0.007*"

2020-08-06 15:54:29,482 : INFO : optimized alpha [0.02160732, 0.033669032, 0.019957472, 0.017547732, 0.015756462, 0.014673021, 0.019861996, 0.05097797, 0.019997431, 0.01639577, 0.018130817, 0.018127665, 0.015642954, 0.022690326, 0.024203045, 0.018044952, 0.017356435]
2020-08-06 15:54:29,591 : INFO : topic #5 (0.015): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-08-06 15:54:29,594 : INFO : topic #12 (0.016): 0.007*"birnbaum" + 0.007*"nahmanides" + 0.005*"caputo" + 0.004*"avraham" + 0.003*"christian" + 0.003*"history" + 0.003*"zionist" + 0.003*"levenson" + 0.003*"leader" + 0.002*"avram"
2020-08-06 15:54:29,596 : INFO : topic #14 (0.024): 0.005*"material" + 0.005*"cultural" + 0.005*"culture" + 0.004*"history" + 0.004*"reuchlin" + 0.004*"community" + 0.004*"casaubon" + 0.003*"question" + 0.003*"work" + 0.003*"world"
2020-08-06 15:54:29,598 : INFO : topic #1 (0.0

2020-08-06 15:54:35,521 : INFO : -9.151 per-word bound, 568.4 perplexity estimate based on a held-out corpus of 136 documents with 94478 words
2020-08-06 15:54:35,522 : INFO : PROGRESS: pass 26, at document #136/136
2020-08-06 15:54:35,829 : INFO : optimized alpha [0.019668547, 0.031399786, 0.017998591, 0.015667938, 0.013959639, 0.01292243, 0.017931465, 0.048394464, 0.018142581, 0.014556731, 0.016231272, 0.016213864, 0.013872238, 0.020646846, 0.022090623, 0.016163496, 0.015514196]
2020-08-06 15:54:35,946 : INFO : topic #5 (0.013): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-08-06 15:54:35,948 : INFO : topic #12 (0.014): 0.007*"birnbaum" + 0.007*"nahmanides" + 0.005*"caputo" + 0.004*"avraham" + 0.003*"christian" + 0.003*"zionist" + 0.003*"levenson" + 0.003*"history" + 0.003*"leader" + 0.002*"avram"
2020-08-06 15:54:35,950 : INFO : topic #14 (0.022): 0.005*"m

2020-08-06 15:54:40,781 : INFO : topic diff=0.001214, rho=0.176777
2020-08-06 15:54:41,619 : INFO : -9.149 per-word bound, 567.7 perplexity estimate based on a held-out corpus of 136 documents with 94478 words
2020-08-06 15:54:41,620 : INFO : PROGRESS: pass 31, at document #136/136
2020-08-06 15:54:41,981 : INFO : optimized alpha [0.018220447, 0.029687505, 0.016545186, 0.014275276, 0.012629217, 0.011627956, 0.016495774, 0.046363816, 0.01675653, 0.013196119, 0.0148232365, 0.014798192, 0.012558856, 0.019127721, 0.020522188, 0.0147674605, 0.014146743]
2020-08-06 15:54:42,094 : INFO : topic #5 (0.012): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-08-06 15:54:42,097 : INFO : topic #12 (0.013): 0.007*"birnbaum" + 0.007*"nahmanides" + 0.005*"caputo" + 0.004*"avraham" + 0.003*"christian" + 0.003*"zionist" + 0.003*"levenson" + 0.003*"history" + 0.003*"leader" + 0.002

2020-08-06 15:54:47,153 : INFO : topic #7 (0.045): 0.007*"christian" + 0.007*"rabbinic" + 0.005*"study" + 0.004*"legal" + 0.004*"century" + 0.004*"work" + 0.004*"law" + 0.004*"history" + 0.004*"medieval" + 0.003*"rabbi"
2020-08-06 15:54:47,159 : INFO : topic diff=0.000918, rho=0.164399
2020-08-06 15:54:48,021 : INFO : -9.147 per-word bound, 567.1 perplexity estimate based on a held-out corpus of 136 documents with 94478 words
2020-08-06 15:54:48,022 : INFO : PROGRESS: pass 36, at document #136/136
2020-08-06 15:54:48,337 : INFO : optimized alpha [0.017087735, 0.028334942, 0.0154141765, 0.013193026, 0.011596036, 0.010623908, 0.015376643, 0.044704225, 0.015672013, 0.012140019, 0.013728529, 0.013699237, 0.011537578, 0.01794355, 0.019300483, 0.013681268, 0.013082539]
2020-08-06 15:54:48,468 : INFO : topic #5 (0.011): 0.005*"song" + 0.004*"wallich" + 0.003*"manuscript" + 0.003*"text" + 0.003*"yiddish" + 0.002*"collection" + 0.002*"music" + 0.002*"german" + 0.002*"stanza" + 0.002*"god"
2020-

2020-08-06 15:54:53,944 : INFO : topic #1 (0.027): 0.010*"yiddish" + 0.007*"literature" + 0.005*"american" + 0.005*"culture" + 0.005*"literary" + 0.004*"study" + 0.004*"practice" + 0.004*"writer" + 0.003*"author" + 0.003*"mendelssohn"
2020-08-06 15:54:53,946 : INFO : topic #7 (0.044): 0.007*"christian" + 0.007*"rabbinic" + 0.005*"study" + 0.004*"legal" + 0.004*"century" + 0.004*"work" + 0.004*"law" + 0.004*"history" + 0.004*"medieval" + 0.004*"rabbi"
2020-08-06 15:54:53,954 : INFO : topic diff=0.000748, rho=0.154303
2020-08-06 15:54:54,835 : INFO : -9.146 per-word bound, 566.6 perplexity estimate based on a held-out corpus of 136 documents with 94478 words
2020-08-06 15:54:54,836 : INFO : PROGRESS: pass 41, at document #136/136
2020-08-06 15:54:55,272 : INFO : optimized alpha [0.01617155, 0.027230427, 0.014503192, 0.012322429, 0.010765514, 0.009817704, 0.01447403, 0.04330905, 0.014794621, 0.011291341, 0.0128475465, 0.01281588, 0.010715791, 0.016988248, 0.01831532, 0.012806624, 0.012225

2020-08-06 15:55:00,864 : INFO : topic #14 (0.018): 0.005*"material" + 0.005*"cultural" + 0.005*"culture" + 0.004*"history" + 0.004*"reuchlin" + 0.004*"community" + 0.004*"casaubon" + 0.003*"question" + 0.003*"work" + 0.003*"world"
2020-08-06 15:55:00,866 : INFO : topic #1 (0.026): 0.010*"yiddish" + 0.007*"literature" + 0.005*"american" + 0.005*"culture" + 0.005*"literary" + 0.004*"study" + 0.004*"practice" + 0.004*"writer" + 0.003*"author" + 0.003*"mendelssohn"
2020-08-06 15:55:00,869 : INFO : topic #7 (0.042): 0.007*"christian" + 0.007*"rabbinic" + 0.005*"study" + 0.004*"legal" + 0.004*"century" + 0.004*"work" + 0.004*"law" + 0.004*"medieval" + 0.004*"history" + 0.004*"rabbi"
2020-08-06 15:55:00,875 : INFO : topic diff=0.000630, rho=0.145865
2020-08-06 15:55:01,629 : INFO : -9.145 per-word bound, 566.1 perplexity estimate based on a held-out corpus of 136 documents with 94478 words
2020-08-06 15:55:01,630 : INFO : PROGRESS: pass 46, at document #136/136
2020-08-06 15:55:02,009 : INFO

2020-08-06 15:55:06,380 : INFO : saved l2a_17t_50p_autoalpha_books_all_2010_val.model
of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.


  return pd.concat([default_term_info] + list(topic_dfs))


In [None]:
    for a in range(len(texts)):
        for b in range(len (texts[a])):
            dict_list.append(texts[a][b])


    res = [sub.split() for sub in dict_list] 
    dictionary = corpora.Dictionary(res)
    
    corpus = [dictionary.doc2bow(text) for text in texts]
    corpora.MmCorpus.serialize('corpus_book'+str(i[0])+'.mm', corpus)
    
#     vec = CountVectorizer(max_df =.95,min_df = 10,stop_words='english')
#     counts = vec.fit_transform(texts).transpose()
#     corpus = matutils.Sparse2Corpus(counts)
#     with open('full_set_countvec_corpus.'+str(i[0])+'.pickle','wb') as file:
#         pickle.dump(corpus,file)
    
    no_of_topics = 17
    ldamodel17 = LdaModel(corpus, num_topics=no_of_topics, id2word=dictionary, passes=50, alpha='auto', eval_every=2000)
    # Save Model (24)
    ldamodel17.save('lda_17t_50p_autoalpha_book_{}_val.model'.format(i[0]))
    vis = pyLDAvis.gensim.prepare(ldamodel17, corpus, dictionary)
    pyLDAvis.save_html(vis,'visualization_book'+str(i[0])+'.html')
    
    