In [1]:
import sys
# Add the directory two levels above the working directory to the import path
# so the `src.*` imports below can resolve (presumably the project root — confirm).
sys.path.append('../..')
import src.data.data_loader as dl
from src.features.vectorizer import Vectorizer
from src.models.topic_models import TopicModel
import pandas as pd
import sklearn.utils as skutil
# Lift pandas' row limit so displayed frames/series are never truncated.
pd.set_option('display.max_rows', None)



In [2]:
# Data: selects which articles dl.get_articles_by_type loads.
language = 'english'
typex = 'editorial'

# Vectorization: document-frequency bounds passed to Vectorizer as min_df / max_df.
min_df = 0.005
max_df = 0.9

# Topic Modeling
# `algorithm` is embedded in the file names of the saved vectorizer and model.
algorithm = 'lda'
num_topics = 130

# Fraction of the shuffled documents used for training; the remainder is the test split.
train_percentage = 0.9
# The values below are forwarded unchanged to TopicModel as keyword arguments.
alpha = 'auto'
eta = 0.01
iterations = 200
passes = 60
chunksize = 5000
# kappa and tau_0 are passed to TopicModel as decay= and offset= respectively.
# NOTE(review): if TopicModel hands these straight to gensim's LdaModel, gensim
# documents decay as a value in (0.5, 1] and offset defaults to 1.0 — confirm
# that 0 for both is intentional.
kappa = 0
tau_0 = 0

In [3]:
# Load the articles for the configured language and article type.
# kind="tagged" presumably selects the POS-tagged variant — verify in data_loader.
data = dl.get_articles_by_type(language, typex,kind = "tagged")
# Only the 'article_texts' entry is used from here on.
texts = data['article_texts']

def min_length(texts, min_characters):
    """Strip short tokens from every text.

    Each text is split on whitespace, tokens with fewer than
    ``min_characters`` characters are discarded, and the remaining tokens
    are re-joined with single spaces.

    Parameters
    ----------
    texts : iterable of str
        The documents to filter.
    min_characters : int
        Minimum token length (inclusive) for a token to be kept.

    Returns
    -------
    list of str
        One filtered string per input text, in the original order. A text
        with no surviving tokens becomes the empty string.
    """
    def keep_long_tokens(text):
        # split() without arguments collapses any run of whitespace.
        return " ".join(
            word for word in text.split() if len(word) >= min_characters
        )

    return [keep_long_tokens(text) for text in texts]

# Drop every token shorter than 3 characters from each article before vectorizing.
texts = min_length(texts,3)

In [4]:
# Build the vectorizer over the filtered texts with the configured
# document-frequency bounds ('tf' presumably selects raw term frequencies —
# confirm in src.features.vectorizer).
vec = Vectorizer('tf', texts, min_df=min_df, max_df=max_df)

# Persist the vectorizer. The template has exactly three placeholders, so
# exactly three values are supplied: str.format silently ignores surplus
# positional arguments, which would otherwise hide a mismatch between the
# template and its arguments.
vec.save('tagged/vectorizer/{}_{}_{}_pos.pkl'.format(algorithm, language, "article_texts"))

# Document-by-token matrix for the same texts, plus the id -> token lookup
# that the topic model needs to print readable topics.
document_term_matrix = vec.get_document_token_matrix(texts)
id2token = vec.get_id2token_mapping()

In [5]:
# Shuffling reorders rows only, so the shape can be read up front.
num_docs, num_terms = document_term_matrix.shape

# Fixed random_state keeps the row permutation (and hence the split) reproducible.
document_term_matrix = skutil.shuffle(document_term_matrix, random_state=1)

# The first `train` rows form the training set; everything after is held out.
train = int(train_percentage * num_docs)
train_document_term_matrix = document_term_matrix[:train, :]
test_document_term_matrix = document_term_matrix[train:, :]

In [6]:
# Train the topic model on the training split; the held-out split is handed
# over as test_document_term_matrix. The algorithm comes from the `algorithm`
# config value (rather than a hard-coded literal) so that the trained model
# always matches the name embedded in the saved file below.
model = TopicModel(
    algorithm,
    num_topics,
    train_document_term_matrix,
    id2token,
    alpha=alpha,
    eta=eta,
    iterations=iterations,
    passes=passes,
    chunksize=chunksize,
    test_document_term_matrix=test_document_term_matrix,
    decay=kappa,    # config name: kappa
    offset=tau_0,   # config name: tau_0
)
# Persist the trained model; the file name encodes algorithm, language,
# text field, corpus kind and number of topics.
model.save('tagged/topic_models/lda/{}_{}_{}_{}_{}.pkl'.format(algorithm, language, "article_texts","tagged",num_topics))

2018-11-11 03:23:11,425 : INFO : using autotuned alpha, starting with [0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.0076923077, 0.007

2018-11-11 03:23:57,257 : INFO : topic diff=inf, rho=1.000000
2018-11-11 03:24:00,526 : INFO : Epoch 1: perplexity estimate: 13564.83073762272
2018-11-11 03:24:00,682 : INFO : PROGRESS: pass 2, at document #2223/2223
2018-11-11 03:24:14,915 : INFO : optimized alpha [0.007166401, 0.0083258785, 0.010541113, 0.0067886524, 0.0068014134, 0.006809493, 0.007654024, 0.0068862806, 0.009009727, 0.0074943043, 0.00791079, 0.006775417, 0.0070652575, 0.0068068625, 0.007515613, 0.0071291146, 0.0067238905, 0.0068947715, 0.006700691, 0.008332733, 0.007061532, 0.006867117, 0.0067754537, 0.008620505, 0.0070187985, 0.0069259126, 0.0069188266, 0.007481299, 0.0075341365, 0.006783392, 0.007165738, 0.007835085, 0.006962146, 0.0067927777, 0.007047967, 0.007587512, 0.006793459, 0.006828187, 0.0067965197, 0.006961692, 0.0074733845, 0.0068296134, 0.0068565817, 0.009725484, 0.007496103, 0.0086615905, 0.007836382, 0.007016073, 0.0067897094, 0.0067555923, 0.0075206817, 0.007428232, 0.00899682, 0.007862882, 0.0066596

2018-11-11 03:24:47,724 : INFO : topic #54 (0.006): 0.132*"hydroponic" + 0.042*"soil" + 0.028*"board" + 0.027*"system" + 0.021*"greenhouse" + 0.019*"plant" + 0.016*"grow" + 0.015*"nutrient" + 0.015*"nop" + 0.013*"recommendation"
2018-11-11 03:24:47,725 : INFO : topic #52 (0.011): 0.014*"what" + 0.013*"but" + 0.013*"there" + 0.013*"about" + 0.012*"this" + 0.011*"people" + 0.011*"think" + 0.010*"can" + 0.009*"get" + 0.009*"how"
2018-11-11 03:24:47,726 : INFO : topic #2 (0.014): 0.029*"store" + 0.023*"say" + 0.010*"grocery" + 0.010*"market" + 0.010*"will" + 0.010*"more" + 0.010*"year" + 0.009*"new" + 0.008*"company" + 0.007*"customer"
2018-11-11 03:24:47,727 : INFO : topic #76 (0.015): 0.022*"farm" + 0.018*"say" + 0.017*"farmer" + 0.013*"grow" + 0.009*"year" + 0.008*"but" + 0.008*"who" + 0.007*"local" + 0.006*"more" + 0.006*"about"
2018-11-11 03:24:47,733 : INFO : topic diff=inf, rho=1.000000
2018-11-11 03:24:50,604 : INFO : Epoch 4: perplexity estimate: 3498.952173345154
2018-11-11 03:24

2018-11-11 03:25:32,654 : INFO : topic #70 (0.006): 0.087*"a.m." + 0.037*"p.m." + 0.030*"roasted" + 0.029*"morning" + 0.019*"pound" + 0.015*"farm" + 0.015*"natural" + 0.013*"will" + 0.012*"new" + 0.011*"bread"
2018-11-11 03:25:32,655 : INFO : topic #54 (0.006): 0.095*"hydroponic" + 0.058*"board" + 0.046*"lettuce" + 0.038*"soil" + 0.036*"system" + 0.035*"grow" + 0.027*"recommendation" + 0.025*"plant" + 0.021*"greenhouse" + 0.019*"vote"
2018-11-11 03:25:32,656 : INFO : topic #52 (0.019): 0.017*"what" + 0.015*"but" + 0.015*"about" + 0.015*"there" + 0.013*"people" + 0.012*"this" + 0.011*"think" + 0.011*"can" + 0.010*"get" + 0.009*"all"
2018-11-11 03:25:32,657 : INFO : topic #2 (0.020): 0.032*"store" + 0.025*"say" + 0.011*"grocery" + 0.011*"market" + 0.010*"more" + 0.010*"will" + 0.010*"year" + 0.009*"new" + 0.008*"customer" + 0.008*"company"
2018-11-11 03:25:32,658 : INFO : topic #76 (0.021): 0.025*"farm" + 0.020*"say" + 0.019*"farmer" + 0.013*"grow" + 0.011*"year" + 0.008*"who" + 0.008*"b

2018-11-11 03:26:19,652 : INFO : topic #61 (0.005): 0.050*"susan" + 0.024*"administrator" + 0.017*"sugar" + 0.015*"eat" + 0.012*"but" + 0.011*"fat" + 0.011*"body" + 0.010*"can" + 0.010*"add" + 0.008*"say"
2018-11-11 03:26:19,653 : INFO : topic #89 (0.005): 0.020*"coleman" + 0.017*"natural" + 0.017*"more" + 0.012*"but" + 0.011*"healthy" + 0.010*"what" + 0.009*"worker" + 0.009*"need" + 0.009*"when" + 0.008*"some"
2018-11-11 03:26:19,654 : INFO : topic #2 (0.027): 0.034*"store" + 0.026*"say" + 0.012*"grocery" + 0.011*"market" + 0.010*"more" + 0.010*"will" + 0.010*"new" + 0.009*"year" + 0.008*"customer" + 0.008*"chain"
2018-11-11 03:26:19,655 : INFO : topic #76 (0.028): 0.027*"farm" + 0.021*"say" + 0.020*"farmer" + 0.013*"grow" + 0.012*"year" + 0.009*"who" + 0.009*"but" + 0.007*"farming" + 0.007*"sell" + 0.006*"local"
2018-11-11 03:26:19,657 : INFO : topic #52 (0.034): 0.018*"what" + 0.016*"but" + 0.016*"about" + 0.016*"there" + 0.013*"people" + 0.013*"this" + 0.012*"think" + 0.011*"can" +

2018-11-11 03:27:04,143 : INFO : topic #61 (0.005): 0.051*"susan" + 0.025*"administrator" + 0.017*"sugar" + 0.015*"eat" + 0.012*"but" + 0.011*"fat" + 0.011*"body" + 0.010*"can" + 0.010*"add" + 0.009*"fruit"
2018-11-11 03:27:04,144 : INFO : topic #89 (0.005): 0.022*"coleman" + 0.020*"natural" + 0.018*"more" + 0.011*"healthy" + 0.011*"but" + 0.010*"worker" + 0.009*"than" + 0.009*"some" + 0.009*"need" + 0.008*"find"
2018-11-11 03:27:04,145 : INFO : topic #2 (0.034): 0.036*"store" + 0.027*"say" + 0.012*"grocery" + 0.011*"market" + 0.010*"will" + 0.010*"new" + 0.010*"more" + 0.009*"year" + 0.009*"customer" + 0.008*"chain"
2018-11-11 03:27:04,146 : INFO : topic #76 (0.034): 0.028*"farm" + 0.022*"say" + 0.020*"farmer" + 0.013*"grow" + 0.013*"year" + 0.009*"who" + 0.009*"but" + 0.007*"farming" + 0.007*"sell" + 0.006*"land"
2018-11-11 03:27:04,148 : INFO : topic #52 (0.056): 0.019*"what" + 0.017*"but" + 0.016*"about" + 0.016*"there" + 0.013*"this" + 0.013*"people" + 0.012*"think" + 0.011*"can" 

2018-11-11 03:27:42,960 : INFO : topic #89 (0.005): 0.023*"coleman" + 0.021*"natural" + 0.019*"more" + 0.012*"healthy" + 0.011*"worker" + 0.010*"but" + 0.009*"than" + 0.009*"some" + 0.009*"ranch" + 0.008*"find"
2018-11-11 03:27:42,962 : INFO : topic #61 (0.005): 0.053*"susan" + 0.026*"administrator" + 0.017*"sugar" + 0.016*"eat" + 0.012*"but" + 0.011*"fat" + 0.011*"body" + 0.010*"add" + 0.010*"can" + 0.009*"fruit"
2018-11-11 03:27:42,963 : INFO : topic #2 (0.040): 0.037*"store" + 0.027*"say" + 0.013*"grocery" + 0.011*"market" + 0.010*"will" + 0.010*"new" + 0.010*"more" + 0.009*"customer" + 0.009*"year" + 0.008*"chain"
2018-11-11 03:27:42,965 : INFO : topic #76 (0.040): 0.029*"farm" + 0.023*"say" + 0.020*"farmer" + 0.013*"year" + 0.013*"grow" + 0.010*"who" + 0.009*"but" + 0.007*"farming" + 0.007*"sell" + 0.006*"land"
2018-11-11 03:27:42,966 : INFO : topic #52 (0.084): 0.019*"what" + 0.018*"but" + 0.017*"about" + 0.016*"there" + 0.014*"this" + 0.013*"people" + 0.012*"can" + 0.012*"think"

2018-11-11 03:28:20,214 : INFO : topic #61 (0.005): 0.054*"susan" + 0.026*"administrator" + 0.017*"sugar" + 0.016*"eat" + 0.012*"but" + 0.011*"fat" + 0.011*"body" + 0.010*"add" + 0.010*"can" + 0.009*"fruit"
2018-11-11 03:28:20,215 : INFO : topic #89 (0.005): 0.024*"coleman" + 0.022*"natural" + 0.020*"more" + 0.012*"worker" + 0.012*"healthy" + 0.010*"than" + 0.009*"ranch" + 0.009*"some" + 0.009*"but" + 0.009*"employee"
2018-11-11 03:28:20,216 : INFO : topic #2 (0.044): 0.038*"store" + 0.027*"say" + 0.013*"grocery" + 0.011*"market" + 0.010*"will" + 0.010*"new" + 0.009*"more" + 0.009*"customer" + 0.008*"year" + 0.008*"chain"
2018-11-11 03:28:20,217 : INFO : topic #76 (0.045): 0.030*"farm" + 0.023*"say" + 0.020*"farmer" + 0.014*"year" + 0.013*"grow" + 0.010*"who" + 0.009*"but" + 0.007*"farming" + 0.007*"sell" + 0.007*"work"
2018-11-11 03:28:20,218 : INFO : topic #52 (0.111): 0.019*"what" + 0.018*"but" + 0.017*"about" + 0.017*"there" + 0.014*"this" + 0.013*"people" + 0.012*"can" + 0.012*"th

2018-11-11 03:28:53,106 : INFO : topic #61 (0.005): 0.054*"susan" + 0.027*"administrator" + 0.017*"sugar" + 0.016*"eat" + 0.013*"but" + 0.011*"fat" + 0.011*"add" + 0.011*"body" + 0.009*"can" + 0.009*"fruit"
2018-11-11 03:28:53,107 : INFO : topic #89 (0.005): 0.024*"coleman" + 0.022*"natural" + 0.020*"more" + 0.012*"worker" + 0.011*"healthy" + 0.010*"than" + 0.010*"ranch" + 0.009*"some" + 0.009*"employee" + 0.009*"but"
2018-11-11 03:28:53,108 : INFO : topic #2 (0.047): 0.039*"store" + 0.027*"say" + 0.013*"grocery" + 0.010*"market" + 0.010*"will" + 0.010*"new" + 0.009*"more" + 0.009*"customer" + 0.008*"chain" + 0.008*"year"
2018-11-11 03:28:53,109 : INFO : topic #76 (0.048): 0.031*"farm" + 0.023*"say" + 0.020*"farmer" + 0.014*"year" + 0.013*"grow" + 0.010*"who" + 0.009*"but" + 0.008*"farming" + 0.007*"sell" + 0.007*"work"
2018-11-11 03:28:53,110 : INFO : topic #52 (0.133): 0.020*"what" + 0.019*"but" + 0.017*"about" + 0.017*"there" + 0.014*"this" + 0.013*"people" + 0.012*"can" + 0.012*"al

2018-11-11 03:29:24,734 : INFO : topic #61 (0.004): 0.055*"susan" + 0.027*"administrator" + 0.017*"sugar" + 0.016*"eat" + 0.013*"but" + 0.011*"fat" + 0.011*"add" + 0.011*"body" + 0.009*"can" + 0.009*"say"
2018-11-11 03:29:24,735 : INFO : topic #89 (0.005): 0.025*"coleman" + 0.022*"natural" + 0.021*"more" + 0.013*"worker" + 0.011*"healthy" + 0.010*"ranch" + 0.010*"than" + 0.010*"employee" + 0.010*"some" + 0.009*"germ"
2018-11-11 03:29:24,736 : INFO : topic #2 (0.049): 0.040*"store" + 0.026*"say" + 0.014*"grocery" + 0.010*"market" + 0.010*"will" + 0.010*"new" + 0.009*"customer" + 0.009*"more" + 0.009*"chain" + 0.008*"year"
2018-11-11 03:29:24,737 : INFO : topic #76 (0.051): 0.031*"farm" + 0.024*"say" + 0.020*"farmer" + 0.014*"year" + 0.013*"grow" + 0.010*"who" + 0.009*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:29:24,738 : INFO : topic #52 (0.153): 0.020*"what" + 0.019*"but" + 0.017*"about" + 0.017*"there" + 0.014*"this" + 0.013*"people" + 0.012*"can" + 0.012*"all

2018-11-11 03:29:55,745 : INFO : topic #61 (0.004): 0.056*"susan" + 0.028*"administrator" + 0.018*"sugar" + 0.016*"eat" + 0.013*"but" + 0.011*"fat" + 0.011*"body" + 0.011*"add" + 0.009*"can" + 0.009*"fruit"
2018-11-11 03:29:55,746 : INFO : topic #89 (0.004): 0.025*"coleman" + 0.022*"natural" + 0.021*"more" + 0.013*"worker" + 0.011*"healthy" + 0.010*"ranch" + 0.010*"than" + 0.010*"employee" + 0.010*"some" + 0.009*"germ"
2018-11-11 03:29:55,747 : INFO : topic #76 (0.054): 0.032*"farm" + 0.024*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:29:55,748 : INFO : topic #13 (0.054): 0.059*"percent" + 0.051*"year" + 0.044*"sale" + 0.032*"consumer" + 0.031*"more" + 0.026*"say" + 0.023*"accord" + 0.023*"market" + 0.022*"than" + 0.018*"last"
2018-11-11 03:29:55,749 : INFO : topic #52 (0.170): 0.020*"what" + 0.019*"but" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"people" + 0.013*"can" + 0.012*

2018-11-11 03:30:25,700 : INFO : topic #61 (0.004): 0.057*"susan" + 0.028*"administrator" + 0.018*"sugar" + 0.016*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.009*"can" + 0.009*"say"
2018-11-11 03:30:25,701 : INFO : topic #89 (0.004): 0.025*"coleman" + 0.022*"natural" + 0.021*"more" + 0.013*"worker" + 0.011*"healthy" + 0.011*"ranch" + 0.010*"than" + 0.010*"some" + 0.010*"employee" + 0.009*"germ"
2018-11-11 03:30:25,702 : INFO : topic #76 (0.056): 0.032*"farm" + 0.024*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:30:25,702 : INFO : topic #13 (0.059): 0.059*"percent" + 0.052*"year" + 0.044*"sale" + 0.032*"consumer" + 0.032*"more" + 0.027*"say" + 0.023*"accord" + 0.023*"market" + 0.022*"than" + 0.018*"last"
2018-11-11 03:30:25,703 : INFO : topic #52 (0.186): 0.020*"what" + 0.020*"but" + 0.017*"about" + 0.017*"there" + 0.015*"this" + 0.013*"people" + 0.013*"can" + 0.012*"a

2018-11-11 03:30:54,590 : INFO : topic #61 (0.004): 0.057*"susan" + 0.028*"administrator" + 0.018*"sugar" + 0.016*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.009*"can" + 0.009*"fruit"
2018-11-11 03:30:54,591 : INFO : topic #89 (0.004): 0.025*"coleman" + 0.021*"natural" + 0.021*"more" + 0.013*"worker" + 0.011*"healthy" + 0.011*"ranch" + 0.010*"employee" + 0.010*"yield" + 0.010*"than" + 0.010*"some"
2018-11-11 03:30:54,592 : INFO : topic #76 (0.058): 0.033*"farm" + 0.024*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:30:54,593 : INFO : topic #13 (0.062): 0.060*"percent" + 0.052*"year" + 0.043*"sale" + 0.032*"more" + 0.032*"consumer" + 0.027*"say" + 0.023*"accord" + 0.023*"market" + 0.022*"than" + 0.019*"last"
2018-11-11 03:30:54,594 : INFO : topic #52 (0.201): 0.020*"what" + 0.020*"but" + 0.017*"about" + 0.017*"there" + 0.015*"this" + 0.013*"can" + 0.013*"people" + 0.012

2018-11-11 03:31:23,634 : INFO : topic #61 (0.004): 0.057*"susan" + 0.028*"administrator" + 0.018*"sugar" + 0.015*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.009*"can" + 0.009*"tea"
2018-11-11 03:31:23,635 : INFO : topic #89 (0.004): 0.025*"coleman" + 0.021*"natural" + 0.021*"more" + 0.013*"worker" + 0.011*"ranch" + 0.011*"healthy" + 0.011*"yield" + 0.010*"employee" + 0.010*"than" + 0.010*"some"
2018-11-11 03:31:23,636 : INFO : topic #76 (0.059): 0.033*"farm" + 0.024*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:31:23,638 : INFO : topic #13 (0.065): 0.060*"percent" + 0.052*"year" + 0.043*"sale" + 0.032*"more" + 0.032*"consumer" + 0.027*"say" + 0.024*"market" + 0.024*"accord" + 0.023*"than" + 0.019*"last"
2018-11-11 03:31:23,639 : INFO : topic #52 (0.220): 0.020*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"people" + 0.012*"

2018-11-11 03:31:53,800 : INFO : topic #61 (0.004): 0.057*"susan" + 0.028*"administrator" + 0.018*"sugar" + 0.015*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.010*"tea" + 0.009*"fruit"
2018-11-11 03:31:53,801 : INFO : topic #89 (0.004): 0.025*"coleman" + 0.021*"natural" + 0.021*"more" + 0.013*"worker" + 0.012*"ranch" + 0.011*"healthy" + 0.011*"yield" + 0.010*"employee" + 0.010*"than" + 0.010*"some"
2018-11-11 03:31:53,803 : INFO : topic #76 (0.060): 0.034*"farm" + 0.024*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:31:53,803 : INFO : topic #13 (0.067): 0.060*"percent" + 0.052*"year" + 0.043*"sale" + 0.032*"more" + 0.032*"consumer" + 0.028*"say" + 0.024*"market" + 0.024*"accord" + 0.023*"than" + 0.019*"last"
2018-11-11 03:31:53,805 : INFO : topic #52 (0.237): 0.020*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"people" + 0.012

2018-11-11 03:32:26,589 : INFO : topic #61 (0.004): 0.058*"susan" + 0.029*"administrator" + 0.017*"sugar" + 0.015*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.010*"tea" + 0.010*"fruit"
2018-11-11 03:32:26,590 : INFO : topic #89 (0.004): 0.025*"coleman" + 0.021*"natural" + 0.021*"more" + 0.013*"worker" + 0.011*"ranch" + 0.011*"yield" + 0.011*"healthy" + 0.010*"employee" + 0.010*"than" + 0.010*"some"
2018-11-11 03:32:26,591 : INFO : topic #76 (0.061): 0.034*"farm" + 0.025*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:32:26,592 : INFO : topic #13 (0.069): 0.060*"percent" + 0.053*"year" + 0.043*"sale" + 0.033*"more" + 0.031*"consumer" + 0.028*"say" + 0.024*"market" + 0.024*"accord" + 0.023*"than" + 0.019*"last"
2018-11-11 03:32:26,593 : INFO : topic #52 (0.257): 0.020*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"people" + 0.013

2018-11-11 03:32:58,176 : INFO : topic #61 (0.004): 0.058*"susan" + 0.029*"administrator" + 0.017*"sugar" + 0.014*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.010*"tea" + 0.010*"fruit"
2018-11-11 03:32:58,177 : INFO : topic #89 (0.004): 0.026*"coleman" + 0.021*"natural" + 0.021*"more" + 0.014*"worker" + 0.011*"yield" + 0.011*"ranch" + 0.011*"healthy" + 0.010*"employee" + 0.010*"than" + 0.010*"some"
2018-11-11 03:32:58,177 : INFO : topic #76 (0.062): 0.034*"farm" + 0.025*"say" + 0.019*"farmer" + 0.015*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:32:58,178 : INFO : topic #13 (0.071): 0.060*"percent" + 0.053*"year" + 0.043*"sale" + 0.033*"more" + 0.031*"consumer" + 0.028*"say" + 0.024*"market" + 0.024*"accord" + 0.023*"than" + 0.019*"last"
2018-11-11 03:32:58,179 : INFO : topic #52 (0.277): 0.021*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"all" + 0.013*"p

2018-11-11 03:33:28,618 : INFO : topic #61 (0.004): 0.058*"susan" + 0.029*"administrator" + 0.017*"sugar" + 0.014*"eat" + 0.012*"but" + 0.012*"fat" + 0.011*"body" + 0.011*"add" + 0.010*"tea" + 0.010*"fruit"
2018-11-11 03:33:28,618 : INFO : topic #89 (0.004): 0.026*"coleman" + 0.021*"more" + 0.021*"natural" + 0.014*"worker" + 0.011*"yield" + 0.011*"ranch" + 0.011*"healthy" + 0.010*"employee" + 0.010*"than" + 0.010*"some"
2018-11-11 03:33:28,619 : INFO : topic #76 (0.063): 0.034*"farm" + 0.025*"say" + 0.019*"farmer" + 0.016*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:33:28,620 : INFO : topic #13 (0.073): 0.061*"percent" + 0.053*"year" + 0.042*"sale" + 0.033*"more" + 0.031*"consumer" + 0.028*"say" + 0.024*"market" + 0.024*"accord" + 0.023*"than" + 0.019*"last"
2018-11-11 03:33:28,621 : INFO : topic #52 (0.297): 0.021*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"all" + 0.013*"p

2018-11-11 03:33:59,514 : INFO : topic #61 (0.004): 0.059*"susan" + 0.029*"administrator" + 0.017*"sugar" + 0.014*"eat" + 0.012*"but" + 0.011*"body" + 0.011*"add" + 0.010*"fat" + 0.010*"tea" + 0.010*"fruit"
2018-11-11 03:33:59,515 : INFO : topic #89 (0.004): 0.026*"coleman" + 0.021*"more" + 0.021*"natural" + 0.014*"worker" + 0.011*"yield" + 0.011*"ranch" + 0.010*"employee" + 0.010*"healthy" + 0.010*"healthcare" + 0.010*"than"
2018-11-11 03:33:59,515 : INFO : topic #76 (0.064): 0.034*"farm" + 0.025*"say" + 0.019*"farmer" + 0.016*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:33:59,516 : INFO : topic #13 (0.074): 0.061*"percent" + 0.053*"year" + 0.042*"sale" + 0.033*"more" + 0.031*"consumer" + 0.029*"say" + 0.024*"accord" + 0.024*"market" + 0.023*"than" + 0.019*"last"
2018-11-11 03:33:59,518 : INFO : topic #52 (0.319): 0.021*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"all" + 0.

2018-11-11 03:34:29,883 : INFO : topic #61 (0.004): 0.059*"susan" + 0.029*"administrator" + 0.017*"sugar" + 0.015*"eat" + 0.012*"but" + 0.011*"body" + 0.011*"add" + 0.010*"fruit" + 0.010*"tea" + 0.010*"vegetable"
2018-11-11 03:34:29,884 : INFO : topic #89 (0.004): 0.026*"coleman" + 0.022*"more" + 0.021*"natural" + 0.014*"worker" + 0.011*"yield" + 0.011*"ranch" + 0.011*"employee" + 0.010*"healthcare" + 0.010*"healthy" + 0.010*"than"
2018-11-11 03:34:29,885 : INFO : topic #76 (0.065): 0.035*"farm" + 0.025*"say" + 0.019*"farmer" + 0.016*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:34:29,886 : INFO : topic #13 (0.076): 0.061*"percent" + 0.053*"year" + 0.042*"sale" + 0.033*"more" + 0.031*"consumer" + 0.029*"say" + 0.024*"accord" + 0.024*"market" + 0.024*"than" + 0.019*"last"
2018-11-11 03:34:29,888 : INFO : topic #52 (0.343): 0.021*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"all

2018-11-11 03:34:59,230 : INFO : topic #61 (0.004): 0.060*"susan" + 0.029*"administrator" + 0.017*"sugar" + 0.015*"eat" + 0.012*"but" + 0.011*"body" + 0.011*"add" + 0.010*"fruit" + 0.010*"tea" + 0.010*"vegetable"
2018-11-11 03:34:59,231 : INFO : topic #89 (0.004): 0.026*"coleman" + 0.022*"more" + 0.021*"natural" + 0.014*"worker" + 0.012*"yield" + 0.011*"ranch" + 0.011*"employee" + 0.011*"healthcare" + 0.010*"than" + 0.010*"healthy"
2018-11-11 03:34:59,233 : INFO : topic #76 (0.066): 0.035*"farm" + 0.025*"say" + 0.019*"farmer" + 0.016*"year" + 0.013*"grow" + 0.010*"who" + 0.010*"but" + 0.008*"farming" + 0.008*"sell" + 0.007*"work"
2018-11-11 03:34:59,235 : INFO : topic #13 (0.077): 0.061*"percent" + 0.054*"year" + 0.042*"sale" + 0.034*"more" + 0.031*"consumer" + 0.029*"say" + 0.024*"accord" + 0.024*"market" + 0.024*"than" + 0.019*"last"
2018-11-11 03:34:59,236 : INFO : topic #52 (0.371): 0.021*"but" + 0.020*"what" + 0.017*"there" + 0.017*"about" + 0.015*"this" + 0.013*"can" + 0.013*"all