In [4]:
import sys
sys.path.append('../../..')
import src.data.data_loader as dl
from src.features.vectorizer import Vectorizer
from src.models.topic_models import TopicModel
import pandas as pd
import sklearn.utils as skutil
pd.set_option('display.max_rows', None)



In [5]:
# ---- Corpus selection -------------------------------------------------
# Both values are passed to the data loader and reused in output file names.
language = 'english'
typex = 'forum'

# ---- Vectorizer thresholds --------------------------------------------
# Handed to Vectorizer as min_df / max_df.
min_df = 0.005
max_df = 0.9

# ---- Topic model ------------------------------------------------------
algorithm = 'lda'            # used as prefix of the saved vectorizer / model files
num_topics = 110             # number of topics requested from TopicModel

train_percentage = 0.9       # share of shuffled documents used for training; the rest is the test split
alpha = 'auto'               # forwarded to TopicModel as alpha
eta = 0.01                   # forwarded to TopicModel as eta
iterations = 200             # forwarded to TopicModel as iterations
passes = 60                  # forwarded to TopicModel as passes
chunksize = 5000             # forwarded to TopicModel as chunksize

# Forwarded to TopicModel as decay (kappa) and offset (tau_0).
# NOTE(review): the training log looks like gensim's LdaModel, whose
# documentation gives decay in (0.5, 1] -- confirm that 0 is intended.
kappa = 0
tau_0 = 0

In [6]:
# Load the threads for the configured language / type ("wobigrams" variant)
# and keep the 'thread_texts' entry as the raw documents.
data = dl.get_forum_threads_by_language(language, typex, kind="wobigrams")
texts = data['thread_texts']

def min_length(texts, min_characters):
    """Remove short tokens from every document.

    Each document is split on whitespace; tokens shorter than
    ``min_characters`` are dropped and the remaining tokens are joined
    back together with single spaces.

    Parameters
    ----------
    texts : iterable of str
        Documents to filter.
    min_characters : int
        Minimum length (inclusive) a token needs in order to be kept.

    Returns
    -------
    list of str
        One filtered string per input document, in input order. A
        document without any sufficiently long token becomes ``""``.
    """
    return [
        " ".join(word for word in document.split() if len(word) >= min_characters)
        for document in texts
    ]

# Keep only tokens of at least three characters in every document.
texts = min_length(texts, min_characters=3)

In [7]:
# Build the vectorizer on the filtered texts ('tf' mode, presumably plain
# term frequencies -- confirm in src.features.vectorizer) and persist it.
vec = Vectorizer('tf', texts, min_df=min_df, max_df=max_df)
vec.save(
    '{}_{}_{}_{}.pkl'.format(algorithm, language, typex, "without_bigrams")
)

# Document/token matrix plus the id -> token lookup used by the topic model.
document_term_matrix = vec.get_document_token_matrix(texts)
id2token = vec.get_id2token_mapping()

In [8]:
# Shuffle the rows with a fixed random_state, then split them into a
# leading training part and a trailing test part.
# NOTE: this rebinds document_term_matrix, so re-running only this cell
# shuffles the already shuffled matrix; re-run the vectorization cell first.
document_term_matrix = skutil.shuffle(document_term_matrix, random_state=1)
num_docs, num_terms = document_term_matrix.shape

# Index of the first test row.
train = int(num_docs * train_percentage)
train_document_term_matrix = document_term_matrix[:train, :]
test_document_term_matrix = document_term_matrix[train:, :]

In [6]:
# Train the topic model on the training split; the held-out rows are passed
# along as test_document_term_matrix.
# The model type comes from the `algorithm` setting (previously a hard-coded
# 'lda'), so the trained model always matches the prefix of the file it is
# saved under.
model = TopicModel(
    algorithm,
    num_topics,
    train_document_term_matrix,
    id2token,
    alpha=alpha,
    eta=eta,
    iterations=iterations,
    passes=passes,
    chunksize=chunksize,
    test_document_term_matrix=test_document_term_matrix,
    decay=kappa,
    offset=tau_0,
)

# NOTE(review): with typex = 'forum' the file name contains "forum" twice
# (from typex and from the literal). Left unchanged so that existing code
# loading this file keeps working.
model.save('{}_{}_{}_{}_forum_{}.pkl'.format(algorithm, language, typex,"without_bigrams",num_topics))

2018-07-11 16:55:24,177 : INFO : using autotuned alpha, starting with [0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.009090909, 0.0090

2018-07-11 16:57:24,364 : INFO : topic #11 (0.008): 0.049*"gut" + 0.032*"food" + 0.027*"bacteria" + 0.018*"roundup" + 0.017*"pharma" + 0.016*"formation" + 0.015*"soil" + 0.015*"organic" + 0.015*"pepper" + 0.015*"gmo"
2018-07-11 16:57:24,365 : INFO : topic #104 (0.008): 0.065*"water" + 0.025*"chemical" + 0.022*"organic" + 0.021*"free" + 0.014*"natural" + 0.013*"algae" + 0.013*"bacteria" + 0.012*"crop" + 0.011*"stream" + 0.011*"gmo"
2018-07-11 16:57:24,366 : INFO : topic #96 (0.011): 0.059*"organic" + 0.032*"food" + 0.023*"product" + 0.018*"buy" + 0.014*"natural" + 0.010*"label" + 0.010*"store" + 0.010*"use" + 0.010*"make" + 0.009*"good"
2018-07-11 16:57:24,367 : INFO : topic #60 (0.012): 0.090*"organic" + 0.045*"food" + 0.016*"pesticide" + 0.012*"use" + 0.012*"produce" + 0.012*"good" + 0.009*"grow" + 0.008*"conventional" + 0.008*"non" + 0.008*"make"
2018-07-11 16:57:24,368 : INFO : topic #18 (0.013): 0.030*"food" + 0.017*"organic" + 0.012*"people" + 0.012*"gmo" + 0.010*"good" + 0.010*"j

2018-07-11 16:58:23,755 : INFO : topic #83 (0.007): 0.084*"india" + 0.031*"food" + 0.020*"gmo" + 0.019*"healthy" + 0.015*"pledge" + 0.014*"corner" + 0.013*"anybody" + 0.011*"suicide" + 0.011*"country" + 0.011*"choice"
2018-07-11 16:58:23,756 : INFO : topic #101 (0.007): 0.038*"read" + 0.035*"dr." + 0.032*"disease" + 0.027*"heart" + 0.024*"article" + 0.023*"diet" + 0.019*"study" + 0.014*"fat" + 0.013*"click" + 0.013*"cancer"
2018-07-11 16:58:23,757 : INFO : topic #96 (0.015): 0.057*"organic" + 0.029*"food" + 0.028*"product" + 0.023*"buy" + 0.019*"natural" + 0.014*"label" + 0.012*"store" + 0.011*"gmo" + 0.011*"make" + 0.011*"know"
2018-07-11 16:58:23,757 : INFO : topic #18 (0.019): 0.031*"food" + 0.017*"organic" + 0.014*"people" + 0.012*"gmo" + 0.011*"just" + 0.010*"make" + 0.010*"know" + 0.010*"good" + 0.009*"buy" + 0.009*"eat"
2018-07-11 16:58:23,758 : INFO : topic #60 (0.020): 0.112*"organic" + 0.055*"food" + 0.017*"pesticide" + 0.014*"produce" + 0.012*"use" + 0.011*"good" + 0.011*"gr

2018-07-11 16:59:14,161 : INFO : topic #42 (0.007): 0.033*"organic" + 0.023*"trade" + 0.017*"awareness" + 0.015*"fair" + 0.014*"source" + 0.013*"movement" + 0.012*"<url>" + 0.012*"fertilizer" + 0.012*"like" + 0.010*"label"
2018-07-11 16:59:14,162 : INFO : topic #84 (0.007): 0.017*"use" + 0.015*"climate" + 0.014*"<url>" + 0.012*"grow" + 0.012*"think" + 0.010*"change" + 0.009*"animal" + 0.008*"tom" + 0.008*"like" + 0.008*"article"
2018-07-11 16:59:14,164 : INFO : topic #96 (0.019): 0.056*"organic" + 0.030*"product" + 0.027*"food" + 0.025*"buy" + 0.023*"natural" + 0.015*"label" + 0.014*"company" + 0.013*"gmo" + 0.012*"know" + 0.012*"brand"
2018-07-11 16:59:14,165 : INFO : topic #18 (0.026): 0.029*"food" + 0.016*"organic" + 0.016*"people" + 0.013*"gmo" + 0.012*"just" + 0.011*"know" + 0.011*"make" + 0.010*"good" + 0.010*"buy" + 0.009*"eat"
2018-07-11 16:59:14,166 : INFO : topic #60 (0.034): 0.124*"organic" + 0.061*"food" + 0.017*"pesticide" + 0.015*"produce" + 0.012*"use" + 0.012*"grow" + 0

2018-07-11 17:00:01,809 : INFO : topic #42 (0.006): 0.034*"organic" + 0.018*"rural" + 0.015*"movement" + 0.014*"awareness" + 0.014*"refrigerator" + 0.012*"trade" + 0.012*"source" + 0.012*"<url>" + 0.012*"like" + 0.012*"cool"
2018-07-11 17:00:01,810 : INFO : topic #84 (0.006): 0.014*"<url>" + 0.013*"use" + 0.013*"think" + 0.013*"grow" + 0.012*"climate" + 0.009*"animal" + 0.009*"tom" + 0.009*"like" + 0.008*"article" + 0.008*"intensive"
2018-07-11 17:00:01,811 : INFO : topic #61 (0.023): 0.029*"farming" + 0.028*"organic" + 0.015*"use" + 0.014*"farm" + 0.013*"farmer" + 0.012*"land" + 0.011*"agriculture" + 0.011*"crop" + 0.011*"produce" + 0.009*"sustainable"
2018-07-11 17:00:01,812 : INFO : topic #18 (0.037): 0.028*"food" + 0.017*"people" + 0.016*"organic" + 0.013*"just" + 0.013*"gmo" + 0.011*"know" + 0.011*"make" + 0.010*"good" + 0.010*"buy" + 0.009*"eat"
2018-07-11 17:00:01,813 : INFO : topic #60 (0.052): 0.132*"organic" + 0.065*"food" + 0.017*"pesticide" + 0.015*"produce" + 0.012*"grow" 

2018-07-11 17:00:47,577 : INFO : topic #84 (0.006): 0.015*"<url>" + 0.013*"think" + 0.013*"grow" + 0.011*"benbrook" + 0.010*"use" + 0.009*"animal" + 0.009*"tom" + 0.009*"like" + 0.009*"article" + 0.008*"intensive"
2018-07-11 17:00:47,578 : INFO : topic #42 (0.006): 0.033*"organic" + 0.027*"rural" + 0.020*"cooperative" + 0.017*"refrigerator" + 0.015*"movement" + 0.014*"cool" + 0.014*"awareness" + 0.013*"<url>" + 0.013*"like" + 0.012*"extension"
2018-07-11 17:00:47,579 : INFO : topic #65 (0.029): 0.054*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.014*"eat" + 0.013*"price" + 0.013*"cost" + 0.013*"good" + 0.012*"make" + 0.012*"cheap"
2018-07-11 17:00:47,580 : INFO : topic #18 (0.049): 0.027*"food" + 0.017*"people" + 0.016*"organic" + 0.013*"just" + 0.012*"gmo" + 0.011*"know" + 0.011*"make" + 0.010*"good" + 0.010*"buy" + 0.009*"eat"
2018-07-11 17:00:47,581 : INFO : topic #60 (0.072): 0.138*"organic" + 0.068*"food" + 0.017*"pesticide" + 0.016*"produce" + 0.013*"grow" + 0.012*"

2018-07-11 17:01:30,547 : INFO : topic #20 (0.006): 0.049*"cabbage" + 0.026*"unit" + 0.020*"need" + 0.020*"cost" + 0.018*"sell" + 0.014*"market" + 0.014*"know" + 0.012*"make" + 0.009*"year" + 0.009*"today"
2018-07-11 17:01:30,549 : INFO : topic #84 (0.006): 0.024*"benbrook" + 0.015*"<url>" + 0.014*"think" + 0.014*"smell" + 0.014*"grow" + 0.010*"tom" + 0.010*"animal" + 0.009*"like" + 0.009*"article" + 0.009*"intensive"
2018-07-11 17:01:30,550 : INFO : topic #65 (0.037): 0.056*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.014*"eat" + 0.014*"cost" + 0.013*"price" + 0.013*"good" + 0.013*"make" + 0.013*"cheap"
2018-07-11 17:01:30,551 : INFO : topic #18 (0.061): 0.026*"food" + 0.018*"people" + 0.015*"organic" + 0.013*"just" + 0.011*"know" + 0.011*"make" + 0.011*"gmo" + 0.010*"good" + 0.010*"buy" + 0.009*"eat"
2018-07-11 17:01:30,552 : INFO : topic #60 (0.088): 0.142*"organic" + 0.069*"food" + 0.017*"pesticide" + 0.016*"produce" + 0.014*"grow" + 0.012*"use" + 0.012*"good" + 0.01

2018-07-11 17:02:12,460 : INFO : topic #20 (0.005): 0.050*"cabbage" + 0.027*"unit" + 0.020*"need" + 0.020*"cost" + 0.018*"sell" + 0.014*"market" + 0.013*"know" + 0.012*"make" + 0.009*"year" + 0.009*"today"
2018-07-11 17:02:12,461 : INFO : topic #84 (0.005): 0.034*"benbrook" + 0.017*"smell" + 0.016*"<url>" + 0.014*"think" + 0.014*"grow" + 0.010*"specialist" + 0.010*"like" + 0.010*"animal" + 0.010*"tom" + 0.009*"article"
2018-07-11 17:02:12,462 : INFO : topic #65 (0.044): 0.056*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.014*"cost" + 0.014*"price" + 0.014*"eat" + 0.013*"cheap" + 0.013*"make" + 0.013*"good"
2018-07-11 17:02:12,463 : INFO : topic #18 (0.073): 0.025*"food" + 0.018*"people" + 0.015*"organic" + 0.014*"just" + 0.011*"know" + 0.011*"make" + 0.010*"good" + 0.010*"gmo" + 0.010*"need" + 0.010*"eat"
2018-07-11 17:02:12,464 : INFO : topic #60 (0.100): 0.146*"organic" + 0.071*"food" + 0.017*"pesticide" + 0.016*"produce" + 0.014*"grow" + 0.012*"good" + 0.012*"use" + 0.

2018-07-11 17:02:51,061 : INFO : topic #20 (0.005): 0.051*"cabbage" + 0.027*"unit" + 0.020*"need" + 0.020*"cost" + 0.018*"sell" + 0.014*"market" + 0.013*"know" + 0.012*"make" + 0.009*"year" + 0.009*"today"
2018-07-11 17:02:51,062 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.018*"smell" + 0.016*"<url>" + 0.014*"think" + 0.014*"grow" + 0.011*"specialist" + 0.010*"like" + 0.010*"tom" + 0.010*"animal" + 0.009*"intensive"
2018-07-11 17:02:51,063 : INFO : topic #65 (0.050): 0.057*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.015*"cost" + 0.015*"price" + 0.014*"eat" + 0.013*"cheap" + 0.013*"make" + 0.012*"good"
2018-07-11 17:02:51,064 : INFO : topic #18 (0.082): 0.024*"food" + 0.019*"people" + 0.015*"organic" + 0.014*"just" + 0.012*"make" + 0.012*"know" + 0.010*"good" + 0.010*"need" + 0.010*"eat" + 0.009*"gmo"
2018-07-11 17:02:51,065 : INFO : topic #60 (0.109): 0.149*"organic" + 0.072*"food" + 0.017*"pesticide" + 0.017*"produce" + 0.014*"grow" + 0.012*"good" + 0.012*"non" + 

2018-07-11 17:03:27,839 : INFO : topic #20 (0.005): 0.051*"cabbage" + 0.027*"unit" + 0.020*"need" + 0.020*"cost" + 0.018*"sell" + 0.014*"market" + 0.013*"know" + 0.012*"make" + 0.010*"year" + 0.010*"acre"
2018-07-11 17:03:27,840 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.018*"smell" + 0.016*"<url>" + 0.015*"think" + 0.014*"grow" + 0.011*"specialist" + 0.010*"like" + 0.010*"tom" + 0.010*"animal" + 0.009*"intensive"
2018-07-11 17:03:27,840 : INFO : topic #65 (0.056): 0.057*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.015*"cost" + 0.015*"price" + 0.014*"eat" + 0.013*"cheap" + 0.013*"make" + 0.012*"good"
2018-07-11 17:03:27,841 : INFO : topic #18 (0.090): 0.023*"food" + 0.019*"people" + 0.015*"organic" + 0.014*"just" + 0.012*"make" + 0.012*"know" + 0.010*"good" + 0.010*"need" + 0.010*"eat" + 0.009*"buy"
2018-07-11 17:03:27,842 : INFO : topic #60 (0.116): 0.151*"organic" + 0.073*"food" + 0.017*"pesticide" + 0.017*"produce" + 0.015*"grow" + 0.012*"good" + 0.012*"non" + 0

2018-07-11 17:04:04,497 : INFO : topic #20 (0.005): 0.052*"cabbage" + 0.027*"unit" + 0.021*"need" + 0.019*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"make" + 0.010*"year" + 0.010*"acre"
2018-07-11 17:04:04,498 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.018*"smell" + 0.015*"think" + 0.014*"grow" + 0.012*"<url>" + 0.011*"specialist" + 0.010*"intensive" + 0.010*"like" + 0.010*"tom" + 0.010*"animal"
2018-07-11 17:04:04,499 : INFO : topic #65 (0.060): 0.057*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.015*"cost" + 0.015*"price" + 0.013*"eat" + 0.013*"cheap" + 0.013*"make" + 0.012*"good"
2018-07-11 17:04:04,500 : INFO : topic #18 (0.097): 0.023*"food" + 0.020*"people" + 0.015*"organic" + 0.014*"just" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.010*"need" + 0.010*"eat" + 0.009*"buy"
2018-07-11 17:04:04,501 : INFO : topic #60 (0.123): 0.153*"organic" + 0.073*"food" + 0.017*"pesticide" + 0.017*"produce" + 0.015*"grow" + 0.013*"good" + 0.012*"non" + 0

2018-07-11 17:04:40,804 : INFO : topic #20 (0.005): 0.052*"cabbage" + 0.027*"unit" + 0.021*"need" + 0.019*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"make" + 0.010*"year" + 0.010*"acre"
2018-07-11 17:04:40,805 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.018*"smell" + 0.015*"think" + 0.014*"grow" + 0.011*"intensive" + 0.011*"specialist" + 0.010*"dust" + 0.010*"like" + 0.010*"tom" + 0.010*"animal"
2018-07-11 17:04:40,806 : INFO : topic #65 (0.064): 0.057*"food" + 0.029*"organic" + 0.023*"buy" + 0.018*"people" + 0.016*"cost" + 0.016*"price" + 0.014*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:04:40,807 : INFO : topic #18 (0.104): 0.022*"food" + 0.020*"people" + 0.015*"just" + 0.014*"organic" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.010*"need" + 0.010*"eat" + 0.009*"like"
2018-07-11 17:04:40,808 : INFO : topic #60 (0.130): 0.155*"organic" + 0.073*"food" + 0.017*"produce" + 0.017*"pesticide" + 0.015*"grow" + 0.013*"good" + 0.012*"non" + 0

2018-07-11 17:05:17,046 : INFO : topic #20 (0.005): 0.053*"cabbage" + 0.028*"unit" + 0.021*"need" + 0.019*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"make" + 0.010*"year" + 0.010*"acre"
2018-07-11 17:05:17,047 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.018*"smell" + 0.015*"think" + 0.015*"grow" + 0.012*"dust" + 0.012*"specialist" + 0.011*"intensive" + 0.010*"like" + 0.010*"tom" + 0.009*"animal"
2018-07-11 17:05:17,048 : INFO : topic #65 (0.067): 0.057*"food" + 0.028*"organic" + 0.024*"buy" + 0.018*"people" + 0.016*"cost" + 0.016*"price" + 0.014*"make" + 0.014*"cheap" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:05:17,049 : INFO : topic #18 (0.110): 0.022*"food" + 0.020*"people" + 0.015*"just" + 0.014*"organic" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.011*"need" + 0.010*"eat" + 0.009*"like"
2018-07-11 17:05:17,050 : INFO : topic #60 (0.137): 0.157*"organic" + 0.073*"food" + 0.017*"produce" + 0.017*"pesticide" + 0.015*"grow" + 0.013*"good" + 0.012*"non" + 0

2018-07-11 17:05:51,611 : INFO : topic #20 (0.004): 0.054*"cabbage" + 0.028*"unit" + 0.021*"need" + 0.019*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"make" + 0.010*"year" + 0.010*"acre"
2018-07-11 17:05:51,612 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.019*"smell" + 0.015*"think" + 0.015*"grow" + 0.013*"specialist" + 0.012*"dust" + 0.011*"author" + 0.011*"intensive" + 0.010*"like" + 0.010*"tom"
2018-07-11 17:05:51,613 : INFO : topic #65 (0.070): 0.057*"food" + 0.028*"organic" + 0.024*"buy" + 0.018*"people" + 0.016*"price" + 0.016*"cost" + 0.014*"make" + 0.014*"cheap" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:05:51,614 : INFO : topic #18 (0.115): 0.021*"food" + 0.020*"people" + 0.015*"just" + 0.014*"organic" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.011*"need" + 0.010*"eat" + 0.009*"like"
2018-07-11 17:05:51,615 : INFO : topic #60 (0.143): 0.158*"organic" + 0.073*"food" + 0.017*"produce" + 0.017*"pesticide" + 0.015*"grow" + 0.013*"good" + 0.012*"non" + 0

2018-07-11 17:06:24,888 : INFO : topic #20 (0.004): 0.053*"cabbage" + 0.028*"unit" + 0.021*"need" + 0.018*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"make" + 0.011*"acre" + 0.011*"rally"
2018-07-11 17:06:24,888 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.019*"smell" + 0.015*"grow" + 0.015*"think" + 0.013*"dust" + 0.013*"author" + 0.013*"specialist" + 0.011*"intensive" + 0.010*"like" + 0.010*"tom"
2018-07-11 17:06:24,889 : INFO : topic #65 (0.073): 0.056*"food" + 0.027*"organic" + 0.024*"buy" + 0.018*"people" + 0.017*"price" + 0.017*"cost" + 0.014*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:06:24,890 : INFO : topic #18 (0.119): 0.021*"food" + 0.021*"people" + 0.015*"just" + 0.014*"organic" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.011*"need" + 0.010*"eat" + 0.009*"like"
2018-07-11 17:06:24,892 : INFO : topic #60 (0.148): 0.160*"organic" + 0.072*"food" + 0.017*"pesticide" + 0.017*"produce" + 0.015*"grow" + 0.013*"good" + 0.012*"non" + 

2018-07-11 17:06:57,452 : INFO : topic #20 (0.004): 0.054*"cabbage" + 0.028*"unit" + 0.021*"need" + 0.018*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"rally" + 0.011*"acre" + 0.011*"make"
2018-07-11 17:06:57,453 : INFO : topic #84 (0.005): 0.039*"benbrook" + 0.019*"smell" + 0.015*"think" + 0.015*"grow" + 0.014*"author" + 0.013*"dust" + 0.013*"specialist" + 0.011*"intensive" + 0.010*"like" + 0.010*"tom"
2018-07-11 17:06:57,455 : INFO : topic #65 (0.075): 0.055*"food" + 0.027*"organic" + 0.024*"buy" + 0.018*"people" + 0.017*"price" + 0.017*"cost" + 0.014*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:06:57,456 : INFO : topic #18 (0.124): 0.021*"people" + 0.020*"food" + 0.015*"just" + 0.014*"organic" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.011*"need" + 0.010*"eat" + 0.010*"like"
2018-07-11 17:06:57,457 : INFO : topic #60 (0.152): 0.162*"organic" + 0.070*"food" + 0.018*"pesticide" + 0.017*"produce" + 0.015*"grow" + 0.014*"good" + 0.012*"non" + 

2018-07-11 17:07:30,844 : INFO : topic #20 (0.004): 0.055*"cabbage" + 0.028*"unit" + 0.021*"need" + 0.018*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"rally" + 0.012*"acre" + 0.011*"make"
2018-07-11 17:07:30,845 : INFO : topic #84 (0.005): 0.038*"benbrook" + 0.019*"smell" + 0.015*"think" + 0.015*"grow" + 0.014*"author" + 0.013*"dust" + 0.012*"specialist" + 0.011*"like" + 0.010*"intensive" + 0.010*"pig"
2018-07-11 17:07:30,846 : INFO : topic #65 (0.077): 0.054*"food" + 0.026*"organic" + 0.024*"buy" + 0.018*"people" + 0.017*"price" + 0.017*"cost" + 0.014*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:07:30,846 : INFO : topic #18 (0.129): 0.021*"people" + 0.019*"food" + 0.015*"just" + 0.013*"organic" + 0.012*"make" + 0.012*"know" + 0.011*"good" + 0.011*"need" + 0.010*"like" + 0.010*"eat"
2018-07-11 17:07:30,847 : INFO : topic #60 (0.155): 0.163*"organic" + 0.067*"food" + 0.018*"pesticide" + 0.017*"produce" + 0.015*"grow" + 0.014*"good" + 0.012*"non" + 

2018-07-11 17:08:04,643 : INFO : topic #20 (0.004): 0.055*"cabbage" + 0.028*"unit" + 0.021*"need" + 0.018*"cost" + 0.018*"sell" + 0.015*"market" + 0.014*"know" + 0.012*"rally" + 0.012*"make" + 0.012*"acre"
2018-07-11 17:08:04,644 : INFO : topic #84 (0.005): 0.037*"benbrook" + 0.019*"smell" + 0.016*"think" + 0.016*"grow" + 0.015*"pig" + 0.014*"author" + 0.013*"specialist" + 0.013*"dust" + 0.010*"like" + 0.009*"farming"
2018-07-11 17:08:04,645 : INFO : topic #65 (0.078): 0.052*"food" + 0.026*"organic" + 0.024*"buy" + 0.018*"people" + 0.018*"price" + 0.017*"cost" + 0.014*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:08:04,646 : INFO : topic #18 (0.134): 0.021*"people" + 0.019*"food" + 0.016*"just" + 0.013*"organic" + 0.013*"make" + 0.012*"know" + 0.011*"good" + 0.011*"need" + 0.010*"like" + 0.010*"eat"
2018-07-11 17:08:04,647 : INFO : topic #60 (0.158): 0.165*"organic" + 0.065*"food" + 0.018*"pesticide" + 0.018*"produce" + 0.015*"grow" + 0.014*"good" + 0.012*"non" + 0.

2018-07-11 17:08:37,470 : INFO : topic #84 (0.005): 0.036*"benbrook" + 0.022*"pig" + 0.018*"smell" + 0.016*"grow" + 0.016*"think" + 0.014*"author" + 0.013*"specialist" + 0.013*"dust" + 0.010*"like" + 0.010*"link"
2018-07-11 17:08:37,471 : INFO : topic #65 (0.080): 0.051*"food" + 0.025*"organic" + 0.024*"buy" + 0.018*"price" + 0.018*"people" + 0.017*"cost" + 0.014*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:08:37,473 : INFO : topic #18 (0.138): 0.021*"people" + 0.018*"food" + 0.016*"just" + 0.013*"make" + 0.013*"organic" + 0.013*"know" + 0.011*"good" + 0.011*"need" + 0.010*"like" + 0.010*"eat"
2018-07-11 17:08:37,474 : INFO : topic #60 (0.162): 0.166*"organic" + 0.062*"food" + 0.018*"pesticide" + 0.018*"produce" + 0.016*"grow" + 0.014*"good" + 0.013*"non" + 0.012*"conventional" + 0.011*"chemical" + 0.011*"use"
2018-07-11 17:08:37,480 : INFO : topic diff=inf, rho=1.000000
2018-07-11 17:08:39,437 : INFO : Epoch 53: perplexity estimate: 497.3752768683296
2018-07-11 17

2018-07-11 17:09:05,088 : INFO : topic #65 (0.082): 0.049*"food" + 0.024*"organic" + 0.024*"buy" + 0.018*"price" + 0.018*"cost" + 0.018*"people" + 0.015*"cheap" + 0.014*"make" + 0.013*"eat" + 0.012*"good"
2018-07-11 17:09:05,089 : INFO : topic #18 (0.142): 0.022*"people" + 0.017*"food" + 0.016*"just" + 0.013*"make" + 0.013*"know" + 0.012*"organic" + 0.012*"good" + 0.011*"need" + 0.010*"like" + 0.010*"eat"
2018-07-11 17:09:05,090 : INFO : topic #60 (0.165): 0.168*"organic" + 0.059*"food" + 0.018*"pesticide" + 0.018*"produce" + 0.016*"grow" + 0.014*"good" + 0.013*"non" + 0.012*"conventional" + 0.011*"chemical" + 0.011*"use"
2018-07-11 17:09:05,093 : INFO : topic diff=inf, rho=1.000000
2018-07-11 17:09:06,634 : INFO : Epoch 56: perplexity estimate: 492.0184436802451
2018-07-11 17:09:06,747 : INFO : PROGRESS: pass 57, at document #2946/2946
2018-07-11 17:09:14,202 : INFO : optimized alpha [0.013803174, 0.03250655, 0.022858297, 0.023805512, 0.009421615, 0.025532134, 0.0066961744, 0.03133627

2018-07-11 17:09:32,329 : INFO : topic #35 (0.087): 0.573*"food" + 0.040*"healthy" + 0.025*"people" + 0.023*"restaurant" + 0.016*"fast" + 0.014*"industry" + 0.014*"question" + 0.010*"large" + 0.010*"way" + 0.009*"serve"
2018-07-11 17:09:32,330 : INFO : topic #18 (0.146): 0.022*"people" + 0.017*"food" + 0.016*"just" + 0.013*"make" + 0.013*"know" + 0.012*"organic" + 0.012*"good" + 0.011*"need" + 0.010*"like" + 0.010*"eat"
2018-07-11 17:09:32,331 : INFO : topic #60 (0.168): 0.169*"organic" + 0.057*"food" + 0.018*"pesticide" + 0.018*"produce" + 0.016*"grow" + 0.014*"good" + 0.013*"non" + 0.012*"conventional" + 0.011*"chemical" + 0.011*"use"
2018-07-11 17:09:32,335 : INFO : topic diff=inf, rho=1.000000
2018-07-11 17:09:33,850 : INFO : Epoch 59: perplexity estimate: 487.1607924852777
