In [96]:
%run load_helper.ipynb
import statsmodels.api as sm
from statsmodels.tsa.stattools import grangercausalitytests
import numpy as np


# ##################################################
#             SET PARAMETERS
#
# pick a baseline
#        baselines = ["10topics", "15topics", "20topics", "25topics", "30topics"]
#
# name your run (used to store the iterations); models will be saved myrun1.sav myrun2.save etc
#
# set your parameters
#
# ##################################################
runname = "initialrun"
mybaseline = "20topics"

# below are default params that can be played with
num_buffers = 5    # how many buffers to add each iteration
lda_decay = .5     # how much the prior influences the iteration 0 - 1 
num_iterations = 1 # the article used 5

# lag of 5 is mentioned in the paper, and seems to work the best with trial runs
the_lag = 5


# ##################################################
#
# The ITMFT algorithm
#
#  Run cell 1
#  and either cell 2 (to create a baseline)
#      or cell 3 to load the baseline
# ##################################################
file_name = save_path + mybaseline + ".sav"
model = LdaModel.load(file_name)
    

iteration = 0
oldsignificanttopics = 0
significanttopcs = 1

while iteration < num_iterations and significanttopcs > oldsignificanttopics :
    topics = model.get_topics()
    num_topics = len(topics)
    
    # create a topic coverage matrix preset to 0
    topiccoverage = []
    i = 0
    while i < len(docs_per_timeslice) :
        y = 0
        thistopic = []
        while y < num_topics:
            thistopic.append(0.0)
            y += 1
        topiccoverage.append(thistopic)
        i += 1
            
    # get the topic coverage per timeslice per doc
    timeslice = 0
    for timeslicedocs in docs_per_timeslice :
        # for each doc in this timeslice
        for doc in timeslicedocs :
            # get the probability matrix
            probs = model.get_document_topics(bow[doc])
            #its a sparse array, prob[0] is the topic and prob[1] is the probabiltiy
            for prob in probs :
                topiccoverage[timeslice][prob[0]] += prob[1]
        timeslice += 1
        
    newtopics = []
    # ##################################################
    # INPUT:
    # timeslicetokencounts - we have the word coverage for each model token
    # topiccoverage - and now we have the topic coverage
    # topics - the current topic word probabilities
    #
    # OUTPUT:
    # updated array newtopics = []
    #
    # run the iteration
    # ##################################################
    bets = [] 
    with open(".\\LDA_data\\betdataclean.csv") as swf:
        for line in swf:
            bets.append(np.longdouble(float(line)))

    swf.close()
    
    ii = 0
    
    high_threshold = .95
    hightopicsgc = []
    hightopics = []
    highlags = []
    low_threshold = .05
    lowtopicsgc = []
    lowtopics = []
    lowlags = []
    while ii < num_topics :
        tempgc = grangercausalitytests([[bets[i],topiccoverage[i][ii]] for i in range(0, len(bets))], the_lag, verbose=False)
        #sigtopicsgc.append(tempgc)
        highpvalue = 0
        highlag = 0
        lowpvalue = 2
        lowlag = 0
        for yy in range(1,5) :
            stats = tempgc.get(yy)[0].get('ssr_ftest')
            if (stats[1] > highpvalue) :
                highlag = yy
                highpvalue = stats[1]
            if (stats[1] < lowpvalue) :
                lowlag = yy
                lowpvalue = stats[1]
        if highpvalue > high_threshold :
            highlags.append(highlag)
            hightopics.append(ii)
            hightopicsgc.append(tempgc.get(highlag)[0].get('ssr_ftest'))
        if lowpvalue < low_threshold :
            lowlags.append(lowlag)
            lowtopics.append(ii)
            lowtopicsgc.append(tempgc.get(lowlag)[0].get('ssr_ftest'))
        """ 
        for yy in range(1, 5) :
            stats = tempgc.get(yy)[0].get('ssr_ftest')
            if stats[1] < sig_threshold :
                sigtopics.append(ii)  # save the topic number
                sigtopicsgc.append(stats)
                break                
        """
        ii += 1
    print(hightopics)
    print(lowtopics)
    #print(siggc)
    
    """ 
    sigwordsgc = []
    sigwords = []
    while ii < num_words :
        tempgc = grangercausalitytests([[bets[i], timeslicetokencounts[i][ii]] for i in range(0, len(bets))], 5, verbose=False)
        for yy in range(1, 5) :
            stats = tempgc.get(yy)[0].get('ssr_ftest')
            if stats[1] > sig_threshold :
                sigwords.append(ii)  # save the topic number
                sigwordsgc.append(stats)
                break                
        ii += 1
    print(sigwords)
    """
    #%run ITMTF_iterate.ipynb

    break 
    # ##################################################
    #
    # using the returned topics probabilies
    # and adding buffers - num_buffers using bufferprob
    # create the prior
    # update num_topics
    # and run the model
    # ##################################################
    
    #$$$ remove this, for now just creating a topic prob list of X from old model as the return
    topics = model.get_topics()
    print(len(topics))
    for topic in topics :
        newtopics.append(topic)
        
    #$$$ remove this, for now just creating a topic prob list of X from old model as the return
        
    # add the buffers
    z = 0
    while z < num_buffers:
        newtopics.append(bufferprob)
        z += 1
    num_topics = len(newtopics)

    now = datetime.now()
    current_time = now.strftime("%H:%M:%S")
    print("Iteration start timee =", current_time)
    model = LdaModel(
        corpus=corpus,
        id2word=tokentoword,
        chunksize=chunksize,
        alpha='auto',               
        eta=newtopics,                 # preset topic/word
        iterations=iterations,
        num_topics=num_topics,         # added buffer topics
        passes=passes,
        decay = lda_decay,
        eval_every=eval_every
    )

    file_name = runname + str(iteration) 
    path_name = save_path + file_name + ".sav"
    print(file_name + " - saved for visualization")
    model.save(path_name )
 
    now = datetime.now()
    current_time = now.strftime("%H:%M:%S")
    print("Iteration Complete = ", current_time)

    iteration += 1
print("Run Complete ")


Number of time slices with docs: 123
Number of time slices: 123
Number of time vocab: 12517
Size of doctokens: 2673
Number of documents: 2673
12517
Number of unique tokens: 12517
[]
[0, 6, 7, 8, 10, 11, 14]
Run Complete 


In [90]:
from scipy.stats import pearsonr
# calculate Pearson's correlation
print (len(bets))
print(bets[0].dtype)
trans = np.array(timeslicetokencounts).transpose()
wordcorr = []
print (len(trans[1]))
print (len(timeslicetokencounts[1]))
for yy in range(0,num_words) :
    corr, _ = pearsonr(bets, trans[yy])
    wordcorr.append(corr)
    print('Pearsons correlation: %.3f' % corr)

123
float64
123
12517
Pearsons correlation: -0.167
Pearsons correlation: 0.018
Pearsons correlation: -0.079
Pearsons correlation: 0.001
Pearsons correlation: 0.058
Pearsons correlation: 0.015
Pearsons correlation: 0.021
Pearsons correlation: 0.044
Pearsons correlation: 0.021
Pearsons correlation: 0.052
Pearsons correlation: 0.007
Pearsons correlation: -0.111
Pearsons correlation: -0.297
Pearsons correlation: -0.028
Pearsons correlation: -0.041
Pearsons correlation: -0.062
Pearsons correlation: 0.168
Pearsons correlation: 0.052
Pearsons correlation: 0.069
Pearsons correlation: 0.081
Pearsons correlation: -0.039
Pearsons correlation: -0.174
Pearsons correlation: 0.067
Pearsons correlation: -0.137
Pearsons correlation: 0.090
Pearsons correlation: -0.078
Pearsons correlation: -0.055
Pearsons correlation: 0.069
Pearsons correlation: 0.077
Pearsons correlation: -0.016
Pearsons correlation: -0.111
Pearsons correlation: -0.078
Pearsons correlation: 0.058
Pearsons correlation: -0.025
Pearsons c

Pearsons correlation: 0.013
Pearsons correlation: 0.039
Pearsons correlation: -0.155
Pearsons correlation: -0.060
Pearsons correlation: 0.152
Pearsons correlation: 0.065
Pearsons correlation: -0.091
Pearsons correlation: 0.027
Pearsons correlation: -0.103
Pearsons correlation: 0.039
Pearsons correlation: -0.112
Pearsons correlation: -0.254
Pearsons correlation: -0.112
Pearsons correlation: -0.008
Pearsons correlation: -0.109
Pearsons correlation: -0.012
Pearsons correlation: 0.013
Pearsons correlation: 0.027
Pearsons correlation: -0.254
Pearsons correlation: -0.091
Pearsons correlation: -0.008
Pearsons correlation: -0.090
Pearsons correlation: -0.060
Pearsons correlation: 0.212
Pearsons correlation: -0.002
Pearsons correlation: -0.002
Pearsons correlation: 0.212
Pearsons correlation: 0.225
Pearsons correlation: -0.075
Pearsons correlation: -0.002
Pearsons correlation: -0.151
Pearsons correlation: -0.001
Pearsons correlation: -0.030
Pearsons correlation: -0.075
Pearsons correlation: -0.

Pearsons correlation: -0.042
Pearsons correlation: 0.126
Pearsons correlation: -0.096
Pearsons correlation: 0.209
Pearsons correlation: -0.035
Pearsons correlation: 0.169
Pearsons correlation: -0.333
Pearsons correlation: 0.060
Pearsons correlation: 0.209
Pearsons correlation: 0.025
Pearsons correlation: -0.096
Pearsons correlation: 0.072
Pearsons correlation: -0.028
Pearsons correlation: -0.283
Pearsons correlation: 0.031
Pearsons correlation: 0.031
Pearsons correlation: 0.060
Pearsons correlation: -0.043
Pearsons correlation: -0.028
Pearsons correlation: 0.031
Pearsons correlation: -0.028
Pearsons correlation: -0.042
Pearsons correlation: -0.042
Pearsons correlation: -0.122
Pearsons correlation: -0.028
Pearsons correlation: 0.060
Pearsons correlation: -0.053
Pearsons correlation: 0.031
Pearsons correlation: 0.169
Pearsons correlation: 0.332
Pearsons correlation: -0.255
Pearsons correlation: -0.076
Pearsons correlation: -0.091
Pearsons correlation: 0.174
Pearsons correlation: -0.006
P

Pearsons correlation: -0.033
Pearsons correlation: -0.012
Pearsons correlation: -0.081
Pearsons correlation: 0.002
Pearsons correlation: -0.202
Pearsons correlation: -0.101
Pearsons correlation: -0.080
Pearsons correlation: 0.061
Pearsons correlation: -0.034
Pearsons correlation: -0.080
Pearsons correlation: -0.155
Pearsons correlation: -0.110
Pearsons correlation: -0.075
Pearsons correlation: -0.094
Pearsons correlation: -0.087
Pearsons correlation: -0.071
Pearsons correlation: 0.006
Pearsons correlation: -0.075
Pearsons correlation: -0.094
Pearsons correlation: -0.080
Pearsons correlation: -0.186
Pearsons correlation: -0.012
Pearsons correlation: -0.186
Pearsons correlation: -0.110
Pearsons correlation: -0.101
Pearsons correlation: -0.071
Pearsons correlation: -0.087
Pearsons correlation: -0.071
Pearsons correlation: -0.202
Pearsons correlation: -0.155
Pearsons correlation: -0.012
Pearsons correlation: -0.155
Pearsons correlation: 0.061
Pearsons correlation: -0.101
Pearsons correlati

Pearsons correlation: -0.217
Pearsons correlation: 0.029
Pearsons correlation: -0.297
Pearsons correlation: -0.015
Pearsons correlation: -0.211
Pearsons correlation: -0.212
Pearsons correlation: -0.075
Pearsons correlation: -0.044
Pearsons correlation: -0.111
Pearsons correlation: 0.050
Pearsons correlation: -0.183
Pearsons correlation: -0.080
Pearsons correlation: -0.092
Pearsons correlation: -0.100
Pearsons correlation: 0.144
Pearsons correlation: -0.085
Pearsons correlation: -0.015
Pearsons correlation: 0.050
Pearsons correlation: -0.186
Pearsons correlation: 0.092
Pearsons correlation: -0.042
Pearsons correlation: -0.075
Pearsons correlation: -0.109
Pearsons correlation: -0.077
Pearsons correlation: 0.052
Pearsons correlation: -0.015
Pearsons correlation: 0.001
Pearsons correlation: -0.211
Pearsons correlation: -0.032
Pearsons correlation: -0.140
Pearsons correlation: -0.002
Pearsons correlation: 0.029
Pearsons correlation: -0.073
Pearsons correlation: -0.077
Pearsons correlation: 

Pearsons correlation: 0.037
Pearsons correlation: 0.068
Pearsons correlation: -0.154
Pearsons correlation: 0.083
Pearsons correlation: -0.096
Pearsons correlation: -0.068
Pearsons correlation: -0.198
Pearsons correlation: 0.037
Pearsons correlation: 0.020
Pearsons correlation: 0.083
Pearsons correlation: 0.159
Pearsons correlation: -0.198
Pearsons correlation: -0.026
Pearsons correlation: -0.026
Pearsons correlation: -0.096
Pearsons correlation: 0.047
Pearsons correlation: 0.068
Pearsons correlation: -0.007
Pearsons correlation: -0.026
Pearsons correlation: -0.153
Pearsons correlation: 0.068
Pearsons correlation: -0.063
Pearsons correlation: -0.089
Pearsons correlation: 0.159
Pearsons correlation: -0.064
Pearsons correlation: -0.110
Pearsons correlation: -0.068
Pearsons correlation: 0.014
Pearsons correlation: -0.119
Pearsons correlation: -0.070
Pearsons correlation: 0.056
Pearsons correlation: -0.001
Pearsons correlation: -0.039
Pearsons correlation: 0.060
Pearsons correlation: -0.001

Pearsons correlation: -0.021
Pearsons correlation: -0.046
Pearsons correlation: -0.071
Pearsons correlation: -0.106
Pearsons correlation: -0.084
Pearsons correlation: -0.085
Pearsons correlation: 0.051
Pearsons correlation: -0.239
Pearsons correlation: -0.002
Pearsons correlation: -0.024
Pearsons correlation: 0.099
Pearsons correlation: -0.146
Pearsons correlation: 0.020
Pearsons correlation: -0.044
Pearsons correlation: -0.143
Pearsons correlation: -0.071
Pearsons correlation: -0.132
Pearsons correlation: -0.063
Pearsons correlation: 0.007
Pearsons correlation: 0.061
Pearsons correlation: -0.162
Pearsons correlation: -0.063
Pearsons correlation: -0.239
Pearsons correlation: -0.076
Pearsons correlation: 0.001
Pearsons correlation: -0.078
Pearsons correlation: -0.092
Pearsons correlation: -0.061
Pearsons correlation: -0.084
Pearsons correlation: -0.169
Pearsons correlation: -0.095
Pearsons correlation: 0.009
Pearsons correlation: 0.009
Pearsons correlation: 0.004
Pearsons correlation: 0

Pearsons correlation: 0.071
Pearsons correlation: 0.129
Pearsons correlation: -0.099
Pearsons correlation: 0.181
Pearsons correlation: 0.144
Pearsons correlation: -0.033
Pearsons correlation: -0.081
Pearsons correlation: -0.133
Pearsons correlation: -0.186
Pearsons correlation: 0.181
Pearsons correlation: -0.186
Pearsons correlation: 0.071
Pearsons correlation: 0.028
Pearsons correlation: -0.133
Pearsons correlation: 0.144
Pearsons correlation: -0.133
Pearsons correlation: 0.129
Pearsons correlation: -0.186
Pearsons correlation: -0.135
Pearsons correlation: -0.186
Pearsons correlation: 0.019
Pearsons correlation: -0.107
Pearsons correlation: -0.023
Pearsons correlation: 0.053
Pearsons correlation: 0.059
Pearsons correlation: -0.389
Pearsons correlation: 0.016
Pearsons correlation: -0.365
Pearsons correlation: -0.074
Pearsons correlation: 0.086
Pearsons correlation: -0.094
Pearsons correlation: 0.016
Pearsons correlation: 0.045
Pearsons correlation: -0.000
Pearsons correlation: -0.000
P

Pearsons correlation: -0.074
Pearsons correlation: -0.065
Pearsons correlation: -0.036
Pearsons correlation: -0.084
Pearsons correlation: -0.101
Pearsons correlation: -0.050
Pearsons correlation: -0.104
Pearsons correlation: -0.076
Pearsons correlation: -0.092
Pearsons correlation: 0.110
Pearsons correlation: 0.149
Pearsons correlation: -0.079
Pearsons correlation: -0.086
Pearsons correlation: -0.072
Pearsons correlation: -0.084
Pearsons correlation: -0.161
Pearsons correlation: -0.068
Pearsons correlation: -0.077
Pearsons correlation: -0.008
Pearsons correlation: -0.121
Pearsons correlation: -0.072
Pearsons correlation: 0.032
Pearsons correlation: 0.034
Pearsons correlation: -0.080
Pearsons correlation: -0.051
Pearsons correlation: -0.054
Pearsons correlation: -0.079
Pearsons correlation: -0.053
Pearsons correlation: -0.071
Pearsons correlation: 0.009
Pearsons correlation: -0.127
Pearsons correlation: -0.078
Pearsons correlation: -0.067
Pearsons correlation: -0.071
Pearsons correlatio

Pearsons correlation: -0.080
Pearsons correlation: 0.032
Pearsons correlation: -0.021
Pearsons correlation: 0.072
Pearsons correlation: -0.132
Pearsons correlation: -0.022
Pearsons correlation: -0.080
Pearsons correlation: -0.020
Pearsons correlation: -0.052
Pearsons correlation: -0.020
Pearsons correlation: 0.178
Pearsons correlation: -0.132
Pearsons correlation: -0.118
Pearsons correlation: 0.133
Pearsons correlation: -0.121
Pearsons correlation: -0.072
Pearsons correlation: -0.072
Pearsons correlation: -0.072
Pearsons correlation: 0.133
Pearsons correlation: -0.121
Pearsons correlation: -0.152
Pearsons correlation: -0.049
Pearsons correlation: -0.049
Pearsons correlation: 0.244
Pearsons correlation: -0.064
Pearsons correlation: 0.040
Pearsons correlation: 0.183
Pearsons correlation: 0.040
Pearsons correlation: 0.183
Pearsons correlation: -0.064
Pearsons correlation: 0.149
Pearsons correlation: -0.064
Pearsons correlation: 0.016
Pearsons correlation: -0.205
Pearsons correlation: 0.12

Pearsons correlation: 0.047
Pearsons correlation: 0.068
Pearsons correlation: 0.046
Pearsons correlation: -0.194
Pearsons correlation: -0.047
Pearsons correlation: -0.015
Pearsons correlation: 0.188
Pearsons correlation: -0.015
Pearsons correlation: 0.047
Pearsons correlation: -0.001
Pearsons correlation: -0.047
Pearsons correlation: -0.393
Pearsons correlation: -0.001
Pearsons correlation: -0.079
Pearsons correlation: -0.047
Pearsons correlation: -0.079
Pearsons correlation: -0.015
Pearsons correlation: -0.015
Pearsons correlation: -0.119
Pearsons correlation: -0.119
Pearsons correlation: -0.194
Pearsons correlation: 0.007
Pearsons correlation: -0.197
Pearsons correlation: -0.047
Pearsons correlation: -0.016
Pearsons correlation: -0.095
Pearsons correlation: -0.052
Pearsons correlation: -0.189
Pearsons correlation: 0.055
Pearsons correlation: -0.136
Pearsons correlation: 0.055
Pearsons correlation: 0.007
Pearsons correlation: 0.055
Pearsons correlation: -0.056
Pearsons correlation: -0

Pearsons correlation: -0.104
Pearsons correlation: 0.090
Pearsons correlation: -0.060
Pearsons correlation: 0.023
Pearsons correlation: 0.090
Pearsons correlation: 0.223
Pearsons correlation: -0.104
Pearsons correlation: 0.023
Pearsons correlation: 0.090
Pearsons correlation: 0.090
Pearsons correlation: 0.023
Pearsons correlation: 0.091
Pearsons correlation: 0.091
Pearsons correlation: -0.060
Pearsons correlation: 0.223
Pearsons correlation: -0.053
Pearsons correlation: 0.192
Pearsons correlation: -0.070
Pearsons correlation: -0.176
Pearsons correlation: -0.025
Pearsons correlation: -0.069
Pearsons correlation: 0.141
Pearsons correlation: -0.220
Pearsons correlation: -0.126
Pearsons correlation: 0.140
Pearsons correlation: -0.078
Pearsons correlation: -0.220
Pearsons correlation: 0.073
Pearsons correlation: 0.024
Pearsons correlation: -0.078
Pearsons correlation: 0.073
Pearsons correlation: 0.192
Pearsons correlation: -0.025
Pearsons correlation: 0.014
Pearsons correlation: -0.069
Pear

Pearsons correlation: 0.070
Pearsons correlation: -0.052
Pearsons correlation: -0.004
Pearsons correlation: -0.055
Pearsons correlation: 0.103
Pearsons correlation: -0.016
Pearsons correlation: -0.052
Pearsons correlation: -0.152
Pearsons correlation: -0.141
Pearsons correlation: -0.072
Pearsons correlation: -0.004
Pearsons correlation: 0.019
Pearsons correlation: -0.029
Pearsons correlation: 0.012
Pearsons correlation: 0.012
Pearsons correlation: 0.012
Pearsons correlation: -0.040
Pearsons correlation: 0.007
Pearsons correlation: 0.007
Pearsons correlation: 0.007
Pearsons correlation: -0.007
Pearsons correlation: 0.038
Pearsons correlation: -0.131
Pearsons correlation: -0.098
Pearsons correlation: -0.131
Pearsons correlation: -0.035
Pearsons correlation: -0.035
Pearsons correlation: -0.053
Pearsons correlation: -0.054
Pearsons correlation: -0.111
Pearsons correlation: -0.007
Pearsons correlation: -0.054
Pearsons correlation: -0.110
Pearsons correlation: -0.098
Pearsons correlation: 0.

Pearsons correlation: -0.082
Pearsons correlation: -0.344
Pearsons correlation: -0.052
Pearsons correlation: 0.111
Pearsons correlation: -0.117
Pearsons correlation: -0.041
Pearsons correlation: 0.111
Pearsons correlation: -0.082
Pearsons correlation: -0.002
Pearsons correlation: 0.335
Pearsons correlation: -0.051
Pearsons correlation: -0.041
Pearsons correlation: 0.079
Pearsons correlation: 0.111
Pearsons correlation: 0.079
Pearsons correlation: -0.052
Pearsons correlation: -0.082
Pearsons correlation: -0.067
Pearsons correlation: 0.102
Pearsons correlation: -0.067
Pearsons correlation: -0.041
Pearsons correlation: -0.002
Pearsons correlation: 0.060
Pearsons correlation: -0.085
Pearsons correlation: 0.131
Pearsons correlation: 0.131
Pearsons correlation: 0.131
Pearsons correlation: -0.082
Pearsons correlation: 0.102
Pearsons correlation: 0.137
Pearsons correlation: 0.335
Pearsons correlation: -0.344
Pearsons correlation: 0.072
Pearsons correlation: 0.054
Pearsons correlation: 0.054
Pe

Pearsons correlation: -0.078
Pearsons correlation: 0.081
Pearsons correlation: 0.091
Pearsons correlation: 0.046
Pearsons correlation: -0.001
Pearsons correlation: 0.143
Pearsons correlation: 0.151
Pearsons correlation: 0.078
Pearsons correlation: 0.180
Pearsons correlation: 0.049
Pearsons correlation: 0.078
Pearsons correlation: -0.128
Pearsons correlation: 0.036
Pearsons correlation: -0.039
Pearsons correlation: -0.061
Pearsons correlation: 0.013
Pearsons correlation: 0.041
Pearsons correlation: -0.087
Pearsons correlation: -0.076
Pearsons correlation: 0.005
Pearsons correlation: -0.087
Pearsons correlation: -0.085
Pearsons correlation: -0.070
Pearsons correlation: -0.026
Pearsons correlation: 0.010
Pearsons correlation: -0.089
Pearsons correlation: 0.093
Pearsons correlation: 0.036
Pearsons correlation: 0.041
Pearsons correlation: -0.087
Pearsons correlation: -0.076
Pearsons correlation: -0.108
Pearsons correlation: -0.087
Pearsons correlation: 0.046
Pearsons correlation: -0.061
Pea

Pearsons correlation: 0.078
Pearsons correlation: 0.142
Pearsons correlation: 0.114
Pearsons correlation: 0.106
Pearsons correlation: -0.080
Pearsons correlation: -0.116
Pearsons correlation: 0.110
Pearsons correlation: 0.134
Pearsons correlation: -0.009
Pearsons correlation: 0.078
Pearsons correlation: 0.110
Pearsons correlation: -0.116
Pearsons correlation: 0.052
Pearsons correlation: -0.049
Pearsons correlation: -0.009
Pearsons correlation: -0.058
Pearsons correlation: 0.032
Pearsons correlation: -0.116
Pearsons correlation: -0.080
Pearsons correlation: -0.298
Pearsons correlation: 0.032
Pearsons correlation: 0.024
Pearsons correlation: -0.298
Pearsons correlation: 0.013
Pearsons correlation: 0.024
Pearsons correlation: -0.028
Pearsons correlation: -0.009
Pearsons correlation: -0.137
Pearsons correlation: 0.198
Pearsons correlation: 0.024
Pearsons correlation: 0.106
Pearsons correlation: 0.070
Pearsons correlation: 0.134
Pearsons correlation: 0.052
Pearsons correlation: -0.137
Pears

Pearsons correlation: 0.072
Pearsons correlation: -0.099
Pearsons correlation: 0.056
Pearsons correlation: -0.099
Pearsons correlation: -0.067
Pearsons correlation: -0.062
Pearsons correlation: -0.099
Pearsons correlation: -0.067
Pearsons correlation: 0.072
Pearsons correlation: 0.056
Pearsons correlation: -0.030
Pearsons correlation: -0.007
Pearsons correlation: 0.049
Pearsons correlation: 0.049
Pearsons correlation: -0.023
Pearsons correlation: -0.023
Pearsons correlation: -0.094
Pearsons correlation: -0.152
Pearsons correlation: 0.048
Pearsons correlation: -0.048
Pearsons correlation: -0.030
Pearsons correlation: -0.004
Pearsons correlation: 0.072
Pearsons correlation: 0.072
Pearsons correlation: -0.094
Pearsons correlation: -0.048
Pearsons correlation: -0.004
Pearsons correlation: -0.094
Pearsons correlation: 0.061
Pearsons correlation: 0.061
Pearsons correlation: 0.061
Pearsons correlation: -0.093
Pearsons correlation: -0.235
Pearsons correlation: 0.152
Pearsons correlation: 0.023

Pearsons correlation: -0.031
Pearsons correlation: 0.084
Pearsons correlation: -0.016
Pearsons correlation: 0.009
Pearsons correlation: 0.084
Pearsons correlation: -0.205
Pearsons correlation: -0.205
Pearsons correlation: -0.016
Pearsons correlation: -0.031
Pearsons correlation: -0.205
Pearsons correlation: -0.205
Pearsons correlation: -0.016
Pearsons correlation: 0.084
Pearsons correlation: -0.016
Pearsons correlation: -0.027
Pearsons correlation: 0.009
Pearsons correlation: -0.031
Pearsons correlation: -0.083
Pearsons correlation: 0.088
Pearsons correlation: -0.060
Pearsons correlation: -0.060
Pearsons correlation: 0.088
Pearsons correlation: -0.060
Pearsons correlation: -0.067
Pearsons correlation: -0.062
Pearsons correlation: -0.062
Pearsons correlation: -0.067
Pearsons correlation: -0.164
Pearsons correlation: -0.062
Pearsons correlation: 0.006
Pearsons correlation: 0.082
Pearsons correlation: -0.081
Pearsons correlation: 0.105
Pearsons correlation: 0.105
Pearsons correlation: 0.0

Pearsons correlation: 0.008
Pearsons correlation: -0.178
Pearsons correlation: -0.075
Pearsons correlation: -0.110
Pearsons correlation: -0.075
Pearsons correlation: -0.178
Pearsons correlation: -0.009
Pearsons correlation: -0.047
Pearsons correlation: -0.030
Pearsons correlation: 0.013
Pearsons correlation: 0.059
Pearsons correlation: 0.072
Pearsons correlation: -0.073
Pearsons correlation: -0.079
Pearsons correlation: -0.073
Pearsons correlation: 0.130
Pearsons correlation: 0.059
Pearsons correlation: -0.073
Pearsons correlation: -0.013
Pearsons correlation: 0.059
Pearsons correlation: 0.072
Pearsons correlation: 0.077
Pearsons correlation: -0.073
Pearsons correlation: 0.077
Pearsons correlation: 0.072
Pearsons correlation: 0.040
Pearsons correlation: -0.079
Pearsons correlation: -0.013
Pearsons correlation: -0.060
Pearsons correlation: 0.019
Pearsons correlation: 0.094
Pearsons correlation: 0.019
Pearsons correlation: -0.022
Pearsons correlation: -0.010
Pearsons correlation: -0.063


Pearsons correlation: 0.058
Pearsons correlation: -0.009
Pearsons correlation: 0.102
Pearsons correlation: -0.106
Pearsons correlation: -0.029
Pearsons correlation: 0.058
Pearsons correlation: 0.042
Pearsons correlation: -0.009
Pearsons correlation: 0.058
Pearsons correlation: -0.088
Pearsons correlation: -0.045
Pearsons correlation: -0.103
Pearsons correlation: -0.083
Pearsons correlation: 0.146
Pearsons correlation: -0.103
Pearsons correlation: -0.045
Pearsons correlation: -0.083
Pearsons correlation: -0.103
Pearsons correlation: 0.146
Pearsons correlation: -0.049
Pearsons correlation: 0.171
Pearsons correlation: 0.171
Pearsons correlation: -0.222
Pearsons correlation: 0.197
Pearsons correlation: -0.175
Pearsons correlation: 0.127
Pearsons correlation: -0.071
Pearsons correlation: -0.071
Pearsons correlation: 0.096
Pearsons correlation: -0.292
Pearsons correlation: -0.292
Pearsons correlation: 0.045
Pearsons correlation: 0.045
Pearsons correlation: 0.045
Pearsons correlation: 0.045
P

Pearsons correlation: 0.061
Pearsons correlation: -0.088
Pearsons correlation: 0.106
Pearsons correlation: 0.089
Pearsons correlation: -0.115
Pearsons correlation: 0.086
Pearsons correlation: 0.086
Pearsons correlation: -0.018
Pearsons correlation: -0.051
Pearsons correlation: -0.124
Pearsons correlation: -0.051
Pearsons correlation: 0.025
Pearsons correlation: -0.049
Pearsons correlation: -0.049
Pearsons correlation: -0.024
Pearsons correlation: -0.024
Pearsons correlation: 0.071
Pearsons correlation: -0.046
Pearsons correlation: -0.121
Pearsons correlation: -0.229
Pearsons correlation: -0.000
Pearsons correlation: -0.101
Pearsons correlation: 0.063
Pearsons correlation: 0.108
Pearsons correlation: 0.058
Pearsons correlation: -0.061
Pearsons correlation: -0.025
Pearsons correlation: -0.067
Pearsons correlation: -0.030
Pearsons correlation: -0.067
Pearsons correlation: -0.015
Pearsons correlation: -0.067
Pearsons correlation: 0.108
Pearsons correlation: -0.030
Pearsons correlation: 0.0

Pearsons correlation: 0.067
Pearsons correlation: -0.033
Pearsons correlation: -0.085
Pearsons correlation: 0.018
Pearsons correlation: -0.034
Pearsons correlation: -0.034
Pearsons correlation: 0.018
Pearsons correlation: -0.064
Pearsons correlation: 0.096
Pearsons correlation: -0.040
Pearsons correlation: 0.185
Pearsons correlation: -0.013
Pearsons correlation: -0.040
Pearsons correlation: 0.078
Pearsons correlation: -0.096
Pearsons correlation: 0.217
Pearsons correlation: 0.198
Pearsons correlation: 0.238
Pearsons correlation: 0.112
Pearsons correlation: -0.146
Pearsons correlation: -0.076
Pearsons correlation: 0.203
Pearsons correlation: 0.203
Pearsons correlation: -0.146
Pearsons correlation: -0.035
Pearsons correlation: -0.076
Pearsons correlation: -0.035
Pearsons correlation: -0.146
Pearsons correlation: -0.055
Pearsons correlation: -0.068
Pearsons correlation: 0.076
Pearsons correlation: -0.103
Pearsons correlation: -0.026
Pearsons correlation: -0.026
Pearsons correlation: -0.02

Pearsons correlation: -0.199
Pearsons correlation: -0.058
Pearsons correlation: -0.032
Pearsons correlation: -0.173
Pearsons correlation: -0.032
Pearsons correlation: -0.282
Pearsons correlation: -0.173
Pearsons correlation: -0.058
Pearsons correlation: 0.159
Pearsons correlation: -0.173
Pearsons correlation: 0.159
Pearsons correlation: -0.085
Pearsons correlation: -0.044
Pearsons correlation: -0.027
Pearsons correlation: 0.057
Pearsons correlation: 0.057
Pearsons correlation: 0.001
Pearsons correlation: 0.138
Pearsons correlation: -0.109
Pearsons correlation: -0.109
Pearsons correlation: -0.006
Pearsons correlation: 0.017
Pearsons correlation: -0.006
Pearsons correlation: -0.004
Pearsons correlation: -0.088
Pearsons correlation: -0.004
Pearsons correlation: -0.004
Pearsons correlation: 0.017
Pearsons correlation: -0.004
Pearsons correlation: -0.088
Pearsons correlation: -0.006
Pearsons correlation: -0.006
Pearsons correlation: -0.008
Pearsons correlation: -0.062
Pearsons correlation: 

Pearsons correlation: -0.100
Pearsons correlation: 0.015
Pearsons correlation: -0.100
Pearsons correlation: 0.054
Pearsons correlation: -0.145
Pearsons correlation: -0.078
Pearsons correlation: -0.145
Pearsons correlation: 0.162
Pearsons correlation: 0.162
Pearsons correlation: 0.162
Pearsons correlation: -0.023
Pearsons correlation: -0.109
Pearsons correlation: -0.162
Pearsons correlation: -0.005
Pearsons correlation: 0.024
Pearsons correlation: 0.000
Pearsons correlation: -0.100
Pearsons correlation: -0.100
Pearsons correlation: -0.100
Pearsons correlation: 0.000
Pearsons correlation: 0.016
Pearsons correlation: 0.016
Pearsons correlation: 0.006
Pearsons correlation: -0.086
Pearsons correlation: 0.150
Pearsons correlation: -0.111
Pearsons correlation: -0.111
Pearsons correlation: 0.064
Pearsons correlation: -0.228
Pearsons correlation: 0.012
Pearsons correlation: -0.084
Pearsons correlation: 0.012
Pearsons correlation: -0.042
Pearsons correlation: -0.042
Pearsons correlation: -0.042


Pearsons correlation: -0.163
Pearsons correlation: 0.058
Pearsons correlation: -0.086
Pearsons correlation: -0.085
Pearsons correlation: -0.085
Pearsons correlation: 0.287
Pearsons correlation: -0.085
Pearsons correlation: -0.085
Pearsons correlation: 0.287
Pearsons correlation: -0.024
Pearsons correlation: 0.020
Pearsons correlation: 0.020
Pearsons correlation: -0.086
Pearsons correlation: -0.086
Pearsons correlation: -0.086
Pearsons correlation: -0.046
Pearsons correlation: 0.087
Pearsons correlation: -0.054
Pearsons correlation: -0.054
Pearsons correlation: -0.054
Pearsons correlation: -0.047
Pearsons correlation: 0.053
Pearsons correlation: 0.053
Pearsons correlation: -0.020
Pearsons correlation: -0.047
Pearsons correlation: 0.053
Pearsons correlation: -0.020
Pearsons correlation: 0.053
Pearsons correlation: -0.001
Pearsons correlation: -0.001
Pearsons correlation: 0.057
Pearsons correlation: 0.057
Pearsons correlation: 0.042
Pearsons correlation: -0.002
Pearsons correlation: -0.16

Pearsons correlation: -0.004
Pearsons correlation: -0.004
Pearsons correlation: 0.049
Pearsons correlation: 0.078
Pearsons correlation: -0.046
Pearsons correlation: -0.028
Pearsons correlation: -0.028
Pearsons correlation: -0.049
Pearsons correlation: 0.092
Pearsons correlation: 0.092
Pearsons correlation: -0.049
Pearsons correlation: 0.092
Pearsons correlation: 0.023
Pearsons correlation: -0.045
Pearsons correlation: 0.023
Pearsons correlation: -0.045
Pearsons correlation: 0.123
Pearsons correlation: 0.118
Pearsons correlation: 0.118
Pearsons correlation: 0.118
Pearsons correlation: 0.234
Pearsons correlation: 0.143
Pearsons correlation: 0.201
Pearsons correlation: 0.106
Pearsons correlation: 0.106
Pearsons correlation: 0.038
Pearsons correlation: 0.038
Pearsons correlation: 0.084
Pearsons correlation: -0.142
Pearsons correlation: 0.021
Pearsons correlation: 0.021
Pearsons correlation: 0.153
Pearsons correlation: 0.035
Pearsons correlation: 0.021
Pearsons correlation: 0.196
Pearsons c

Pearsons correlation: 0.199
Pearsons correlation: 0.057
Pearsons correlation: 0.057
Pearsons correlation: -0.009
Pearsons correlation: 0.199
Pearsons correlation: 0.199
Pearsons correlation: 0.199
Pearsons correlation: 0.192
Pearsons correlation: 0.199
Pearsons correlation: 0.099
Pearsons correlation: 0.099
Pearsons correlation: 0.099
Pearsons correlation: 0.141
Pearsons correlation: 0.197
Pearsons correlation: 0.197
Pearsons correlation: 0.197
Pearsons correlation: 0.113
Pearsons correlation: 0.163
Pearsons correlation: 0.264
Pearsons correlation: 0.204
Pearsons correlation: 0.248
Pearsons correlation: 0.229
Pearsons correlation: 0.224
Pearsons correlation: 0.202
Pearsons correlation: 0.202
Pearsons correlation: 0.013
Pearsons correlation: 0.013
Pearsons correlation: 0.238
Pearsons correlation: 0.282
Pearsons correlation: 0.228
Pearsons correlation: 0.228
Pearsons correlation: 0.048
Pearsons correlation: 0.048
Pearsons correlation: 0.222
Pearsons correlation: 0.174
Pearsons correlatio

Pearsons correlation: 0.091
Pearsons correlation: 0.091
Pearsons correlation: -0.195
Pearsons correlation: -0.002
Pearsons correlation: -0.002
Pearsons correlation: -0.155
Pearsons correlation: 0.062
Pearsons correlation: 0.062
Pearsons correlation: 0.062
Pearsons correlation: -0.150
Pearsons correlation: 0.075
Pearsons correlation: 0.075
Pearsons correlation: -0.011
Pearsons correlation: 0.041
Pearsons correlation: -0.106
Pearsons correlation: -0.083
Pearsons correlation: -0.083
Pearsons correlation: -0.086
Pearsons correlation: -0.007
Pearsons correlation: -0.055
Pearsons correlation: -0.021
Pearsons correlation: -0.085
Pearsons correlation: -0.118
Pearsons correlation: 0.022
Pearsons correlation: -0.117
Pearsons correlation: 0.024
Pearsons correlation: 0.021
Pearsons correlation: -0.034
Pearsons correlation: 0.029
Pearsons correlation: -0.038
Pearsons correlation: -0.038
Pearsons correlation: -0.038
Pearsons correlation: 0.029
Pearsons correlation: 0.029
Pearsons correlation: -0.069

In [54]:
print(hightopicsgc)
print("great")
print(lowtopicsgc)


[(0.0008444492101469425, 0.9768658886037848, 119.0, 1), (0.0032522603558717625, 0.9546180648723632, 119.0, 1), (0.11324301753504634, 0.9521978098198819, 113.0, 3), (0.019802681300288196, 0.9803954174536407, 116.0, 2), (0.03682499032268726, 0.9638560657334383, 116.0, 2)]
great
[(1.069550493877081, 0.30314413227186543, 119.0, 1), (7.4139937589030325, 0.0009330932470641333, 116.0, 2), (1.398938234247598, 0.2509921117964006, 116.0, 2), (0.20568708148712, 0.6509949970265321, 119.0, 1), (1.2565250917775728, 0.29153363531988435, 110.0, 4), (0.1594600801811893, 0.6903698497460966, 119.0, 1), (0.35385944422322324, 0.7027287119822376, 116.0, 2), (0.5957490326644688, 0.44173465716871074, 119.0, 1), (2.8424912749161044, 0.0623473923173751, 116.0, 2), (1.9167082043774353, 0.1517199855539531, 116.0, 2), (3.484371558206412, 0.03392101191547016, 116.0, 2), (0.3415934277561153, 0.5600173160909241, 119.0, 1), (3.074575833390992, 0.019206130959471997, 110.0, 4), (0.41771501837324027, 0.7955643727532955, 

In [29]:
print(len(sigtopics))
print(sigtopicsgc)
print(len(sigwords))

4
[(2.918309668514483, 0.037246312369587684, 113.0, 3), (7.430810315746076, 0.007380439163615347, 119.0, 1), (5.969438823154103, 0.016024170904602293, 119.0, 1), (4.462832977567518, 0.036730359426318075, 119.0, 1)]
1838


In [39]:
for i in range(0, 100) :
     print( sigwordsgc[i])

(5.01436945024828, 0.008153181757236354, 116.0, 2)
(5.8249025694126475, 0.0038850294643095386, 116.0, 2)
(5.8249025694126475, 0.0038850294643095386, 116.0, 2)
(5.8249025694126475, 0.0038850294643095386, 116.0, 2)
(4.346276491174002, 0.039228547786845654, 119.0, 1)
(4.651376709574006, 0.033040026482686696, 119.0, 1)
(8.03087099475459, 0.005403821438928613, 119.0, 1)
(5.9444493139373265, 0.016241661961744227, 119.0, 1)
(9.478965235133751, 0.0025808573560517855, 119.0, 1)
(16.30222669419608, 9.59515118290293e-05, 119.0, 1)
(6.016192771095691, 0.01562539550996266, 119.0, 1)
(4.412520843163859, 0.03778733185577222, 119.0, 1)
(7.3599286424396135, 0.007659068913228034, 119.0, 1)
(4.696826965341041, 0.032210575306034266, 119.0, 1)
(5.052858926103237, 0.026427160705386792, 119.0, 1)
(3.458314047602421, 0.0347653312744739, 116.0, 2)
(4.107157797708055, 0.01890634718805877, 116.0, 2)
(16.30222669419608, 9.59515118290293e-05, 119.0, 1)
(4.490931414742298, 0.03615375771694308, 119.0, 1)
(6.01619277

In [34]:
for i in range(0, 100) :
     print( dictionary[sigwords[i]])
        

administration
adviser
iraq
richard
accuses
attention
attracting
bill
california
concerned
corporate
critic
crowd
democrats
demonstrations
green
hard
john
knock
leaders
level
nader
news
notion
november
organization
outside
party
passing
phenomenon
senator
staunch
voted
win
wind
worker
aflcio
appeared
ballot
candidacy
chose
college
commitment
competing
contender
dallas
difficulty
education
enrique
environmental
figure
gathering
gun
hispanics
house
included
intense
judge
litany
luncheon
meetings
minimum
name
national
office
partys
patrick
perot
perots
potential
primary
reform
reformer
republican
republicans
run
search
series
teacher
th
told
tour
update
urged
appeals
approach
brave
business
called
competition
continued
court
deeply
easier
head
hispanic
holding
honor
immigration
keeping


In [32]:
print(dictionary[61])

administration
