Skip to content

HTTPS clone URL

Subversion checkout URL

You can clone with HTTPS or Subversion.
Download ZIP
Browse files

posted

  • Loading branch information...
commit 532f30652e1a74869848c4051c5be9efbcd933ae 1 parent 1962c8f
@rjurney authored
Showing 2 changed files with 3 additions and 1 deletion.
  1. +1 −1  cassandra_enron.pig
  2. +2 −0  test_pycassa.py
View
2  cassandra_enron.pig
@@ -69,5 +69,5 @@ per_message_cassandra = foreach (group tfidf_all by message_id) {
store per_message_cassandra into 'cassandra://enron/email_topics' USING CassandraStorage();
/* This will give you some message_id keys to fetch in Cassandra, and some message bodies to compare topics to. */
-samples = limit id_body 10;
+samples = limit just_ids 10;
dump samples;
View
2  test_pycassa.py
@@ -3,3 +3,5 @@
pool = pycassa.ConnectionPool('enron')
cf = pycassa.ColumnFamily(pool, 'email_topics')
+cf.get('<431.1075859137859.JavaMail.evans@thyme>') # Replace me
+# OrderedDict([(u'bankruptcy', u'0.02577520626485872'), (u'end', u'0.018016096034710077'), (u'left', u'0.024021461379613435'), (u'palmer', u'0.017183470843239148'), (u'party', u'0.05155041252971744'), (u'phillip', u'0.018016096034710077'), (u'pl', u'0.018016096034710077'), (u'plove', u'0.02577520626485872'), (u'tonight', u'0.018016096034710077'), (u'your', u'0.017969743348148298')])
Please sign in to comment.
Something went wrong with that request. Please try again.