nltk fixes #441

Merged 14 commits on Jul 16, 2013
nltk/classify/maxent.py (2 additions, 2 deletions)

@@ -66,7 +66,7 @@
 from collections import defaultdict

 from nltk import compat
-from nltk.data import GzipUnicodeFile
+from nltk.data import gzip_open_unicode
 from nltk.util import OrderedDict
 from nltk.probability import DictionaryProbDist

@@ -1440,7 +1440,7 @@ def train(cls, train_toks, **kwargs):
         weightfile_fd, weightfile_name = \
             tempfile.mkstemp(prefix='nltk-tadm-weights-')

-        trainfile = GzipUnicodeFile(trainfile_name, 'w')
+        trainfile = gzip_open_unicode(trainfile_name, 'w')
         write_tadm_file(train_toks, encoding, trainfile)
         trainfile.close()
nltk/classify/tadm.py (2 additions, 2 deletions)

@@ -48,15 +48,15 @@ def write_tadm_file(train_toks, encoding, stream):
     labels = encoding.labels()
     for featureset, label in train_toks:
         length_line = '%d\n' % len(labels)
-        stream.write(length_line.encode('utf8'))
+        stream.write(length_line)
         for known_label in labels:
             v = encoding.encode(featureset, known_label)
             line = '%d %d %s\n' % (
                 int(label == known_label),
                 len(v),
                 ' '.join('%d %d' % u for u in v)
             )
-            stream.write(line.encode('utf8'))
+            stream.write(line)

 def parse_tadm_weights(paramfile):
     """
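The .encode('utf8') calls above were dropped because write_tadm_file now receives a text-mode stream (opened via gzip_open_unicode), whose write() accepts str rather than bytes. A minimal sketch of the same idea using the stdlib's gzip.open in text mode as a stand-in for nltk's gzip_open_unicode helper (the file name and sample lines are illustrative):

```python
import gzip
import os
import tempfile

# A text-mode gzip stream encodes on write, so callers pass str, not bytes.
path = os.path.join(tempfile.mkdtemp(), 'train.gz')
with gzip.open(path, 'wt', encoding='utf-8') as stream:
    stream.write('%d\n' % 3)                        # no .encode('utf8') needed
    stream.write('%d %d %s\n' % (1, 2, '0 1 1 2'))

# Reading back in text mode decodes transparently as well.
with gzip.open(path, 'rt', encoding='utf-8') as stream:
    lines = stream.read().splitlines()

print(lines)  # ['3', '1 2 0 1 1 2']
```

Pushing the encoding into the stream keeps write_tadm_file working unchanged whether it is handed a gzip-backed file or any other text stream.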
nltk/compat.py (5 additions, 0 deletions)

@@ -61,6 +61,11 @@ def u(s):
     reload = reload
     raw_input = raw_input

+    # Python 2.7 pickle compatibility
+    import UserString
+    import collections
+    UserString.defaultdict = collections.defaultdict
+
Member: Could you please elaborate on this? What is it for?

Author: I re-pickled the data files under Python 3, using code like the following:

    pickle.dump(pickle.load(open(srcpath, 'rb'), encoding='latin-1'),
                open(destpath, 'wb'), protocol=2)

If there's a collections.defaultdict in the pickled data, Python 3.3 pickles it as UserString.defaultdict instead of collections.defaultdict. I'm not sure why, but since Python 2.6 and 2.7 have no defaultdict class in UserString, I've added one as a compatibility fix.
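The compat.py addition above can be sketched as a guarded shim; the try/except is an assumption added here so the snippet also runs on Python 3, where the UserString module no longer exists:

```python
import collections

try:
    import UserString                 # Python 2 only
except ImportError:                   # Python 3 merged it into collections
    UserString = None

if UserString is not None and not hasattr(UserString, 'defaultdict'):
    # Let Python 2's pickle resolve the bogus UserString.defaultdict
    # reference that Python 3.3 writes into protocol-2 pickles.
    UserString.defaultdict = collections.defaultdict

print(UserString is None or UserString.defaultdict is collections.defaultdict)  # True
```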

Member: Hmm, that's quite strange, because Python 3.3 doesn't have a UserString module.

Author: Yes indeed. Try the following:

    pickle.dump(collections.defaultdict(), open('test.pickle', 'wb'), protocol=2)

Then disassemble the pickle file:

    python -m pickletools test.pickle

Member: Cool. I believe it is a Python bug.

    In [6]: dct = collections.defaultdict()

    In [8]: pickle.dumps(dct, protocol=2)
    Out[8]: b'\x80\x02cUserString\ndefaultdict\nq\x00)Rq\x01.'

    In [10]: pickle.dumps(dct, protocol=2, fix_imports=False)
    Out[10]: b'\x80\x02ccollections\ndefaultdict\nq\x00)Rq\x01.'

The cause of the error is here: http://hg.python.org/cpython/file/7272ef213b7c/Lib/_compat_pickle.py#l80

We could try fix_imports=False: it will work as long as we don't use moved stdlib functions directly, e.g. if we import urlencode from compat.py. Another way is to create workarounds in compat.py, as you've done in your pull request. In that case I believe we should also add defaultdict to UserList, because REVERSE_IMPORT_MAPPING relies on dict order, which can vary between runs. But these workarounds are weird; maybe it is better to patch REVERSE_IMPORT_MAPPING directly, which would make the workaround clearer.

But I hope fix_imports=False will work.
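The fix_imports difference discussed above can be checked directly. A minimal sketch; since later Python 3 releases fixed the _compat_pickle mapping, the default may already emit collections, so only the fix_imports=False behavior is asserted here:

```python
import collections
import pickle

dct = collections.defaultdict()

# With fix_imports=False, a protocol-2 pickle keeps the Python 3 module name
# instead of mapping it back to a (possibly wrong) Python 2 location.
data = pickle.dumps(dct, protocol=2, fix_imports=False)
print(b'collections' in data, b'UserString' in data)  # True False

# The object round-trips regardless of the mapping used at dump time.
assert isinstance(pickle.loads(data), collections.defaultdict)
```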

Author: Yup, you're right. Good job on finding the bug.

Member: I was wrong about "it will work as long as we don't use moved stdlib functions directly, e.g. if we import urlencode from compat.py" — please disregard that.

Member: But fix_imports=False could still work, and I think we should try it first.


     from itertools import imap, izip

     try: