Merge branch 'master' of https://github.com/lijuncen/Sentiment-and-St…

…yle-Transfer update
lijuncen · May 3, 2018 · 250d22d · 250d22d
2 parents 1d6d320 + a4e2b74
commit 250d22d
Show file tree

Hide file tree

Showing 55 changed files with 22,128 additions and 6 deletions.
diff --git a/evaluation/human_ratings/ratings-amazon.csv b/evaluation/human_ratings/ratings-amazon.csv
diff --git a/evaluation/human_ratings/ratings-captions.csv b/evaluation/human_ratings/ratings-captions.csv
diff --git a/evaluation/human_ratings/ratings-yelp.csv b/evaluation/human_ratings/ratings-yelp.csv
diff --git a/evaluation/outputs/amazon/sentiment.test.0.fader b/evaluation/outputs/amazon/sentiment.test.0.fader
diff --git a/evaluation/outputs/amazon/sentiment.test.0.human b/evaluation/outputs/amazon/sentiment.test.0.human
diff --git a/evaluation/outputs/amazon/sentiment.test.0.label b/evaluation/outputs/amazon/sentiment.test.0.label
diff --git a/evaluation/outputs/amazon/sentiment.test.0.mit b/evaluation/outputs/amazon/sentiment.test.0.mit
diff --git a/evaluation/outputs/amazon/sentiment.test.0.multi_decoder b/evaluation/outputs/amazon/sentiment.test.0.multi_decoder
diff --git a/evaluation/outputs/amazon/sentiment.test.0.orgin b/evaluation/outputs/amazon/sentiment.test.0.orgin
diff --git a/evaluation/outputs/amazon/sentiment.test.0.retrieval b/evaluation/outputs/amazon/sentiment.test.0.retrieval
diff --git a/evaluation/outputs/amazon/sentiment.test.0.rule_base b/evaluation/outputs/amazon/sentiment.test.0.rule_base
diff --git a/evaluation/outputs/amazon/sentiment.test.1.fader b/evaluation/outputs/amazon/sentiment.test.1.fader
diff --git a/evaluation/outputs/amazon/sentiment.test.1.human b/evaluation/outputs/amazon/sentiment.test.1.human
diff --git a/evaluation/outputs/amazon/sentiment.test.1.label b/evaluation/outputs/amazon/sentiment.test.1.label
diff --git a/evaluation/outputs/amazon/sentiment.test.1.mit b/evaluation/outputs/amazon/sentiment.test.1.mit
diff --git a/evaluation/outputs/amazon/sentiment.test.1.multi_decoder b/evaluation/outputs/amazon/sentiment.test.1.multi_decoder
diff --git a/evaluation/outputs/amazon/sentiment.test.1.orgin b/evaluation/outputs/amazon/sentiment.test.1.orgin
diff --git a/evaluation/outputs/amazon/sentiment.test.1.retrieval b/evaluation/outputs/amazon/sentiment.test.1.retrieval
diff --git a/evaluation/outputs/amazon/sentiment.test.1.rule_base b/evaluation/outputs/amazon/sentiment.test.1.rule_base
diff --git a/evaluation/outputs/captions/sentiment.test.0.fader b/evaluation/outputs/captions/sentiment.test.0.fader
diff --git a/evaluation/outputs/captions/sentiment.test.0.label b/evaluation/outputs/captions/sentiment.test.0.label
diff --git a/evaluation/outputs/captions/sentiment.test.0.mit b/evaluation/outputs/captions/sentiment.test.0.mit
diff --git a/evaluation/outputs/captions/sentiment.test.0.multi_decoder b/evaluation/outputs/captions/sentiment.test.0.multi_decoder
diff --git a/evaluation/outputs/captions/sentiment.test.0.orgin b/evaluation/outputs/captions/sentiment.test.0.orgin
diff --git a/evaluation/outputs/captions/sentiment.test.0.retrieval b/evaluation/outputs/captions/sentiment.test.0.retrieval
diff --git a/evaluation/outputs/captions/sentiment.test.0.rule_base b/evaluation/outputs/captions/sentiment.test.0.rule_base
diff --git a/evaluation/outputs/captions/sentiment.test.0.target b/evaluation/outputs/captions/sentiment.test.0.target
diff --git a/evaluation/outputs/captions/sentiment.test.1.fader b/evaluation/outputs/captions/sentiment.test.1.fader
diff --git a/evaluation/outputs/captions/sentiment.test.1.label b/evaluation/outputs/captions/sentiment.test.1.label
diff --git a/evaluation/outputs/captions/sentiment.test.1.mit b/evaluation/outputs/captions/sentiment.test.1.mit
diff --git a/evaluation/outputs/captions/sentiment.test.1.multi_decoder b/evaluation/outputs/captions/sentiment.test.1.multi_decoder
diff --git a/evaluation/outputs/captions/sentiment.test.1.orgin b/evaluation/outputs/captions/sentiment.test.1.orgin
diff --git a/evaluation/outputs/captions/sentiment.test.1.retrieval b/evaluation/outputs/captions/sentiment.test.1.retrieval
diff --git a/evaluation/outputs/captions/sentiment.test.1.rule_base b/evaluation/outputs/captions/sentiment.test.1.rule_base
diff --git a/evaluation/outputs/captions/sentiment.test.1.target b/evaluation/outputs/captions/sentiment.test.1.target
diff --git a/evaluation/outputs/yelp/sentiment.test.0.fader b/evaluation/outputs/yelp/sentiment.test.0.fader
diff --git a/evaluation/outputs/yelp/sentiment.test.0.human b/evaluation/outputs/yelp/sentiment.test.0.human
diff --git a/evaluation/outputs/yelp/sentiment.test.0.label b/evaluation/outputs/yelp/sentiment.test.0.label
diff --git a/evaluation/outputs/yelp/sentiment.test.0.mit b/evaluation/outputs/yelp/sentiment.test.0.mit
diff --git a/evaluation/outputs/yelp/sentiment.test.0.multi_decoder b/evaluation/outputs/yelp/sentiment.test.0.multi_decoder
diff --git a/evaluation/outputs/yelp/sentiment.test.0.orgin b/evaluation/outputs/yelp/sentiment.test.0.orgin
diff --git a/evaluation/outputs/yelp/sentiment.test.0.retrieval b/evaluation/outputs/yelp/sentiment.test.0.retrieval
diff --git a/evaluation/outputs/yelp/sentiment.test.0.rule_base b/evaluation/outputs/yelp/sentiment.test.0.rule_base
diff --git a/evaluation/outputs/yelp/sentiment.test.1.fader b/evaluation/outputs/yelp/sentiment.test.1.fader
diff --git a/evaluation/outputs/yelp/sentiment.test.1.human b/evaluation/outputs/yelp/sentiment.test.1.human
diff --git a/evaluation/outputs/yelp/sentiment.test.1.label b/evaluation/outputs/yelp/sentiment.test.1.label
diff --git a/evaluation/outputs/yelp/sentiment.test.1.mit b/evaluation/outputs/yelp/sentiment.test.1.mit
diff --git a/evaluation/outputs/yelp/sentiment.test.1.multi_decoder b/evaluation/outputs/yelp/sentiment.test.1.multi_decoder
diff --git a/evaluation/outputs/yelp/sentiment.test.1.orgin b/evaluation/outputs/yelp/sentiment.test.1.orgin
diff --git a/evaluation/outputs/yelp/sentiment.test.1.retrieval b/evaluation/outputs/yelp/sentiment.test.1.retrieval
diff --git a/evaluation/outputs/yelp/sentiment.test.1.rule_base b/evaluation/outputs/yelp/sentiment.test.1.rule_base
diff --git a/evaluation/run_eval.py b/evaluation/run_eval.py
@@ -0,0 +1,109 @@
+"""Generate human evaluation numbers."""
+import argparse
+import collections
+import csv
+import glob
+import json
+import numpy as np
+import os
+import sys
+
+OPTS = None
+
+def parse_args():
+  parser = argparse.ArgumentParser('Insert a description of this script.')
+  parser.add_argument('domain', choices=['yelp', 'caption', 'amazon'])
+  parser.add_argument('pred_dir')
+  parser.add_argument('results_file')
+  parser.add_argument('--num-per-class', '-n', type=int, 
+                      help='Number of examples per class (default=all)')
+  parser.add_argument('--out-file', '-o', help='Print to this file')
+  parser.add_argument('--out-json', '-j', help='Write json data (for Vega)')
+  parser.add_argument('--tsv-file', '-t', help='Write tsv file (for stats)')
+  if len(sys.argv) == 1:
+    parser.print_help()
+    sys.exit(1)
+  return parser.parse_args()
+
+def read_preds():
+  preds = collections.defaultdict(list)
+  for fn in glob.glob(os.path.join(OPTS.pred_dir, 'sentiment.*')):
+    model = os.path.basename(fn).split('.')[3]
+    y_label = os.path.basename(fn).split('.')[2]
+    with open(fn) as f:
+      for i, line in enumerate(f):
+        if OPTS.num_per_class is not None and i == OPTS.num_per_class:
+          break
+        toks = line.strip().split('\t')
+        orig = toks[0].strip().lower()
+        mod = toks[1].strip().lower()
+        if OPTS.domain == 'caption':
+          target = 'humorous' if y_label == '1' else 'romantic'
+        else:
+          target = 'negative' if y_label == '1' else 'positive'
+        preds[model].append((orig, target, mod))
+  return preds
+
+def read_human_scores():
+  human_scores = {}
+  with open(OPTS.results_file) as f:
+    reader = csv.DictReader(f)
+    for row in reader:
+      origs = row['Input.origs'].split('\t')
+      mods = row['Input.mods'].split('\t')
+      target = row['Input.target']
+      responses = row['Answer.responses'].split('\t')
+      for (orig, mod, r) in zip(origs, mods, responses):
+        key = '\t'.join((orig, target, mod))
+        cur_scores = collections.OrderedDict()
+        for x in r.split(' '):
+          k, v = x.split('=')
+          cur_scores[k] = int(v)
+        success = int(all(v > 3 for v in cur_scores.values()))
+        cur_scores['success'] = success
+        human_scores[key] = cur_scores
+  return human_scores
+
+def main():
+  preds = read_preds()
+  human_scores = read_human_scores()
+  eval_obj = {}
+  out_lines = []
+  out_json = []
+  tsv_lines = []
+  for model in preds:
+    eval_obj[model] = collections.defaultdict(list)
+    for (orig, target, mod) in preds[model]:
+      key = '\t'.join((orig, target, mod))
+      cur_scores = human_scores[key]
+      json_ex = dict(cur_scores)  # clone
+      json_ex['model'] = model
+      out_json.append(json_ex)
+      for cat, val in cur_scores.iteritems():
+        eval_obj[model][cat].append(val)
+      score_str = ' '.join('%s=%d' %  (k, v) for k, v in cur_scores.iteritems())
+      out_lines.append('\t'.join((model, orig, target, mod, score_str)))
+    print model
+    for cat in eval_obj[model]:
+      mean = np.mean(eval_obj[model][cat])
+      std_err = np.std(eval_obj[model][cat]) / np.sqrt(len(eval_obj[model][cat]) - 1)
+      print '  %s: %.3f +/- %.3f' % (cat, mean, std_err)
+      tsv_lines.append('\t'.join((OPTS.domain, cat, model, '%.3f' % mean)))
+    print
+  if OPTS.out_file:
+    with open(OPTS.out_file, 'w') as f:
+      for line in out_lines:
+        print >> f, line
+  if OPTS.out_json:
+    with open(OPTS.out_json, 'w') as f:
+      json.dump(out_json, f)
+  if OPTS.tsv_file:
+    with open(OPTS.tsv_file, 'w') as f:
+      for line in tsv_lines:
+        print >> f, line
+
+
+if __name__ == '__main__':
+  OPTS = parse_args()
+  main()
+
diff --git a/src/deep/manage/model/cho_encoder_decoder_DT.py b/src/deep/manage/model/cho_encoder_decoder_DT.py
@@ -11,14 +11,14 @@
 class RnnEncoderDecoder(ModelManager) :
 
     def __init__(self, dataset_folder, dataset_file, dict_file, stopwords_file, word_embedding_file,
-                 train_rate, valid_rate, test_rate, algo_name, charset, mode) :
+                 train_rate, valid_rate, test_rate, algo_name, charset, mode, batch_size) :
         """
         Need to set these attributes.
             1. conf_dict: configuration of the model.
             2. cr: CorpursReader for operate data.
             3. model: the network model.
         """
-        self.conf_dict = {'algo_name': algo_name, 'batch_size': 256,
+        self.conf_dict = {'algo_name': algo_name, 'batch_size': batch_size,
                           'train_valid_test_rate': [train_rate, valid_rate, test_rate],
                           'split_level': 'zi', 'pre_word_embedding': False,
                           'word_embedding_dim': 128, 'n_topics':5000, 'topic_embedding_dim' :256,'max_sentence_word_num': 150,

diff --git a/src/deep/manage/model/cho_encoder_decoder_lm.py b/src/deep/manage/model/cho_encoder_decoder_lm.py
@@ -11,14 +11,14 @@
 class RnnEncoderDecoder(ModelManager) :
 
     def __init__(self, dataset_folder, dataset_file, dict_file, stopwords_file, word_embedding_file,
-                 train_rate, valid_rate, test_rate, algo_name, charset, mode) :
+                 train_rate, valid_rate, test_rate, algo_name, charset, mode, batch_size) :
         """
         Need to set these attributes.
             1. conf_dict: configuration of the model.
             2. cr: CorpursReader for operate data.
             3. model: the network model.
         """
-        self.conf_dict = {'algo_name': algo_name, 'batch_size': 256,
+        self.conf_dict = {'algo_name': algo_name, 'batch_size': batch_size,
                           'train_valid_test_rate': [train_rate, valid_rate, test_rate],
                           'split_level': 'zi', 'pre_word_embedding': False,
                           'word_embedding_dim': 128, 'n_topics':5000, 'topic_embedding_dim' :256,'max_sentence_word_num': 150,

diff --git a/src/main.py b/src/main.py
@@ -54,13 +54,25 @@
         manager = RnnEncoderDecoder(dataset_folder, dataset_file, dict_file, stopwords_file, word_embedding_file,
                                     train_rate, valid_rate, test_rate, algo_name, charset, mode)
     elif algo_name == 'ChoEncoderDecoderDT' :
+        if mode == 'train':
+            batch_size = int(sys.argv[11])
+        elif mode in ('generate_emb', 'generate_b_v_t', 'generate_b_v_t_v'):
+            batch_size = int(sys.argv[12])
+        else:
+            batch_size = 256
         from deep.manage.model.cho_encoder_decoder_DT import RnnEncoderDecoder
         manager = RnnEncoderDecoder(dataset_folder, dataset_file, dict_file, stopwords_file, word_embedding_file,
-                                    train_rate, valid_rate, test_rate, algo_name, charset, mode)
+                                    train_rate, valid_rate, test_rate, algo_name, charset, mode, batch_size)
     elif algo_name == 'ChoEncoderDecoderLm' :
+        if mode == 'train':
+            batch_size = int(sys.argv[11])
+        elif mode in ('generate_emb', 'generate_b_v_t', 'generate_b_v_t_v'):
+            batch_size = int(sys.argv[12])
+        else:
+            batch_size = 256
         from deep.manage.model.cho_encoder_decoder_lm import RnnEncoderDecoder
         manager = RnnEncoderDecoder(dataset_folder, dataset_file, dict_file, stopwords_file, word_embedding_file,
-                                    train_rate, valid_rate, test_rate, algo_name, charset, mode)
+                                    train_rate, valid_rate, test_rate, algo_name, charset, mode, batch_size)
     elif algo_name == 'TegEncoderDecoder' :
         from deep.manage.model.teg_encoder_decoder import RnnEncoderDecoder
         manager = RnnEncoderDecoder(dataset_folder, dataset_file, dict_file, stopwords_file, word_embedding_file,