Showing 5 changed files with 171 additions and 46 deletions.
@@ -0,0 +1,158 @@
import os, sys
import argparse
import time
import itertools
import cPickle
import logging
import random
import string
import pprint

import numpy as np
import tensorflow as tf
import matplotlib.pyplot as plt

import midi_util
import nottingham_util
import sampling
import util
from model import Model, NottinghamModel

def get_config_name(config):
    # Encode the hyperparameters into a filesystem-safe run name ("." -> "p").
    def replace_dot(s): return s.replace(".", "p")
    return "nl_" + str(config.num_layers) + "_hs_" + str(config.hidden_size) + \
        replace_dot("_mc_{}".format(config.melody_coeff)) + \
        replace_dot("_dp_{}".format(config.dropout_prob)) + \
        replace_dot("_idp_{}".format(config.input_dropout_prob)) + \
        replace_dot("_tb_{}".format(config.time_batch_len))

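# For example, with the DefaultConfig values below, get_config_name yields
# "nl_1_hs_100_mc_0p5_dp_0p5_idp_0p9_tb_128".
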
class DefaultConfig(object):
    # model parameters
    num_layers = 1
    hidden_size = 100
    melody_coeff = 0.5
    dropout_prob = 0.5
    input_dropout_prob = 0.9
    cell_type = 'lstm'

    # learning parameters
    max_time_batches = 9
    time_batch_len = 128
    learning_rate = 5e-3
    learning_rate_decay = 0.9
    num_epochs = 200

    # metadata
    dataset = 'softmax'
    model_file = ''

    def __repr__(self):
        return ("Num Layers: {}, Hidden Size: {}, Melody Coeff: {}, "
                "Dropout Prob: {}, Input Dropout Prob: {}, Cell Type: {}, "
                "Time Batch Len: {}, Learning Rate: {}, Decay: {}").format(
            self.num_layers, self.hidden_size, self.melody_coeff,
            self.dropout_prob, self.input_dropout_prob, self.cell_type,
            self.time_batch_len, self.learning_rate, self.learning_rate_decay)

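# Note: config objects are cPickle'd below, so loading a saved .config file
# later requires this class definition to be importable.
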
if __name__ == '__main__':
    np.random.seed()

    parser = argparse.ArgumentParser(description='Music RNN')
    parser.add_argument('--dataset', type=str, default='softmax',
                        choices=['bach', 'nottingham', 'softmax'])
    parser.add_argument('--model_dir', type=str, default='models')
    parser.add_argument('--run_name', type=str, default=time.strftime("%m%d_%H%M"))

    args = parser.parse_args()

    if args.dataset == 'softmax':
        resolution = 480
        time_step = 120
        model_class = NottinghamModel
        # open the pickle in binary mode for portability
        with open(nottingham_util.PICKLE_LOC, 'rb') as f:
            pickle = cPickle.load(f)
            chord_to_idx = pickle['chord_to_idx']

        input_dim = pickle["train"][0].shape[1]
        print 'Finished loading data, input dim: {}'.format(input_dim)
    else:
        raise Exception("Implement other datasets (TBD)")
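    # Note: the pickle written by nottingham_util is assumed to hold "train",
    # "valid", and "test" splits (each a list of [time, input_dim] arrays) in
    # addition to the "chord_to_idx" mapping loaded above.
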
    initializer = tf.random_uniform_initializer(-0.1, 0.1)

    # set up run dir
    run_folder = os.path.join(args.model_dir, args.run_name)
    if os.path.exists(run_folder):
        raise Exception("Run name {} already exists, choose a different one".format(run_folder))
    os.makedirs(run_folder)

    logger = logging.getLogger(__name__)
    logger.setLevel(logging.INFO)
    logger.addHandler(logging.StreamHandler())
    logger.addHandler(logging.FileHandler(os.path.join(run_folder, "training.log")))

    # grid
    grid = {
        "dropout_prob": [1.0],
        "input_dropout_prob": [1.0],
        "melody_coeff": [0.5],
        "num_layers": [3],
        "hidden_size": [200],
        "num_epochs": [200],
        "learning_rate": [5e-3],
        "learning_rate_decay": [0.9],
        "time_batch_len": [128],
    }

    # Generate product of hyperparams
    runs = list(list(itertools.izip(grid, x))
                for x in itertools.product(*grid.itervalues()))
    logger.info("{} runs detected".format(len(runs)))
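    # Each run is a list of (name, value) pairs, e.g. a grid of
    # {"a": [1, 2], "b": [3]} expands (up to dict ordering) to
    # [[("a", 1), ("b", 3)], [("a", 2), ("b", 3)]]. The pairing relies on
    # CPython 2's guarantee that iterating a dict and calling itervalues()
    # visit keys and values in the same order when the dict is unmodified.
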
    for combination in runs:

        config = DefaultConfig()
        config.dataset = args.dataset
        config.model_name = ''.join(
            random.choice(string.ascii_uppercase + string.digits)
            for _ in range(12)) + '.model'
        for attr, value in combination:
            setattr(config, attr, value)

        if config.dataset == 'softmax':
            data = util.batch_data(pickle['train'] + pickle['valid'] + pickle['test'],
                                   config.time_batch_len, config.max_time_batches,
                                   softmax=True)
            config.input_dim = data[0][0][0].shape[2]
        else:
            raise Exception("Implement other datasets")

        logger.info(config)
        config_file_path = os.path.join(run_folder, get_config_name(config) + '.config')
        # write the pickle in binary mode for portability
        with open(config_file_path, 'wb') as f:
            cPickle.dump(config, f)

        with tf.Graph().as_default(), tf.Session() as session:
            with tf.variable_scope("model", reuse=None):
                train_model = model_class(config, training=True)

            saver = tf.train.Saver(tf.all_variables())
            tf.initialize_all_variables().run()
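            # tf.all_variables and tf.initialize_all_variables are the
            # pre-1.0 TensorFlow names; on TF >= 1.0 the equivalents are
            # tf.global_variables and tf.global_variables_initializer.
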
            # training
            train_losses = []
            start_time = time.time()
            for i in range(config.num_epochs):
                loss = util.run_epoch(session, train_model,
                                      data, training=True, testing=False)
                train_losses.append((i, loss))
                # skip epoch 0 so the time-per-epoch average never divides by zero
                if i == 0:
                    continue

                logger.info('Epoch: {}, Train Loss: {}, Time Per Epoch: {}'.format(
                    i, loss, (time.time() - start_time) / i))
                saver.save(session, os.path.join(run_folder, config.model_name))

            # cap the loss axis (2 for softmax, 100 otherwise) so charts are comparable
            axes = plt.gca()
            if config.dataset == 'softmax':
                axes.set_ylim([0, 2])
            else:
                axes.set_ylim([0, 100])
            plt.plot([t[0] for t in train_losses], [t[1] for t in train_losses])
            plt.legend(['Train Loss'])
            chart_file_path = os.path.join(run_folder, get_config_name(config) + '.png')
            plt.savefig(chart_file_path)
            plt.clf()
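
# A minimal sketch of running a sweep, assuming this file is saved as
# train.py (the filename is not shown in this diff):
#
#   python train.py --dataset softmax --model_dir models --run_name test_run
#
# Each grid combination then trains for num_epochs epochs and writes its
# checkpoint (.model), pickled config (.config), and loss curve (.png)
# into models/test_run/.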