diff --git a/digits/config/__init__.py b/digits/config/__init__.py index a41910005..3495ed6c2 100644 --- a/digits/config/__init__.py +++ b/digits/config/__init__.py @@ -21,4 +21,3 @@ def config_value(option): Return the current configuration value for the given option """ return option_list[option] - diff --git a/digits/config/tensorflow.py b/digits/config/tensorflow.py index 98dc3e60e..bbf6f46b7 100644 --- a/digits/config/tensorflow.py +++ b/digits/config/tensorflow.py @@ -3,26 +3,27 @@ import os import platform -from subprocess import Popen,PIPE +from subprocess import Popen, PIPE from . import option_list VARNAME_ENV_TFPY = 'TENSORFLOW_PYTHON' -DEFAULT_PYTHON_EXE = 'python2' # @TODO(tzaman) - use the python executable that was used to launch digits? +DEFAULT_PYTHON_EXE = 'python2' # @TODO(tzaman) - use the python executable that was used to launch digits? if platform.system() == 'Darwin': # DYLD_LIBRARY_PATH and LD_LIBRARY_PATH is sometimes stripped, and the cuda libraries might need it - if not "DYLD_LIBRARY_PATH" in os.environ: + if "DYLD_LIBRARY_PATH" not in os.environ: if "CUDA_HOME" in os.environ: os.environ["DYLD_LIBRARY_PATH"] = str(os.environ["CUDA_HOME"] + '/lib') + def test_tf_import(python_exe): """ Tests if tensorflow can be imported, returns if it went okay and optional error. """ p = Popen([python_exe, "-c", "import tensorflow"], stdout=PIPE, stderr=PIPE) (out, err) = p.communicate() - return p.returncode==0, str(err) + return p.returncode == 0, str(err) if VARNAME_ENV_TFPY in os.environ: tf_python_exe = os.environ[VARNAME_ENV_TFPY] diff --git a/digits/dataset/views.py b/digits/dataset/views.py index 3d40c28cd..cb0a42244 100644 --- a/digits/dataset/views.py +++ b/digits/dataset/views.py @@ -6,6 +6,7 @@ from . import images as dataset_images from . import generic +from digits import extensions from digits.utils.routing import job_from_request, request_wants_json from digits.webapp import scheduler @@ -54,3 +55,31 @@ def summary(): return generic.views.summary(job) else: raise werkzeug.exceptions.BadRequest('Invalid job type') + + +@blueprint.route('/inference-form//', methods=['GET']) +def inference_form(extension_id, job_id): + """ + Returns a rendering of an inference form + """ + inference_form_html = "" + + if extension_id != "all-default": + extension_class = extensions.data.get_extension(extension_id) + if not extension_class: + raise RuntimeError("Unable to find data extension with ID=%s" + % job_id.dataset.extension_id) + job = scheduler.get_job(job_id) + if hasattr(job, 'extension_userdata'): + extension_userdata = job.extension_userdata + else: + extension_userdata = {} + extension_userdata.update({'is_inference_db': True}) + extension = extension_class(**extension_userdata) + + form = extension.get_inference_form() + if form: + template, context = extension.get_inference_template(form) + inference_form_html = flask.render_template_string(template, **context) + + return inference_form_html diff --git a/digits/extensions/view/imageOutput/config_template.html b/digits/extensions/view/imageOutput/config_template.html index e9a2d11ad..57988295c 100644 --- a/digits/extensions/view/imageOutput/config_template.html +++ b/digits/extensions/view/imageOutput/config_template.html @@ -23,3 +23,9 @@ {{ form.pixel_conversion.tooltip }} {{ form.pixel_conversion(class='form-control') }} + +
+<div class="form-group">
+    {{ form.show_input.label }}
+    {{ form.show_input.tooltip }}
+    {{ form.show_input(class='form-control') }}
+</div>
diff --git a/digits/extensions/view/imageOutput/forms.py b/digits/extensions/view/imageOutput/forms.py index 4361d1ea5..c53d99764 100644 --- a/digits/extensions/view/imageOutput/forms.py +++ b/digits/extensions/view/imageOutput/forms.py @@ -45,3 +45,13 @@ class ConfigForm(Form): tooltip='Select method to convert pixel values to the target bit ' 'range' ) + + show_input = utils.forms.SelectField( + 'Show input as image', + choices=[ + ('yes', 'Yes'), + ('no', 'No'), + ], + default='no', + tooltip='Show input as image' + ) diff --git a/digits/extensions/view/imageOutput/view.py b/digits/extensions/view/imageOutput/view.py index 1ea635010..d4ef0ec79 100644 --- a/digits/extensions/view/imageOutput/view.py +++ b/digits/extensions/view/imageOutput/view.py @@ -31,6 +31,7 @@ def __init__(self, dataset, **kwargs): self.channel_order = kwargs['channel_order'].upper() self.data_order = kwargs['data_order'].upper() self.normalize = (kwargs['pixel_conversion'] == 'normalize') + self.show_input = (kwargs['show_input'] == 'yes') @staticmethod def get_config_form(): @@ -70,7 +71,8 @@ def get_view_template(self, data): - context is a dictionary of context variables to use for rendering the form """ - return self.view_template, {'image': digits.utils.image.embed_image_html(data)} + return self.view_template, {'image_input': digits.utils.image.embed_image_html(data[0]), + 'image_output': digits.utils.image.embed_image_html(data[1])} @override def process_data(self, input_id, input_data, output_data): @@ -78,9 +80,19 @@ def process_data(self, input_id, input_data, output_data): Process one inference and return data to visualize """ - data = output_data[output_data.keys()[0]].astype('float32') + if self.show_input: + data_input = input_data.astype('float32') + image_input = self.process_image(self.data_order, data_input) + else: + image_input = None + + data_output = output_data[output_data.keys()[0]].astype('float32') + image_output = self.process_image(self.data_order, data_output) + + return [image_input, image_output] - if self.data_order == 'HWC': + def process_image(self, data_order, data): + if data_order == 'HWC': data = (data.transpose((2, 0, 1))) # assume CHW at this point diff --git a/digits/extensions/view/imageOutput/view_template.html b/digits/extensions/view/imageOutput/view_template.html index 483fe8bb0..de1b12b4a 100644 --- a/digits/extensions/view/imageOutput/view_template.html +++ b/digits/extensions/view/imageOutput/view_template.html @@ -1,3 +1,6 @@ {# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. 
#} - +{% if image_input %} + +{% endif %} + diff --git a/digits/frameworks/__init__.py b/digits/frameworks/__init__.py index 60636bd40..41c09dfb5 100644 --- a/digits/frameworks/__init__.py +++ b/digits/frameworks/__init__.py @@ -3,7 +3,6 @@ from .caffe_framework import CaffeFramework from .framework import Framework -from .tensorflow_framework import TensorflowFramework from .torch_framework import TorchFramework from digits.config import config_value @@ -13,6 +12,10 @@ 'TorchFramework', ] +if config_value('tensorflow')['enabled']: + from .tensorflow_framework import TensorflowFramework + __all__.append('TensorflowFramework') + # # create framework instances # diff --git a/digits/frameworks/caffe_framework.py b/digits/frameworks/caffe_framework.py index 40c0c2040..0b241b367 100644 --- a/digits/frameworks/caffe_framework.py +++ b/digits/frameworks/caffe_framework.py @@ -153,7 +153,6 @@ def can_accumulate_gradients(self): if config_value('caffe')['flavor'] == 'BVLC': return True elif config_value('caffe')['flavor'] == 'NVIDIA': - return (parse_version(config_value('caffe')['version']) - > parse_version('0.14.0-alpha')) + return (parse_version(config_value('caffe')['version']) > parse_version('0.14.0-alpha')) else: raise ValueError('Unknown flavor. Support NVIDIA and BVLC flavors only.') diff --git a/digits/frameworks/tensorflow_framework.py b/digits/frameworks/tensorflow_framework.py index 3885a12b7..3e0273943 100644 --- a/digits/frameworks/tensorflow_framework.py +++ b/digits/frameworks/tensorflow_framework.py @@ -1,16 +1,12 @@ # Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. from __future__ import absolute_import -import numpy as np import os import re import subprocess -import time import tempfile -import flask - -from .errors import Error, NetworkVisualizationError, BadNetworkError +from .errors import NetworkVisualizationError from .framework import Framework import digits from digits import utils @@ -18,6 +14,7 @@ from digits.model.tasks import TensorflowTrainTask from digits.utils import subclass, override, constants + @subclass class TensorflowFramework(Framework): """ @@ -35,7 +32,7 @@ class TensorflowFramework(Framework): SUPPORTS_PYTHON_LAYERS_FILE = False SUPPORTS_TIMELINE_TRACING = True - SUPPORTED_SOLVER_TYPES = ['SGD','ADADELTA','ADAGRAD','ADAGRADDA','MOMENTUM','ADAM','FTRL','RMSPROP'] + SUPPORTED_SOLVER_TYPES = ['SGD', 'ADADELTA', 'ADAGRAD', 'ADAGRADDA', 'MOMENTUM', 'ADAM', 'FTRL', 'RMSPROP'] SUPPORTED_DATA_TRANSFORMATION_TYPES = ['MEAN_SUBTRACTION', 'CROPPING'] SUPPORTED_DATA_AUGMENTATION_TYPES = ['FLIPPING', 'NOISE', 'CONTRAST', 'WHITENING', 'HSV_SHIFTING'] @@ -50,7 +47,7 @@ def create_train_task(self, **kwargs): """ create train task """ - return TensorflowTrainTask(framework_id = self.framework_id, **kwargs) + return TensorflowTrainTask(framework_id=self.framework_id, **kwargs) @override def get_standard_network_desc(self, network): @@ -126,10 +123,10 @@ def get_network_visualization(self, **kwargs): # Another for the HTML _, temp_html_path = tempfile.mkstemp(suffix='.html') - try: # do this in a try..finally clause to make sure we delete the temp file + try: # do this in a try..finally clause to make sure we delete the temp file # build command line args = [config_value('tensorflow')['executable'], - os.path.join(os.path.dirname(digits.__file__),'tools','tensorflow','main.py'), + os.path.join(os.path.dirname(digits.__file__), 'tools', 'tensorflow', 'main.py'), '--network=%s' % os.path.basename(temp_network_path), '--networkDirectory=%s' % 
os.path.dirname(temp_network_path), '--visualizeModelPath=%s' % temp_graphdef_path, @@ -141,7 +138,7 @@ def get_network_visualization(self, **kwargs): if use_mean and use_mean != 'none': mean_file = dataset.get_mean_file() - assert mean_file != None, 'Failed to retrieve mean file.' + assert mean_file is not None, 'Failed to retrieve mean file.' args.append('--subtractMean=%s' % use_mean) args.append('--mean=%s' % dataset.path(mean_file)) @@ -163,15 +160,14 @@ def get_network_visualization(self, **kwargs): env = os.environ.copy() # make only a selected number of GPUs visible. The ID is not important for just the vis - env['CUDA_VISIBLE_DEVICES'] = ",".join([str(i) for i in range(0,int(num_gpus))]) + env['CUDA_VISIBLE_DEVICES'] = ",".join([str(i) for i in range(0, int(num_gpus))]) # execute command p = subprocess.Popen(args, - stdout=subprocess.PIPE, - stderr=subprocess.STDOUT, - close_fds=True, - env=env - ) + stdout=subprocess.PIPE, + stderr=subprocess.STDOUT, + close_fds=True, + env=env) stdout_log = '' while p.poll() is None: @@ -181,7 +177,7 @@ def get_network_visualization(self, **kwargs): stdout_log += line if p.returncode: raise NetworkVisualizationError(stdout_log) - else: # Success! + else: # Success! return repr(str(open(temp_graphdef_path).read())) finally: os.remove(temp_network_path) diff --git a/digits/model/forms.py b/digits/model/forms.py index 7df36652a..86c9d3224 100644 --- a/digits/model/forms.py +++ b/digits/model/forms.py @@ -121,13 +121,14 @@ def validate_py_ext(form, field): tooltip="How many epochs of training between running through one pass of the validation data?" ) - traces_interval = utils.forms.IntegerField('Tracing Interval (in steps)', - validators=[ - validators.NumberRange(min=0) - ], - default=0, - tooltip="Generation of a timeline trace every few steps" - ) + traces_interval = utils.forms.IntegerField( + 'Tracing Interval (in steps)', + validators=[ + validators.NumberRange(min=0) + ], + default=0, + tooltip="Generation of a timeline trace every few steps" + ) random_seed = utils.forms.IntegerField( 'Random seed', @@ -311,10 +312,11 @@ def validate_lr_multistep_values(form, field): ) def validate_custom_network_snapshot(form, field): - if form.method.data == 'custom': - for filename in field.data.strip().split(os.path.pathsep): - if filename and not os.path.exists(filename): - raise validators.ValidationError('File "%s" does not exist' % filename) + pass + #if form.method.data == 'custom': + # for filename in field.data.strip().split(os.path.pathsep): + # if filename and not os.path.exists(filename): + # raise validators.ValidationError('File "%s" does not exist' % filename) # Select one of several GPUs select_gpu = wtforms.RadioField( diff --git a/digits/model/images/classification/job.py b/digits/model/images/classification/job.py index 600f06163..4797e4c7f 100644 --- a/digits/model/images/classification/job.py +++ b/digits/model/images/classification/job.py @@ -28,7 +28,7 @@ def job_type(self): def download_files(self, epoch=-1): task = self.train_task() - snapshot_filename = task.get_snapshot(epoch) + snapshot_filename = task.get_snapshot(epoch, download=True) # get model files model_files = task.get_model_files() diff --git a/digits/model/images/classification/test_views.py b/digits/model/images/classification/test_views.py index 085db789c..1c33a5e83 100644 --- a/digits/model/images/classification/test_views.py +++ b/digits/model/images/classification/test_views.py @@ -3,7 +3,6 @@ import itertools import json -import math import os import shutil 
import tempfile @@ -17,17 +16,13 @@ from StringIO import StringIO from bs4 import BeautifulSoup -from google.protobuf import text_format from digits.config import config_value import digits.dataset.images.classification.test_views -from digits.frameworks import CaffeFramework import digits.test_views from digits import test_utils import digits.webapp -import caffe_pb2 - # May be too short on a slow system TIMEOUT_DATASET = 45 TIMEOUT_MODEL = 60 @@ -98,19 +93,22 @@ class BaseViewsTest(digits.test_views.BaseViewsTest): """ TENSORFLOW_NETWORK = \ -""" -def build_model(params): - ninputs = params['input_shape'][0] * params['input_shape'][1] * params['input_shape'][2] - W = tf.get_variable('W', [ninputs, params['nclasses']], initializer=tf.constant_initializer(0.0)) - b = tf.get_variable('b', [params['nclasses']], initializer=tf.constant_initializer(0.0)), - model = tf.reshape(params['x'], shape=[-1, ninputs]) - model = tf.add(tf.matmul(model, W), b) - def loss(y): - return digits.classification_loss(model, y) - return { - 'model' : model, - 'loss' : loss - } + """ +class UserModel(Tower): + + @model_property + def inference(self): + ninputs = self.input_shape[0] * self.input_shape[1] * self.input_shape[2] + W = tf.get_variable('W', [ninputs, self.nclasses], initializer=tf.constant_initializer(0.0)) + b = tf.get_variable('b', [self.nclasses], initializer=tf.constant_initializer(0.0)), + model = tf.reshape(self.x, shape=[-1, ninputs]) + model = tf.add(tf.matmul(model, W), b) + return model + + @model_property + def loss(self): + loss = digits.classification_loss(self.inference, self.y) + return loss """ @classmethod @@ -142,15 +140,16 @@ def delete_model(cls, job_id): @classmethod def network(cls): - if cls.FRAMEWORK=='torch': + if cls.FRAMEWORK == 'torch': return cls.TORCH_NETWORK - elif cls.FRAMEWORK=='caffe': + elif cls.FRAMEWORK == 'caffe': return cls.CAFFE_NETWORK - elif cls.FRAMEWORK=='tensorflow': + elif cls.FRAMEWORK == 'tensorflow': return cls.TENSORFLOW_NETWORK else: raise Exception('Unknown cls.FRAMEWORK "%s"' % cls.FRAMEWORK) + class BaseViewsTestWithDataset(BaseViewsTest, digits.dataset.images.classification.test_views.BaseViewsTestWithDataset): """ @@ -521,17 +520,17 @@ def test_bad_network_definition(self): """ elif self.FRAMEWORK == 'tensorflow': bogus_net = """ - def build_model(params): - model = BogusCode(0) +class UserModel(Tower): - def loss(y): - return BogusCode(0) + @model_property + def inference(self): + model = BogusCode(0) + return model - return { - 'model' : model, - 'loss' : loss, - } - """ + @model_property + def loss(y): + return BogusCode(0) +""" job_id = self.create_model(json=True, network=bogus_net) assert self.model_wait_completion(job_id) == 'Error', 'job should have failed' job_info = self.job_info_html(job_id=job_id, job_type='models') @@ -840,6 +839,9 @@ def test_inference_while_training(self): # if no GPUs, just test inference during a normal training job # get number of GPUs + if self.FRAMEWORK == 'tensorflow': + raise unittest.SkipTest('Tensorflow CPU inference during training not supported') + gpu_count = 1 if (config_value('gpu_list') and config_value('caffe')['cuda_enabled'] and @@ -1047,7 +1049,7 @@ class BaseTestCreatedCropInNetwork(BaseTestCreated): end """ TENSORFLOW_NETWORK = \ -""" + """ @TODO(tzaman) """ @@ -1309,29 +1311,31 @@ def test_sweep(self): assert not self.model_exists(job_id), 'model exists after delete' -## Tensorflow +# Tensorflow -#class TestTensorflowViews(BaseTestViews, test_utils.TensorflowMixin): -# # @TODO(tzaman) For TF i 
need to pass a proper dataset too - how to do this best? -# pass class TestTensorflowCreation(BaseTestCreation, test_utils.TensorflowMixin): pass -class TestTensorflowCreatedUnencodedShuffle(BaseTestCreated, test_utils.TensorflowMixin): + +class TestTensorflowCreatedWideUnencodedShuffle(BaseTestCreatedWide, test_utils.TensorflowMixin): ENCODING = 'none' SHUFFLE = True + class TestTensorflowCreatedHdf5(BaseTestCreated, test_utils.TensorflowMixin): BACKEND = 'hdf5' + class TestTensorflowCreatedTallHdf5Shuffle(BaseTestCreatedTall, test_utils.TensorflowMixin): BACKEND = 'hdf5' SHUFFLE = True + class TestTensorflowDatasetModelInteractions(BaseTestDatasetModelInteractions, test_utils.TensorflowMixin): pass + class TestTensorflowCreatedDataAug(BaseTestCreatedDataAug, test_utils.TensorflowMixin): AUG_FLIP = 'fliplrud' AUG_NOISE = 0.03 @@ -1343,10 +1347,12 @@ class TestTensorflowCreatedDataAug(BaseTestCreatedDataAug, test_utils.Tensorflow AUG_HSV_V = 0.06 TRAIN_EPOCHS = 2 + class TestTensorflowCreatedWideMultiStepLR(BaseTestCreatedWide, test_utils.TensorflowMixin): LR_POLICY = 'multistep' LR_MULTISTEP_VALUES = '50,75,90' + class TestTensorflowLeNet(BaseTestCreated, test_utils.TensorflowMixin): IMAGE_WIDTH = 28 IMAGE_HEIGHT = 28 @@ -1354,11 +1360,11 @@ class TestTensorflowLeNet(BaseTestCreated, test_utils.TensorflowMixin): # standard lenet model will adjust to color # or grayscale images - TENSORFLOW_NETWORK=open( - os.path.join( - os.path.dirname(digits.__file__), - 'standard-networks', 'tensorflow', 'lenet.py') - ).read() + TENSORFLOW_NETWORK = open(os.path.join(os.path.dirname(digits.__file__), + 'standard-networks', + 'tensorflow', + 'lenet.py')).read() + class TestTensorflowLeNetSlim(BaseTestCreated, test_utils.TensorflowMixin): IMAGE_WIDTH = 28 @@ -1367,8 +1373,7 @@ class TestTensorflowLeNetSlim(BaseTestCreated, test_utils.TensorflowMixin): # standard lenet model will adjust to color # or grayscale images - TENSORFLOW_NETWORK=open( - os.path.join( - os.path.dirname(digits.__file__), - 'standard-networks', 'tensorflow', 'lenet_slim.py') - ).read() + TENSORFLOW_NETWORK = open(os.path.join(os.path.dirname(digits.__file__), + 'standard-networks', + 'tensorflow', + 'lenet_slim.py')).read() diff --git a/digits/model/images/classification/views.py b/digits/model/images/classification/views.py index 709fffe54..f63f00753 100644 --- a/digits/model/images/classification/views.py +++ b/digits/model/images/classification/views.py @@ -190,11 +190,8 @@ def create(): elif epoch == -1: pretrained_model = old_job.train_task().pretrained_model else: - for filename, e in old_job.train_task().snapshots: - if e == epoch: - pretrained_model = filename - break - + # verify snapshot exists + pretrained_model = old_job.train_task().get_snapshot(epoch, download=True) if pretrained_model is None: raise werkzeug.exceptions.BadRequest( "For the job %s, selected pretrained_model for epoch %d is invalid!" @@ -204,6 +201,8 @@ def create(): "Pretrained_model for the selected epoch doesn't exist. " "May be deleted by another user/process. 
" "Please restart the server to load the correct pretrained_model details.") + # get logical path + pretrained_model = old_job.train_task().get_snapshot(epoch) break elif form.method.data == 'pretrained': @@ -270,7 +269,7 @@ def create(): data_aug['scale'] = form.aug_scale.data data_aug['noise'] = form.aug_noise.data data_aug['contrast'] = form.aug_contrast.data - data_aug['whitening']= form.aug_whitening.data + data_aug['whitening'] = form.aug_whitening.data data_aug['hsv_use'] = form.aug_hsv_use.data data_aug['hsv_h'] = form.aug_hsv_h.data data_aug['hsv_s'] = form.aug_hsv_s.data @@ -356,6 +355,7 @@ def timeline_tracing(): return flask.render_template('models/timeline_tracing.html', job=job) + @blueprint.route('/large_graph', methods=['GET']) def large_graph(): """ @@ -706,8 +706,8 @@ def top_n(): def get_datasets(): return [(j.id(), j.name()) for j in sorted( - [j for j in scheduler.jobs.values() if isinstance(j, ImageClassificationDatasetJob) - and (j.status.is_running() or j.status == Status.DONE)], + [j for j in scheduler.jobs.values() if isinstance(j, ImageClassificationDatasetJob) and + (j.status.is_running() or j.status == Status.DONE)], cmp=lambda x, y: cmp(y.id(), x.id()) ) ] diff --git a/digits/model/images/forms.py b/digits/model/images/forms.py index 08e4a6f62..99a4375bf 100644 --- a/digits/model/images/forms.py +++ b/digits/model/images/forms.py @@ -89,10 +89,13 @@ class ImageModelForm(ModelForm): aug_contrast = utils.forms.FloatField( 'Contrast (factor)', default=0, - validators=[ + validators=[ validators.NumberRange(min=0, max=5) ], - tooltip="Per channel, the mean of the channel is computed and then adjusts each component x of each pixel to (x - mean) * contrast_factor + mean. The contrast_factor is picked form a random uniform distribution to yield a value between [1-contrast_factor, 1+contrast_factor]. Suggested value is 0.8." + tooltip="Per channel, the mean of the channel is computed and then adjusts each component x " + "of each pixel to (x - mean) * contrast_factor + mean. The contrast_factor is picked " + "form a random uniform distribution to yield a value between [1-contrast_factor, " + "1+contrast_factor]. Suggested value is 0.8." 
) aug_whitening = utils.forms.BooleanField( diff --git a/digits/model/images/generic/job.py b/digits/model/images/generic/job.py index df03b7bf1..01af6a02c 100644 --- a/digits/model/images/generic/job.py +++ b/digits/model/images/generic/job.py @@ -28,7 +28,7 @@ def job_type(self): def download_files(self, epoch=-1): task = self.train_task() - snapshot_filename = task.get_snapshot(epoch) + snapshot_filename = task.get_snapshot(epoch, download=True) # get model files model_files = task.get_model_files() diff --git a/digits/model/images/generic/test_views.py b/digits/model/images/generic/test_views.py index 6e7748bc5..08f3de324 100644 --- a/digits/model/images/generic/test_views.py +++ b/digits/model/images/generic/test_views.py @@ -27,8 +27,6 @@ import digits.webapp -import numpy as np - # May be too short on a slow system TIMEOUT_DATASET = 45 TIMEOUT_MODEL = 60 @@ -95,19 +93,21 @@ class BaseViewsTest(digits.test_views.BaseViewsTest): TENSORFLOW_NETWORK = \ """ -def build_model(params): - ninputs = params['input_shape'][0] * params['input_shape'][1] * params['input_shape'][2] - W = tf.get_variable('W', [ninputs, 2], initializer=tf.constant_initializer(0.0)) - b = tf.get_variable('b', [2], initializer=tf.constant_initializer(0.0)), - model = tf.reshape(params['x'], shape=[-1, ninputs]) - model = tf.add(tf.matmul(model, W), b) - def loss(y): - y = tf.reshape(y, shape=[-1, 2]) - return digits.mse_loss(model, y) - return { - 'model' : model, - 'loss' : loss - } +class UserModel(Tower): + + @model_property + def inference(self): + ninputs = self.input_shape[0] * self.input_shape[1] * self.input_shape[2] + W = tf.get_variable('W', [ninputs, 2], initializer=tf.constant_initializer(0.0)) + b = tf.get_variable('b', [2], initializer=tf.constant_initializer(0.0)), + model = tf.reshape(self.x, shape=[-1, ninputs]) * 0.004 + model = tf.add(tf.matmul(model, W), b) + return model + + @model_property + def loss(self): + y = tf.reshape(self.y, shape=[-1, 2]) + return digits.mse_loss(self.inference, y) """ @classmethod @@ -135,11 +135,11 @@ def delete_model(cls, job_id): @classmethod def network(cls): - if cls.FRAMEWORK=='torch': + if cls.FRAMEWORK == 'torch': return cls.TORCH_NETWORK - elif cls.FRAMEWORK=='caffe': + elif cls.FRAMEWORK == 'caffe': return cls.CAFFE_NETWORK - elif cls.FRAMEWORK=='tensorflow': + elif cls.FRAMEWORK == 'tensorflow': return cls.TENSORFLOW_NETWORK else: raise ValueError('Unknown framework %s' % cls.FRAMEWORK) @@ -776,6 +776,24 @@ class BaseTestCreatedWithImageProcessingExtension( end """ + TENSORFLOW_NETWORK = \ + """ +class UserModel(Tower): + + @model_property + def inference(self): + scale = tf.get_variable('scale', [1], initializer=tf.constant_initializer(1.0)) + offset = tf.get_variable('offset', [1], initializer=tf.constant_initializer(0.)) + offset = tf.Print(offset,[scale, offset], message='scale offset') + model = self.x + offset + self.model = model + return tf.transpose(model, (0, 3, 2, 1)) # net output expected in NCHW format + + @model_property + def loss(self): + return digits.mse_loss(self.model, self.y) +""" + EXTENSION_ID = "image-processing" VARIABLE_SIZE_DATASET = False NUM_IMAGES = 100 @@ -813,9 +831,17 @@ def test_infer_one_json(self): data = json.loads(rv.data) data_shape = np.array(data['outputs']['output']).shape if not self.VARIABLE_SIZE_DATASET: - assert data_shape == (1, self.CHANNELS, self.IMAGE_WIDTH, self.IMAGE_HEIGHT) + if data_shape != (1, self.CHANNELS, self.IMAGE_WIDTH, self.IMAGE_HEIGHT): + raise ValueError("Shapes differ: got %s expected %s" % 
(repr(data_shape), + repr((1, + self.CHANNELS, + self.IMAGE_WIDTH, + self.IMAGE_HEIGHT)))) def test_infer_one_noresize_json(self): + if self.FRAMEWORK == 'tensorflow' and self.MEAN == 'image': + raise unittest.SkipTest('Mean image subtraction not supported on ' + 'variable-size input with Tensorflow') # create large random image shape = (self.CHANNELS, 10 * self.IMAGE_HEIGHT, 5 * self.IMAGE_WIDTH) x = np.random.randint( @@ -841,7 +867,8 @@ def test_infer_one_noresize_json(self): assert rv.status_code == 200, 'POST failed with %s' % rv.status_code data = json.loads(rv.data) data_shape = np.array(data['outputs']['output']).shape - assert data_shape == (1,) + shape + if data_shape != (1,) + shape: + raise ValueError("Shapes differ: got %s expected %s" % (repr(data_shape), repr((1,) + shape))) def test_infer_db(self): if self.VARIABLE_SIZE_DATASET: @@ -1282,39 +1309,54 @@ class TestAllInOneNetwork(BaseTestCreation, BaseTestCreated, test_utils.CaffeMix } """ -#class TestTensorflowViews(BaseTestViews, test_utils.TensorflowMixin): -# # @TODO(tzaman) For TF i need to pass a proper dataset too - how to do this best? -# pass class TestTensorflowCreation(BaseTestCreation, test_utils.TensorflowMixin): pass + class TestTensorflowCreated(BaseTestCreated, test_utils.TensorflowMixin): pass -class TestTensorflowCreatedWithGradientDataExtension(BaseTestCreatedWithGradientDataExtension, test_utils.TensorflowMixin): + +class TestTensorflowCreatedWithGradientDataExtension(BaseTestCreatedWithGradientDataExtension, + test_utils.TensorflowMixin): pass -class TestTensorflowCreatedWithGradientDataExtensionNoValSet(BaseTestCreatedWithGradientDataExtension, test_utils.TensorflowMixin): + +class TestTensorflowCreatedWithGradientDataExtensionNoValSet(BaseTestCreatedWithGradientDataExtension, + test_utils.TensorflowMixin): @classmethod def setUpClass(cls): super(TestTensorflowCreatedWithGradientDataExtensionNoValSet, cls).setUpClass(val_image_count=0) -class TestTensorflowCreatedWithImageProcessingExtensionMeanImage(BaseTestCreatedWithImageProcessingExtension, test_utils.TensorflowMixin): - MEAN = 'image' -class TestTensorflowCreatedWithImageProcessingExtensionMeanPixel(BaseTestCreatedWithImageProcessingExtension, test_utils.TensorflowMixin): - MEAN = 'pixel' +# class TestTensorflowCreatedWithImageProcessingExtensionMeanImage(BaseTestCreatedWithImageProcessingExtension, +# test_utils.TensorflowMixin): +# MEAN = 'image' +# +# +# class TestTensorflowCreatedWithImageProcessingExtensionMeanPixel(BaseTestCreatedWithImageProcessingExtension, +# test_utils.TensorflowMixin): +# MEAN = 'pixel' +# +# +# class TestTensorflowCreatedWithImageProcessingExtensionMeanNone(BaseTestCreatedWithImageProcessingExtension, +# test_utils.TensorflowMixin): +# MEAN = 'none' -class TestTensorflowCreatedWithImageProcessingExtensionMeanNone(BaseTestCreatedWithImageProcessingExtension, test_utils.TensorflowMixin): - MEAN = 'none' class TestTensorflowCreatedVariableSizeDataset(BaseTestCreatedWithImageProcessingExtension, test_utils.TensorflowMixin): MEAN = 'none' VARIABLE_SIZE_DATASET = True + @classmethod + def setUpClass(cls): + raise unittest.SkipTest('Variable-size dataset not supported in Tensorflow/DIGITS') + + class TestTensorflowCreatedCropInForm(BaseTestCreatedCropInForm, test_utils.TensorflowMixin): pass + class TestTensorflowDatasetModelInteractions(BaseTestDatasetModelInteractions, test_utils.TensorflowMixin): pass diff --git a/digits/model/images/generic/views.py b/digits/model/images/generic/views.py index eff94bba9..913dd0890 100644 
--- a/digits/model/images/generic/views.py +++ b/digits/model/images/generic/views.py @@ -153,11 +153,8 @@ def create(extension_id=None): elif epoch == -1: pretrained_model = old_job.train_task().pretrained_model else: - for filename, e in old_job.train_task().snapshots: - if e == epoch: - pretrained_model = filename - break - + # verify snapshot exists + pretrained_model = old_job.train_task().get_snapshot(epoch, download=True) if pretrained_model is None: raise werkzeug.exceptions.BadRequest( "For the job %s, selected pretrained_model for epoch %d is invalid!" @@ -167,6 +164,8 @@ def create(extension_id=None): "Pretrained_model for the selected epoch doesn't exist. " "May be deleted by another user/process. " "Please restart the server to load the correct pretrained_model details.") + # get logical path + pretrained_model = old_job.train_task().get_snapshot(epoch) break elif form.method.data == 'pretrained': pretrained_job = scheduler.get_job(form.pretrained_networks.data) @@ -229,7 +228,7 @@ def create(extension_id=None): data_aug['scale'] = form.aug_scale.data data_aug['noise'] = form.aug_noise.data data_aug['contrast'] = form.aug_contrast.data - data_aug['whitening']= form.aug_whitening.data + data_aug['whitening'] = form.aug_whitening.data data_aug['hsv_use'] = form.aug_hsv_use.data data_aug['hsv_h'] = form.aug_hsv_h.data data_aug['hsv_s'] = form.aug_hsv_s.data @@ -295,31 +294,18 @@ def show(job, related_jobs=None): """ Called from digits.model.views.models_show() """ + data_extensions = get_data_extensions() view_extensions = get_view_extensions() - inference_form_html = None - if isinstance(job.dataset, GenericDatasetJob): - extension_class = extensions.data.get_extension(job.dataset.extension_id) - if not extension_class: - raise RuntimeError("Unable to find data extension with ID=%s" - % job.dataset.extension_id) - extension_userdata = job.dataset.extension_userdata - extension_userdata.update({'is_inference_db': True}) - extension = extension_class(**extension_userdata) - - form = extension.get_inference_form() - if form: - template, context = extension.get_inference_template(form) - inference_form_html = flask.render_template_string(template, **context) - return flask.render_template( 'models/images/generic/show.html', job=job, + data_extensions=data_extensions, view_extensions=view_extensions, related_jobs=related_jobs, - inference_form_html=inference_form_html, ) + @blueprint.route('/timeline_tracing', methods=['GET']) def timeline_tracing(): """ @@ -329,6 +315,7 @@ def timeline_tracing(): return flask.render_template('models/timeline_tracing.html', job=job) + @blueprint.route('/large_graph', methods=['GET']) def large_graph(): """ @@ -444,8 +431,13 @@ def infer_extension(): inference_db_job = None try: + if 'data_extension_id' in flask.request.form: + data_extension_id = flask.request.form['data_extension_id'] + else: + data_extension_id = model_job.dataset.extension_id + # create an inference database - inference_db_job = create_inference_db(model_job) + inference_db_job = create_inference_db(model_job, data_extension_id) db_path = inference_db_job.get_feature_db_path(constants.TEST_DB) # create database creation job @@ -726,10 +718,13 @@ def infer_many(): ), status_code -def create_inference_db(model_job): +def create_inference_db(model_job, data_extension_id): # create instance of extension class - extension_class = extensions.data.get_extension(model_job.dataset.extension_id) - extension_userdata = model_job.dataset.extension_userdata + extension_class = 
extensions.data.get_extension(data_extension_id) + if hasattr(model_job.dataset, 'extension_userdata'): + extension_userdata = model_job.dataset.extension_userdata + else: + extension_userdata = {} extension_userdata.update({'is_inference_db': True}) extension = extension_class(**extension_userdata) @@ -753,7 +748,7 @@ def create_inference_db(model_job): batch_size=1, num_threads=1, force_same_shape=0, - extension_id=model_job.dataset.extension_id, + extension_id=data_extension_id, extension_userdata=extension.get_user_data(), ) @@ -777,13 +772,12 @@ def create_inference_db(model_job): def get_datasets(extension_id): if extension_id: jobs = [j for j in scheduler.jobs.values() - if isinstance(j, GenericDatasetJob) - and j.extension_id == extension_id - and (j.status.is_running() or j.status == Status.DONE)] + if isinstance(j, GenericDatasetJob) and + j.extension_id == extension_id and (j.status.is_running() or j.status == Status.DONE)] else: jobs = [j for j in scheduler.jobs.values() - if (isinstance(j, GenericImageDatasetJob) or isinstance(j, GenericDatasetJob)) - and (j.status.is_running() or j.status == Status.DONE)] + if (isinstance(j, GenericImageDatasetJob) or isinstance(j, GenericDatasetJob)) and + (j.status.is_running() or j.status == Status.DONE)] return [(j.id(), j.name()) for j in sorted(jobs, cmp=lambda x, y: cmp(y.id(), x.id()))] @@ -873,6 +867,17 @@ def get_pretrained_networks_fulldetails(): ] +def get_data_extensions(): + """ + return all enabled data extensions + """ + data_extensions = {"all-default": "Default"} + all_extensions = extensions.data.get_extensions() + for extension in all_extensions: + data_extensions[extension.get_id()] = extension.get_title() + return data_extensions + + def get_view_extensions(): """ return all enabled view extensions diff --git a/digits/model/tasks/__init__.py b/digits/model/tasks/__init__.py index 15746527a..505430044 100644 --- a/digits/model/tasks/__init__.py +++ b/digits/model/tasks/__init__.py @@ -2,7 +2,6 @@ from __future__ import absolute_import from .caffe_train import CaffeTrainTask -from .tensorflow_train import TensorflowTrainTask from .torch_train import TorchTrainTask from .train import TrainTask @@ -11,3 +10,9 @@ 'TorchTrainTask', 'TrainTask', ] + +from digits.config import config_value # noqa + +if config_value('tensorflow')['enabled']: + from .tensorflow_train import TensorflowTrainTask # noqa + __all__.append('TensorflowTrainTask') diff --git a/digits/model/tasks/caffe_train.py b/digits/model/tasks/caffe_train.py index 981c6a805..c1001a694 100644 --- a/digits/model/tasks/caffe_train.py +++ b/digits/model/tasks/caffe_train.py @@ -934,8 +934,7 @@ def task_arguments(self, resources, env): args.append('--gpu=%s' % identifiers[0]) elif len(identifiers) > 1: if config_value('caffe')['flavor'] == 'NVIDIA': - if (utils.parse_version(config_value('caffe')['version']) - < utils.parse_version('0.14.0-alpha')): + if (utils.parse_version(config_value('caffe')['version']) < utils.parse_version('0.14.0-alpha')): # Prior to version 0.14, NVcaffe used the --gpus switch args.append('--gpus=%s' % ','.join(identifiers)) else: diff --git a/digits/model/tasks/tensorflow_train.py b/digits/model/tasks/tensorflow_train.py index 5bfd28124..7abe5eeee 100644 --- a/digits/model/tasks/tensorflow_train.py +++ b/digits/model/tasks/tensorflow_train.py @@ -11,16 +11,13 @@ import h5py import numpy as np -import PIL.Image from .train import TrainTask import digits from digits import utils from digits.config import config_value from digits.utils import 
subclass, override, constants - -# Must import after importing digit.config -import caffe_pb2 +import tensorflow as tf # NOTE: Increment this everytime the pickled object changes PICKLE_VERSION = 1 @@ -30,6 +27,19 @@ TENSORFLOW_SNAPSHOT_PREFIX = 'snapshot' TIMELINE_PREFIX = 'timeline' + +def _int64_feature(value): + return tf.train.Feature(int64_list=tf.train.Int64List(value=[value])) + + +def _bytes_feature(value): + return tf.train.Feature(bytes_list=tf.train.BytesList(value=[value])) + + +def _float_array_feature(value): + return tf.train.Feature(float_list=tf.train.FloatList(value=value)) + + def subprocess_visible_devices(gpus): """ Calculates CUDA_VISIBLE_DEVICES for a subprocess @@ -50,6 +60,7 @@ def subprocess_visible_devices(gpus): real_gpus.append(map_visible_to_real[visible_gpu]) return ','.join(str(g) for g in real_gpus) + @subclass class TensorflowTrainTask(TrainTask): """ @@ -111,8 +122,7 @@ def __setstate__(self, state): self.image_mean = None self.classifier = None - ### Task overrides - + # Task overrides @override def name(self): return 'Train Tensorflow Model' @@ -129,11 +139,36 @@ def before_run(self): self.temp_unrecognized_output = [] return True + @override + def get_snapshot(self, epoch=-1, download=False): + """ + return snapshot file for specified epoch + """ + snapshot_filename = None + + if len(self.snapshots) == 0: + return "no snapshots" + + if epoch == -1 or not epoch: + epoch = self.snapshots[-1][1] + snapshot_filename = self.snapshots[-1][0] + else: + for f, e in self.snapshots: + if e == epoch: + snapshot_filename = f + break + if not snapshot_filename: + raise ValueError('Invalid epoch') + if download: + snapshot_filename = snapshot_filename + ".data-00000-of-00001" + + return snapshot_filename + @override def task_arguments(self, resources, env): - + args = [config_value('tensorflow')['executable'], - os.path.join(os.path.dirname(os.path.abspath(digits.__file__)),'tools', 'tensorflow', 'main.py'), + os.path.join(os.path.dirname(os.path.abspath(digits.__file__)), 'tools', 'tensorflow', 'main.py'), '--network=%s' % self.model_file, '--epoch=%d' % int(self.train_epochs), '--networkDirectory=%s' % self.job_dir, @@ -149,7 +184,7 @@ def task_arguments(self, resources, env): if self.use_mean != 'none': mean_file = self.dataset.get_mean_file() - assert mean_file != None, 'Failed to retrieve mean file.' + assert mean_file is not None, 'Failed to retrieve mean file.' args.append('--mean=%s' % self.dataset.path(mean_file)) if hasattr(self.dataset, 'labels_file'): @@ -168,7 +203,7 @@ def task_arguments(self, resources, env): if val_label_db_path: args.append('--validation_labels=%s' % val_label_db_path) - #learning rate policy input parameters + # learning rate policy input parameters if self.lr_policy['policy'] == 'fixed': pass elif self.lr_policy['policy'] == 'step': @@ -226,7 +261,7 @@ def task_arguments(self, resources, env): if self.val_interval is not None: args.append('--validation_interval=%d' % self.val_interval) - #if self.traces_interval is not None: + # if self.traces_interval is not None: args.append('--log_runtime_stats_per_step=%d' % self.traces_interval) if 'gpus' in resources: @@ -300,10 +335,10 @@ def process_output(self, line): pattern_key_val = re.compile(r'([\w\-_]+)\ =\ ([^,^\ ]+)') # Now iterate through the keys and values on this line dynamically for (key, value) in re.findall(pattern_key_val, kvlist): - assert not('Inf' in value or 'NaN' in value), 'Network reported %s for %s.' 
% (value, key) + assert not('Inf' in value or 'NaN' in value), 'Network reported %s for %s.' % (value, key) value = float(value) if key == 'lr': - key = 'learning_rate' # Convert to special DIGITS key for learning rate + key = 'learning_rate' # Convert to special DIGITS key for learning rate if stage == 'Training': self.save_train_output(key, key, value) elif stage == 'Validation': @@ -367,11 +402,11 @@ def preprocess_output_tensorflow(line): level = 'warning' elif level == 'ERROR': level = 'error' - elif level == 'FAIL': #FAIL + elif level == 'FAIL': # FAIL level = 'critical' return (timestamp, level, message) else: - #self.logger.warning('Unrecognized task output "%s"' % line) + # self.logger.warning('Unrecognized task output "%s"' % line) return (None, None, None) def send_snapshot_update(self): @@ -381,17 +416,13 @@ def send_snapshot_update(self): # TODO: move to TrainTask from digits.webapp import socketio - socketio.emit('task update', - { - 'task': self.html_id(), - 'update': 'snapshots', - 'data': self.snapshot_list(), - }, - namespace='/jobs', - room=self.job_id, - ) - - ### TrainTask overrides + socketio.emit('task update', {'task': self.html_id(), + 'update': 'snapshots', + 'data': self.snapshot_list()}, + namespace='/jobs', + room=self.job_id) + + # TrainTask overrides @override def after_run(self): if self.temp_unrecognized_output: @@ -414,7 +445,7 @@ def after_runtime_error(self): if message: lines.append(message) # return the last 20 lines - traceback = '\n\nLast output:\n' + '\n'.join(lines[len(lines)-20:]) if len(lines)>0 else '' + traceback = '\n\nLast output:\n' + '\n'.join(lines[len(lines)-20:]) if len(lines) > 0 else '' if self.traceback: self.traceback = self.traceback + traceback else: @@ -431,7 +462,7 @@ def detect_timeline_traces(self): match = re.match(r'%s_(.*)\.json$' % TIMELINE_PREFIX, filename) if match: step = int(match.group(1)) - timeline_traces.append((os.path.join(self.job_dir, filename), step )) + timeline_traces.append((os.path.join(self.job_dir, filename), step)) self.timeline_traces = sorted(timeline_traces, key=lambda tup: tup[1]) return len(self.timeline_traces) > 0 @@ -441,18 +472,16 @@ def detect_snapshots(self): snapshots = [] for filename in os.listdir(self.job_dir): # find models - match = re.match(r'%s_(\d+)\.?(\d*)\.ckpt$' % self.snapshot_prefix, filename) + match = re.match(r'%s_(\d+)\.?(\d*)\.ckpt\.index$' % self.snapshot_prefix, filename) if match: epoch = 0 + # remove '.index' suffix from filename + filename = filename[:-6] if match.group(2) == '': epoch = int(match.group(1)) else: epoch = float(match.group(1) + '.' 
+ match.group(2)) - snapshots.append( ( - os.path.join(self.job_dir, filename), - epoch - ) - ) + snapshots.append((os.path.join(self.job_dir, filename), epoch)) self.snapshots = sorted(snapshots, key=lambda tup: tup[1]) return len(self.snapshots) > 0 @@ -489,20 +518,27 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): snapshot_epoch -- which snapshot to use layers -- which layer activation[s] and weight[s] to visualize """ - temp_image_handle, temp_image_path = tempfile.mkstemp(suffix='.png') + temp_image_handle, temp_image_path = tempfile.mkstemp(suffix='.tfrecords') os.close(temp_image_handle) - image = PIL.Image.fromarray(image) - try: - image.save(temp_image_path, format='png') - except KeyError: - error_message = 'Unable to save file to "%s"' % temp_image_path - self.logger.error(error_message) - raise digits.inference.errors.InferenceError(error_message) + if image.ndim < 3: + image = image[..., np.newaxis] + writer = tf.python_io.TFRecordWriter(temp_image_path) + + image = image.astype('float') + record = tf.train.Example(features=tf.train.Features(feature={ + 'height': _int64_feature(image.shape[0]), + 'width': _int64_feature(image.shape[1]), + 'depth': _int64_feature(image.shape[2]), + 'image_raw': _float_array_feature(image.flatten()), + 'label': _int64_feature(0), + 'encoding': _int64_feature(0)})) + writer.write(record.SerializeToString()) + writer.close() file_to_load = self.get_snapshot(snapshot_epoch) args = [config_value('tensorflow')['executable'], - os.path.join(os.path.dirname(os.path.abspath(digits.__file__)),'tools', 'tensorflow', 'main.py'), + os.path.join(os.path.dirname(os.path.abspath(digits.__file__)), 'tools', 'tensorflow', 'main.py'), '--inference_db=%s' % temp_image_path, '--network=%s' % self.model_file, '--networkDirectory=%s' % self.job_dir, @@ -515,7 +551,7 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): if self.use_mean != 'none': mean_file = self.dataset.get_mean_file() - assert mean_file != None, 'Failed to retrieve mean file.' + assert mean_file is not None, 'Failed to retrieve mean file.' args.append('--mean=%s' % self.dataset.path(mean_file)) if self.use_mean == 'pixel': @@ -528,7 +564,7 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): if self.crop_size: args.append('--croplen=%d' % self.crop_size) - if layers=='all': + if layers == 'all': args.append('--visualize_inf=1') args.append('--save=%s' % self.job_dir) @@ -547,25 +583,24 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): # make only the selected GPU visible env['CUDA_VISIBLE_DEVICES'] = subprocess_visible_devices([gpu]) - p = subprocess.Popen(args, - stdout=subprocess.PIPE, - stderr=subprocess.STDOUT, - cwd=self.job_dir, - close_fds=True, - env=env, - ) + stdout=subprocess.PIPE, + stderr=subprocess.STDOUT, + cwd=self.job_dir, + close_fds=True, + env=env) try: while p.poll() is None: for line in utils.nonblocking_readlines(p.stdout): if self.aborted.is_set(): p.terminate() - raise digits.inference.errors.InferenceError('%s classify one task got aborted. error code - %d' % (self.get_framework_id(), p.returncode)) + raise digits.inference.errors.InferenceError('%s classify one task got aborted. 
error code - %d' % (self.get_framework_id(), p.returncode)) # noqa if line is not None and len(line) > 1: if not self.process_test_output(line, predictions, 'one'): - self.logger.warning('%s classify one task unrecognized input: %s' % (self.get_framework_id(), line.strip())) + self.logger.warning('%s classify one task unrecognized input: %s' % ( + self.get_framework_id(), line.strip())) unrecognized_output.append(line) else: time.sleep(0.05) @@ -576,7 +611,8 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): if type(e) == digits.inference.errors.InferenceError: error_message = e.__str__() else: - error_message = '%s classify one task failed with error code %d \n %s' % (self.get_framework_id(), p.returncode, str(e)) + error_message = '%s classify one task failed with error code %d \n %s' % ( + self.get_framework_id(), p.returncode, str(e)) self.logger.error(error_message) if unrecognized_output: unrecognized_output = '\n'.join(unrecognized_output) @@ -600,7 +636,7 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): visualizations = [] - if layers=='all' and self.visualization_file: + if layers == 'all' and self.visualization_file: vis_db = h5py.File(self.visualization_file, 'r') # the HDF5 database is organized as follows: # @@ -611,68 +647,68 @@ def infer_one_image(self, image, snapshot_epoch=None, layers=None, gpu=None): # | |- activations # | |- weights # |- 2 - for layer_id,layer in vis_db['layers'].items(): + for layer_id, layer in vis_db['layers'].items(): op_name = layer.attrs['op'] var_name = layer.attrs['var'] - layer_desc = "%s\n%s" % (op_name,var_name) + layer_desc = "%s\n%s" % (op_name, var_name) idx = int(layer_id) # activations (tf: operation outputs) if 'activations' in layer: data = np.array(layer['activations'][...]) - if len(data.shape)>1 and data.shape[0]==1: + if len(data.shape) > 1 and data.shape[0] == 1: # skip batch dimension data = data[0] if len(data.shape) == 3: data = data.transpose(2, 0, 1) elif len(data.shape) == 4: - data = data.transpose(3,2,0,1) + data = data.transpose(3, 2, 0, 1) vis = utils.image.get_layer_vis_square(data) mean, std, hist = self.get_layer_statistics(data) visualizations.append( - { - 'id': idx, - 'name': layer_desc, - 'vis_type': 'Activations', - 'vis': vis, - 'data_stats': { - 'shape': data.shape, - 'mean': mean, - 'stddev': std, - 'histogram': hist, - } - } - ) + { + 'id': idx, + 'name': layer_desc, + 'vis_type': 'Activations', + 'vis': vis, + 'data_stats': { + 'shape': data.shape, + 'mean': mean, + 'stddev': std, + 'histogram': hist, + } + } + ) # weights (tf: variables) if 'weights' in layer: data = np.array(layer['weights'][...]) if len(data.shape) == 3: data = data.transpose(2, 0, 1) elif len(data.shape) == 4: - data = data.transpose(3,2,0,1) + data = data.transpose(3, 2, 0, 1) if 'MatMul' in layer_desc: - vis = None # too many layers to display? + vis = None # too many layers to display? 
else: vis = utils.image.get_layer_vis_square(data) mean, std, hist = self.get_layer_statistics(data) parameter_count = reduce(operator.mul, data.shape, 1) visualizations.append( - { - 'id': idx, - 'name': layer_desc, - 'vis_type': 'Weights', - 'vis': vis, - 'param_count': parameter_count, - 'data_stats': { - 'shape': data.shape, - 'mean': mean, - 'stddev': std, - 'histogram': hist, - } - } - ) + { + 'id': idx, + 'name': layer_desc, + 'vis_type': 'Weights', + 'vis': vis, + 'param_count': parameter_count, + 'data_stats': { + 'shape': data.shape, + 'mean': mean, + 'stddev': std, + 'histogram': hist, + } + } + ) # sort by layer ID - visualizations = sorted(visualizations,key=lambda x:x['id']) - return (predictions,visualizations) + visualizations = sorted(visualizations, key=lambda x: x['id']) + return (predictions, visualizations) def get_layer_statistics(self, data): """ @@ -688,12 +724,11 @@ def get_layer_statistics(self, data): std = np.std(data) y, x = np.histogram(data, bins=20) y = list(y) - ticks = x[[0,len(x)/2,-1]] + ticks = x[[0, len(x)/2, -1]] x = [(x[i]+x[i+1])/2.0 for i in xrange(len(x)-1)] ticks = list(ticks) return (mean, std, [y, x, ticks]) - def after_test_run(self, temp_image_path): try: os.remove(temp_image_path) @@ -714,11 +749,11 @@ def process_test_output(self, line, predictions, test_category): float_exp = '([-]?inf|nan|[-+]?[0-9]*\.?[0-9]+(e[-+]?[0-9]+)?)' # format of output while testing single image - match = re.match(r'For image \d+, predicted class \d+: \d+ \((.*?)\) %s' % (float_exp), message) + match = re.match(r'For image \d+, predicted class \d+: \d+ \((.*?)\) %s' % (float_exp), message) if match: label = match.group(1) confidence = match.group(2) - assert not('inf' in confidence or 'nan' in confidence), 'Network reported %s for confidence value. Please check image and network' % label + assert not('inf' in confidence or 'nan' in confidence), 'Network reported %s for confidence value. Please check image and network' % label # noqa confidence = float(confidence) predictions.append((label, confidence)) return True @@ -747,9 +782,10 @@ def process_test_output(self, line, predictions, test_category): return True if level in ['error', 'critical']: - raise digits.inference.errors.InferenceError('%s classify %s task failed with error message - %s' % (self.get_framework_id(), test_category, message)) + raise digits.inference.errors.InferenceError('%s classify %s task failed with error message - %s' % ( + self.get_framework_id(), test_category, message)) - return False # control should never reach this line. + return False # control should never reach this line. 
@override def infer_many(self, data, snapshot_epoch=None, gpu=None, resize=True): @@ -776,30 +812,34 @@ def infer_many_images(self, images, snapshot_epoch=None, gpu=None): # create a temporary folder to store images and a temporary file # to store a list of paths to the images - temp_dir_path = tempfile.mkdtemp() - try: # this try...finally clause is used to clean up the temp directory in any case - temp_imglist_handle, temp_imglist_path = tempfile.mkstemp(dir=temp_dir_path, suffix='.txt') - for image in images: - temp_image_handle, temp_image_path = tempfile.mkstemp( - dir=temp_dir_path, suffix='.png') - image = PIL.Image.fromarray(image) - try: - image.save(temp_image_path, format='png') - except KeyError: - error_message = 'Unable to save file to "%s"' % temp_image_path - self.logger.error(error_message) - raise digits.inference.errors.InferenceError(error_message) - os.write(temp_imglist_handle, "%s\n" % temp_image_path) - os.close(temp_image_handle) - os.close(temp_imglist_handle) + temp_dir_path = tempfile.mkdtemp(suffix='.tfrecords') + try: # this try...finally clause is used to clean up the temp directory in any case + with open(os.path.join(temp_dir_path, 'list.txt'), 'w') as imglist_file: + for image in images: + if image.ndim < 3: + image = image[..., np.newaxis] + image = image.astype('float') + temp_image_handle, temp_image_path = tempfile.mkstemp(dir=temp_dir_path, suffix='.tfrecords') + writer = tf.python_io.TFRecordWriter(temp_image_path) + record = tf.train.Example(features=tf.train.Features(feature={ + 'height': _int64_feature(image.shape[0]), + 'width': _int64_feature(image.shape[1]), + 'depth': _int64_feature(image.shape[2]), + 'image_raw': _float_array_feature(image.flatten()), + 'label': _int64_feature(0), + 'encoding': _int64_feature(0)})) + writer.write(record.SerializeToString()) + writer.close() + imglist_file.write("%s\n" % temp_image_path) + os.close(temp_image_handle) file_to_load = self.get_snapshot(snapshot_epoch) args = [config_value('tensorflow')['executable'], - os.path.join(os.path.dirname(os.path.abspath(digits.__file__)),'tools', 'tensorflow', 'main.py'), + os.path.join(os.path.dirname(os.path.abspath(digits.__file__)), 'tools', 'tensorflow', 'main.py'), '--testMany=1', - '--allPredictions=1', #all predictions are grabbed and formatted as required by DIGITS - '--inference_db=%s' % str(temp_imglist_path), + '--allPredictions=1', # all predictions are grabbed and formatted as required by DIGITS + '--inference_db=%s' % str(temp_dir_path), '--network=%s' % self.model_file, '--networkDirectory=%s' % self.job_dir, '--weights=%s' % file_to_load, @@ -810,7 +850,7 @@ def infer_many_images(self, images, snapshot_epoch=None, gpu=None): if self.use_mean != 'none': mean_file = self.dataset.get_mean_file() - assert mean_file != None, 'Failed to retrieve mean file.' + assert mean_file is not None, 'Failed to retrieve mean file.' 
args.append('--mean=%s' % self.dataset.path(mean_file)) if self.use_mean == 'pixel': @@ -835,23 +875,25 @@ def infer_many_images(self, images, snapshot_epoch=None, gpu=None): unrecognized_output = [] predictions = [] p = subprocess.Popen(args, - stdout=subprocess.PIPE, - stderr=subprocess.STDOUT, - cwd=self.job_dir, - close_fds=True, - env=env - ) + stdout=subprocess.PIPE, + stderr=subprocess.STDOUT, + cwd=self.job_dir, + close_fds=True, + env=env) try: while p.poll() is None: for line in utils.nonblocking_readlines(p.stdout): if self.aborted.is_set(): p.terminate() - raise digits.inference.errors.InferenceError('%s classify many task got aborted. error code - %d' % (self.get_framework_id(), p.returncode)) + raise digits.inference.errors.InferenceError('%s classify many task got aborted.' + 'error code - %d' % (self.get_framework_id(), + p.returncode)) if line is not None and len(line) > 1: if not self.process_test_output(line, predictions, 'many'): - self.logger.warning('%s classify many task unrecognized input: %s' % (self.get_framework_id(), line.strip())) + self.logger.warning('%s classify many task unrecognized input: %s' % ( + self.get_framework_id(), line.strip())) unrecognized_output.append(line) else: time.sleep(0.05) @@ -862,7 +904,8 @@ def infer_many_images(self, images, snapshot_epoch=None, gpu=None): if type(e) == digits.inference.errors.InferenceError: error_message = e.__str__() else: - error_message = '%s classify many task failed with error code %d \n %s' % (self.get_framework_id(), p.returncode, str(e)) + error_message = '%s classify many task failed with error code %d \n %s' % ( + self.get_framework_id(), p.returncode, str(e)) self.logger.error(error_message) if unrecognized_output: unrecognized_output = '\n'.join(unrecognized_output) @@ -870,7 +913,8 @@ def infer_many_images(self, images, snapshot_epoch=None, gpu=None): raise digits.inference.errors.InferenceError(error_message) if p.returncode != 0: - error_message = '%s classify many task failed with error code %d' % (self.get_framework_id(), p.returncode) + error_message = '%s classify many task failed with error code %d' % (self.get_framework_id(), + p.returncode) self.logger.error(error_message) if unrecognized_output: unrecognized_output = '\n'.join(unrecognized_output) @@ -895,21 +939,19 @@ def get_model_files(self): """ return paths to model files """ - return { - "Network": self.model_file - } + return {"Network": self.model_file} @override def get_network_desc(self): """ return text description of network """ - with open (os.path.join(self.job_dir,TENSORFLOW_MODEL_FILE), "r") as infile: + with open(os.path.join(self.job_dir, TENSORFLOW_MODEL_FILE), "r") as infile: desc = infile.read() return desc @override - def get_task_stats(self,epoch=-1): + def get_task_stats(self, epoch=-1): """ return a dictionary of task statistics """ @@ -924,13 +966,13 @@ def get_task_stats(self,epoch=-1): "framework": "tensorflow" } - if hasattr(self,"digits_version"): + if hasattr(self, "digits_version"): stats.update({"digits version": self.digits_version}) - if hasattr(self.dataset,"resize_mode"): + if hasattr(self.dataset, "resize_mode"): stats.update({"image resize mode": self.dataset.resize_mode}) - if hasattr(self.dataset,"labels_file"): + if hasattr(self.dataset, "labels_file"): stats.update({"labels file": self.dataset.labels_file}) return stats diff --git a/digits/model/tasks/train.py b/digits/model/tasks/train.py index cc9c173d1..9c5cf4c07 100644 --- a/digits/model/tasks/train.py +++ b/digits/model/tasks/train.py @@ -435,7 
+435,7 @@ def infer_many(self, data, model_epoch=None): """ return None - def get_snapshot(self, epoch=-1): + def get_snapshot(self, epoch=-1, download=False): """ return snapshot file for specified epoch """ diff --git a/digits/model/views.py b/digits/model/views.py index 40f02a51c..ce5b7bff4 100644 --- a/digits/model/views.py +++ b/digits/model/views.py @@ -15,7 +15,7 @@ from . import ModelJob from digits.pretrained_model.job import PretrainedModelJob from digits import frameworks, extensions -from digits.utils import time_filters, auth +from digits.utils import auth from digits.utils.routing import request_wants_json, job_from_request, get_request_arg from digits.webapp import scheduler @@ -139,13 +139,14 @@ def visualize_network(): dataset = scheduler.get_job(flask.request.form['dataset_id']) fw = frameworks.get_framework_by_id(framework) - ret = fw.get_network_visualization(desc=flask.request.form['custom_network'], - dataset=dataset, - solver_type=flask.request.form['solver_type'] if 'solver_type' in flask.request.form else None, - use_mean=flask.request.form['use_mean'] if 'use_mean' in flask.request.form else None, - crop_size=flask.request.form['crop_size'] if 'crop_size' in flask.request.form else None, - num_gpus=flask.request.form['num_gpus'] if 'num_gpus' in flask.request.form else None, - ) + ret = fw.get_network_visualization( + desc=flask.request.form['custom_network'], + dataset=dataset, + solver_type=flask.request.form['solver_type'] if 'solver_type' in flask.request.form else None, + use_mean=flask.request.form['use_mean'] if 'use_mean' in flask.request.form else None, + crop_size=flask.request.form['crop_size'] if 'crop_size' in flask.request.form else None, + num_gpus=flask.request.form['num_gpus'] if 'num_gpus' in flask.request.form else None, + ) return ret diff --git a/digits/scheduler.py b/digits/scheduler.py index 557c17ffc..d9e06ddc9 100644 --- a/digits/scheduler.py +++ b/digits/scheduler.py @@ -107,7 +107,7 @@ def __init__(self, gpu_list=None, verbose=False): self.resources = { # TODO: break this into CPU cores, memory usage, IO usage, etc. 
'parse_folder_task_pool': [Resource()], - 'create_db_task_pool': [Resource(max_value=2)], + 'create_db_task_pool': [Resource(max_value=4)], 'analyze_db_task_pool': [Resource(max_value=4)], 'inference_task_pool': [Resource(max_value=4)], 'gpus': [Resource(identifier=index) diff --git a/digits/standard-networks/tensorflow/lenet.py b/digits/standard-networks/tensorflow/lenet.py index 302c3c621..677c905d6 100644 --- a/digits/standard-networks/tensorflow/lenet.py +++ b/digits/standard-networks/tensorflow/lenet.py @@ -15,6 +15,9 @@ def maxpool2d(x, k, s, padding='VALID'): # Create model def conv_net(x, weights, biases): + # scale (divide by MNIST std) + x = x * 0.0125 + # Convolution Layer conv1 = conv2d(x, weights['wc1'], biases['bc1'], s=1, padding='VALID') # Max Pooling (down-sampling) @@ -30,7 +33,7 @@ def conv_net(x, weights, biases): fc1 = tf.reshape(conv2, [-1, weights['wd1'].get_shape().as_list()[0]]) fc1 = tf.add(tf.matmul(fc1, weights['wd1']), biases['bd1']) fc1 = tf.nn.relu(fc1) - + # Apply Dropout if self.is_training: fc1 = tf.nn.dropout(fc1, 0.5) diff --git a/digits/standard-networks/tensorflow/lenet_slim.py b/digits/standard-networks/tensorflow/lenet_slim.py index fb7b4310b..58f64f020 100644 --- a/digits/standard-networks/tensorflow/lenet_slim.py +++ b/digits/standard-networks/tensorflow/lenet_slim.py @@ -3,7 +3,9 @@ class UserModel(Tower): @model_property def inference(self): x = tf.reshape(self.x, shape=[-1, self.input_shape[0], self.input_shape[1], self.input_shape[2]]) - with slim.arg_scope([slim.conv2d, slim.fully_connected], + # scale (divide by MNIST std) + x = x * 0.0125 + with slim.arg_scope([slim.conv2d, slim.fully_connected], weights_initializer=tf.contrib.layers.xavier_initializer(), weights_regularizer=slim.l2_regularizer(0.0005) ): model = slim.conv2d(x, 20, [5, 5], padding='VALID', scope='conv1') diff --git a/digits/templates/models/images/generic/show.html b/digits/templates/models/images/generic/show.html index 84a043881..6e98e1d81 100644 --- a/digits/templates/models/images/generic/show.html +++ b/digits/templates/models/images/generic/show.html @@ -29,6 +29,8 @@
Pretrained Model
{{task.pretrained_model}}
{% endif %} +
Visualizations
+
Tensorboard
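(Illustrative note, not part of the patch: the new Visualizations entry links to TensorBoard, and the TensorFlow training script in this patch set writes its event files under a 'tb' subdirectory of its --summaries_dir flag, as seen in gan_grid.py's SummaryWriter setup. A minimal sketch of pointing the TensorBoard CLI at that directory follows; the helper name is made up here and it assumes the tensorboard executable is installed and on PATH.)

import os
import subprocess

def launch_tensorboard(summaries_dir, port=6006):
    # gan_grid.py writes its event files under <summaries_dir>/tb
    logdir = os.path.join(summaries_dir, 'tb')
    # assumes the `tensorboard` CLI is available on PATH
    return subprocess.Popen(['tensorboard', '--logdir', logdir, '--port', str(port)])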
@@ -214,30 +216,54 @@

Inference Options

-{% if inference_form_html %} -{{ inference_form_html|safe }} -
- - -
+
+
+
+

Select Inference form

+
+ +
+
+
+
+ +
+
+
+
- -{% else %}
+
+
+ + +
+ + + + +
+
+ +

Test a single image
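(For reference only, not part of the patch: a hedged sketch of driving this single-image panel over HTTP instead of the browser form. The endpoint path and field names below are assumptions about DIGITS' generic image model REST API and may differ between versions; verify against your installation before relying on them.)

import requests

def infer_one(server, model_job_id, image_path):
    # Hypothetical endpoint and form fields; check your DIGITS version.
    url = server.rstrip('/') + '/models/images/generic/infer_one.json'
    with open(image_path, 'rb') as f:
        response = requests.post(url,
                                 data={'job_id': model_job_id},
                                 files={'image_file': f})
    response.raise_for_status()
    return response.json()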

@@ -344,10 +370,40 @@

Test a list of images

>
-{% endif %}
+ + {% endblock %} diff --git a/digits/tools/create_db.py b/digits/tools/create_db.py index 035d18173..2cde630e0 100755 --- a/digits/tools/create_db.py +++ b/digits/tools/create_db.py @@ -34,7 +34,10 @@ import caffe.io # noqa import caffe_pb2 # noqa -import tensorflow as tf # @TODO(tzaman) - remove TF dependency +if digits.config.config_value('tensorflow')['enabled']: + import tensorflow as tf +else: + tf = None logger = logging.getLogger('digits.tools.create_db') @@ -306,16 +309,20 @@ def create_db(input_file, output_dir, def _create_tfrecords(image_count, write_queue, batch_size, output_dir, - summary_queue, num_threads, - mean_files = None, - encoding = None, - lmdb_map_size = None, - **kwargs): + summary_queue, num_threads, + mean_files=None, + encoding=None, + lmdb_map_size=None, + **kwargs): """ Creates the TFRecords database(s) """ LIST_FILENAME = 'list.txt' - + + if not tf: + raise ValueError("Can't create TFRecords as support for Tensorflow " + "is not enabled.") + wait_time = time.time() threads_done = 0 images_loaded = 0 @@ -323,13 +330,12 @@ def _create_tfrecords(image_count, write_queue, batch_size, output_dir, image_sum = None compute_mean = bool(mean_files) - os.makedirs(output_dir) # We need shards to achieve good mixing properties because TFRecords # is a sequential/streaming reader, and has no random access. - num_shards = 16 # @TODO(tzaman) put some logic behind this + num_shards = 16 # @TODO(tzaman) put some logic behind this writers = [] with open(os.path.join(output_dir, LIST_FILENAME), 'w') as outfile: @@ -387,7 +393,6 @@ def _create_tfrecords(image_count, write_queue, batch_size, output_dir, writer.close() - def _create_lmdb(image_count, write_queue, batch_size, output_dir, summary_queue, num_threads, mean_files=None, @@ -702,10 +707,12 @@ def _initial_image_sum(width, height, channels): def _int64_feature(value): - return tf.train.Feature(int64_list=tf.train.Int64List(value=[value])) + return tf.train.Feature(int64_list=tf.train.Int64List(value=[value])) + def _bytes_feature(value): - return tf.train.Feature(bytes_list=tf.train.BytesList(value=[value])) + return tf.train.Feature(bytes_list=tf.train.BytesList(value=[value])) + def _array_to_tf_feature(image, label, encoding): """ @@ -725,23 +732,24 @@ def _array_to_tf_feature(image, label, encoding): else: raise ValueError('Invalid encoding type') image_raw = s.getvalue() - - depth = image.shape[2] if len(image.shape)>2 else 1 + + depth = image.shape[2] if len(image.shape) > 2 else 1 example = tf.train.Example( - features=tf.train.Features( - feature={ - 'height': _int64_feature(image.shape[0]), - 'width': _int64_feature(image.shape[1]), - 'depth': _int64_feature(depth), - 'label': _int64_feature(label), - 'image_raw': _bytes_feature(image_raw), - 'encoding' : _int64_feature(encoding_id), - # @TODO(tzaman) - add bitdepth flag? - } - )) + features=tf.train.Features( + feature={ + 'height': _int64_feature(image.shape[0]), + 'width': _int64_feature(image.shape[1]), + 'depth': _int64_feature(depth), + 'label': _int64_feature(label), + 'image_raw': _bytes_feature(image_raw), + 'encoding': _int64_feature(encoding_id), + # @TODO(tzaman) - add bitdepth flag? 
+ } + )) return example.SerializeToString() + def _array_to_datum(image, label, encoding): """ Create a caffe Datum from a numpy.ndarray @@ -891,8 +899,8 @@ def _save_means(image_sum, image_count, mean_files): help='Database compression format (gzip)' ) parser.add_argument('-b', '--backend', - default='lmdb', - help='The database backend - lmdb[default], hdf5 or tfrecords') + default='lmdb', + help='The database backend - lmdb[default], hdf5 or tfrecords') parser.add_argument('--lmdb_map_size', type=int, help='The initial map size for LMDB (in MB)') diff --git a/digits/tools/tensorflow/_test.py b/digits/tools/tensorflow/_test.py deleted file mode 100755 index 4bfd751be..000000000 --- a/digits/tools/tensorflow/_test.py +++ /dev/null @@ -1,127 +0,0 @@ -#!/usr/bin/python - -# This file is a scratchpad used to test main.py - -import os -import subprocess - -#dataset_dir = "/Users/tzaman/jobs/20160715-230349-5f23" #CIFAR100 -#dataset_dir = "/Users/tzaman/jobs/20160715-230434-21a4" #CIFAR10 LMDB -#dataset_dir = "/Users/tzaman/jobs/20160615-215643-75fd" #MNIST LMDB -#dataset_dir = "/Users/tzaman/jobs/gradient_regression" #Gradient Regression -#dataset_dir = "/Users/tzaman/jobs/20161002-185828-d0cd" #Triangle-segmentation -#dataset_dir = "/Users/tzaman/jobs/20161014-112206-c4ec" #MNIST HDF5 Uncompressed -#dataset_dir = "/Users/tzaman/jobs/20161014-112335-a0f1" #MNIST HDF5 GZIP -#dataset_dir = "/Users/tzaman/jobs/20161014-151839-2c91" #CIFAR10 HDF5 32x32 - -dataset_dir = "/home/tzaman/jobs/20161011-143422-78cb" #MNIST -#dataset_dir = "/home/tzaman/jobs/20161019-200547-1dcb" #CIFAR10 -#dataset_dir = "/home/tzaman/jobs/20161019-204719-79a4" #CIFAR10-256 - -# TIM'S OVERRIDES: -args = "" - -if 1: - args = args + ( - " --labels=" + dataset_dir + "/labels.txt" - " --networkDirectory=../../standard-networks/tensorflow" - #" --network=gradient.py" - " --network=lenet.py" - #" --network=alexnet-from-28.py" - #" --network=alexnet.py" - #" --network=siamese_simple.py" - #" --network=lenet_slim.py" - #" --network=rnn_mnist.py" - #" --network=autoencoder.py" - #" --network=binary_segmentation.py" - " --mean=" + dataset_dir + "/mean.binaryproto" - " --subtractMean=pixel" - #" --subtractMean=image" -# " --croplen=224" - " --train_db=" + dataset_dir + "/train_db" - " --validation_db=" + dataset_dir + "/val_db" - " --summaries_dir=/tmp/tb/" -# " --save=/Users/tzaman/Desktop/result" - " --seed=1" - " --epoch=1" - " --interval=1" - #" --tf_summaries_dir=/Users/tzaman/Desktop/tb/" - " --shuffle=False" - #" --optimization=adam" - #" --weights=/Users/tzaman/Desktop/result/loadme2" - " --batch_size=128" - " --log_runtime_stats_per_step=0" - " --snapshotInterval=0" - " --type=cpu" - ) - -if 0: #TFRecords - args = args + ( - #" --train_db=/Users/tzaman/Desktop/tfrecords_mnist/train.tfrecords" - " --train_db=/home/tzaman/tfrecords_mnist/train.tfrecords" - ) - -if 0: #Load weights for plain lenet - args = args + ( - " --weights=/Users/tzaman/jobs/20161014-173513-623a/snapshot_1.0_Model/Model.ckpt" - " --croplen=28" - ) - -if 0: #LR and Optimizer - args = args + ( - " --lr_policy=exp" - " --lr_gamma=0.98" - #" --lr_power=1" - " --lr_base_rate=0.1" - " --optimization=sgd" - ) - -if 0: #Visualize Network - args = args + ( - " --networkDirectory=../../digits/standard-networks/tensorflow" - " --network=lenet_slim.py" - " --visualizeModelPath=/Users/tzaman/Desktop/graphtest/x/test.pbtxt" - ) - -if 0: # toggle if using a dataset with labels in a db - args = args + ( - " --train_labels=" + dataset_dir + "/train_db_labels" - " 
--validation_labels=" + dataset_dir + "/val_db_labels" - ) - -if 0: # Inference - dataset_dir = "/Users/tzaman/jobs/20160615-215643-75fd" #MNIST - network_dir = "/Users/tzaman/jobs/20161015-162923-2ce8" #MNIST - inference_db = "/Users/tzaman/Desktop/zes.png" - #inference_db = "/Users/tzaman/Desktop/list.txt" - args = args + ( - " --inference_db=" + inference_db + "" - " --batch_size=1" - " --labels=" + dataset_dir + "/labels.txt" - " --mean=" + dataset_dir + "/mean.binaryproto" - " --subtractMean=pixel" - " --network=network.py" - " --networkDirectory=" + network_dir + "" - " --weights=" + network_dir + "/snapshot_1.0.ckpt" - #" --allPredictions=1" - #" --visualization=False" - #" --testMany=False" - #" --testUntil=-1" - ) - if 1: #with visualize - args = args + ( - " --visualize_inf=1" - ) - - - -# For some reason, the DYLD_LIBRARY_PATH is not copied with it, so supply in-line: - -#cmd = "DYLD_LIBRARY_PATH=$DYLD_LIBRARY_PATH:$CUDA_HOME/lib /opt/local/bin/python2.7 main.py" + args -cmd = "python main.py" + args - -p = subprocess.Popen(cmd, - close_fds=True, - env=os.environ.copy(), - shell=True - ).wait() diff --git a/digits/tools/tensorflow/caffe_tf_pb2.py b/digits/tools/tensorflow/caffe_tf_pb2.py index 20d919b12..fe99857ee 100644 --- a/digits/tools/tensorflow/caffe_tf_pb2.py +++ b/digits/tools/tensorflow/caffe_tf_pb2.py @@ -2,244 +2,241 @@ # source: caffe_tf.proto import sys -_b=sys.version_info[0]<3 and (lambda x:x) or (lambda x:x.encode('latin1')) from google.protobuf import descriptor as _descriptor from google.protobuf import message as _message from google.protobuf import reflection as _reflection from google.protobuf import symbol_database as _symbol_database -from google.protobuf import descriptor_pb2 +from google.protobuf import descriptor_pb2 # noqa # @@protoc_insertion_point(imports) -_sym_db = _symbol_database.Default() - +_b = (sys.version_info[0] < 3 and (lambda x: x)) or (lambda x: x.encode('latin1')) +_sym_db = _symbol_database.Default() DESCRIPTOR = _descriptor.FileDescriptor( - name='caffe_tf.proto', - package='', - serialized_pb=_b('\n\x0e\x63\x61\x66\x66\x65_tf.proto\"\x1c\n\tBlobShape\x12\x0f\n\x03\x64im\x18\x01 \x03(\x03\x42\x02\x10\x01\"\xc6\x01\n\tBlobProto\x12\x19\n\x05shape\x18\x07 \x01(\x0b\x32\n.BlobShape\x12\x10\n\x04\x64\x61ta\x18\x05 \x03(\x02\x42\x02\x10\x01\x12\x10\n\x04\x64iff\x18\x06 \x03(\x02\x42\x02\x10\x01\x12\x17\n\x0b\x64ouble_data\x18\x08 \x03(\x01\x42\x02\x10\x01\x12\x17\n\x0b\x64ouble_diff\x18\t \x03(\x01\x42\x02\x10\x01\x12\x0e\n\x03num\x18\x01 \x01(\x05:\x01\x30\x12\x13\n\x08\x63hannels\x18\x02 \x01(\x05:\x01\x30\x12\x11\n\x06height\x18\x03 \x01(\x05:\x01\x30\x12\x10\n\x05width\x18\x04 \x01(\x05:\x01\x30\",\n\x0f\x42lobProtoVector\x12\x19\n\x05\x62lobs\x18\x01 \x03(\x0b\x32\n.BlobProto\"\x81\x01\n\x05\x44\x61tum\x12\x10\n\x08\x63hannels\x18\x01 \x01(\x05\x12\x0e\n\x06height\x18\x02 \x01(\x05\x12\r\n\x05width\x18\x03 \x01(\x05\x12\x0c\n\x04\x64\x61ta\x18\x04 \x01(\x0c\x12\r\n\x05label\x18\x05 \x01(\x05\x12\x12\n\nfloat_data\x18\x06 \x03(\x02\x12\x16\n\x07\x65ncoded\x18\x07 \x01(\x08:\x05\x66\x61lse') + name='caffe_tf.proto', + package='', + serialized_pb=_b('\n\x0e\x63\x61\x66\x66\x65_tf.proto\"\x1c\n\tBlobShape\x12\x0f\n\x03\x64im\x18\x01 \x03(\x03\x42\x02\x10\x01\"\xc6\x01\n\tBlobProto\x12\x19\n\x05shape\x18\x07 \x01(\x0b\x32\n.BlobShape\x12\x10\n\x04\x64\x61ta\x18\x05 \x03(\x02\x42\x02\x10\x01\x12\x10\n\x04\x64iff\x18\x06 \x03(\x02\x42\x02\x10\x01\x12\x17\n\x0b\x64ouble_data\x18\x08 \x03(\x01\x42\x02\x10\x01\x12\x17\n\x0b\x64ouble_diff\x18\t 
\x03(\x01\x42\x02\x10\x01\x12\x0e\n\x03num\x18\x01 \x01(\x05:\x01\x30\x12\x13\n\x08\x63hannels\x18\x02 \x01(\x05:\x01\x30\x12\x11\n\x06height\x18\x03 \x01(\x05:\x01\x30\x12\x10\n\x05width\x18\x04 \x01(\x05:\x01\x30\",\n\x0f\x42lobProtoVector\x12\x19\n\x05\x62lobs\x18\x01 \x03(\x0b\x32\n.BlobProto\"\x81\x01\n\x05\x44\x61tum\x12\x10\n\x08\x63hannels\x18\x01 \x01(\x05\x12\x0e\n\x06height\x18\x02 \x01(\x05\x12\r\n\x05width\x18\x03 \x01(\x05\x12\x0c\n\x04\x64\x61ta\x18\x04 \x01(\x0c\x12\r\n\x05label\x18\x05 \x01(\x05\x12\x12\n\nfloat_data\x18\x06 \x03(\x02\x12\x16\n\x07\x65ncoded\x18\x07 \x01(\x08:\x05\x66\x61lse') # noqa ) _sym_db.RegisterFileDescriptor(DESCRIPTOR) - - _BLOBSHAPE = _descriptor.Descriptor( - name='BlobShape', - full_name='BlobShape', - filename=None, - file=DESCRIPTOR, - containing_type=None, - fields=[ - _descriptor.FieldDescriptor( - name='dim', full_name='BlobShape.dim', index=0, - number=1, type=3, cpp_type=2, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), - ], - extensions=[ - ], - nested_types=[], - enum_types=[ - ], - options=None, - is_extendable=False, - extension_ranges=[], - oneofs=[ - ], - serialized_start=18, - serialized_end=46, + name='BlobShape', + full_name='BlobShape', + filename=None, + file=DESCRIPTOR, + containing_type=None, + fields=[ + _descriptor.FieldDescriptor( + name='dim', full_name='BlobShape.dim', index=0, + number=1, type=3, cpp_type=2, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), + ], + extensions=[ + ], + nested_types=[], + enum_types=[ + ], + options=None, + is_extendable=False, + extension_ranges=[], + oneofs=[ + ], + serialized_start=18, + serialized_end=46, ) _BLOBPROTO = _descriptor.Descriptor( - name='BlobProto', - full_name='BlobProto', - filename=None, - file=DESCRIPTOR, - containing_type=None, - fields=[ - _descriptor.FieldDescriptor( - name='shape', full_name='BlobProto.shape', index=0, - number=7, type=11, cpp_type=10, label=1, - has_default_value=False, default_value=None, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='data', full_name='BlobProto.data', index=1, - number=5, type=2, cpp_type=6, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), - _descriptor.FieldDescriptor( - name='diff', full_name='BlobProto.diff', index=2, - number=6, type=2, cpp_type=6, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), - _descriptor.FieldDescriptor( - name='double_data', full_name='BlobProto.double_data', index=3, - number=8, type=1, cpp_type=5, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), 
_b('\020\001'))), - _descriptor.FieldDescriptor( - name='double_diff', full_name='BlobProto.double_diff', index=4, - number=9, type=1, cpp_type=5, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), - _descriptor.FieldDescriptor( - name='num', full_name='BlobProto.num', index=5, - number=1, type=5, cpp_type=1, label=1, - has_default_value=True, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='channels', full_name='BlobProto.channels', index=6, - number=2, type=5, cpp_type=1, label=1, - has_default_value=True, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='height', full_name='BlobProto.height', index=7, - number=3, type=5, cpp_type=1, label=1, - has_default_value=True, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='width', full_name='BlobProto.width', index=8, - number=4, type=5, cpp_type=1, label=1, - has_default_value=True, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - ], - extensions=[ - ], - nested_types=[], - enum_types=[ - ], - options=None, - is_extendable=False, - extension_ranges=[], - oneofs=[ - ], - serialized_start=49, - serialized_end=247, + name='BlobProto', + full_name='BlobProto', + filename=None, + file=DESCRIPTOR, + containing_type=None, + fields=[ + _descriptor.FieldDescriptor( + name='shape', full_name='BlobProto.shape', index=0, + number=7, type=11, cpp_type=10, label=1, + has_default_value=False, default_value=None, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='data', full_name='BlobProto.data', index=1, + number=5, type=2, cpp_type=6, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), + _descriptor.FieldDescriptor( + name='diff', full_name='BlobProto.diff', index=2, + number=6, type=2, cpp_type=6, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), + _descriptor.FieldDescriptor( + name='double_data', full_name='BlobProto.double_data', index=3, + number=8, type=1, cpp_type=5, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), + _descriptor.FieldDescriptor( + name='double_diff', full_name='BlobProto.double_diff', index=4, + number=9, type=1, cpp_type=5, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + 
options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001'))), + _descriptor.FieldDescriptor( + name='num', full_name='BlobProto.num', index=5, + number=1, type=5, cpp_type=1, label=1, + has_default_value=True, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='channels', full_name='BlobProto.channels', index=6, + number=2, type=5, cpp_type=1, label=1, + has_default_value=True, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='height', full_name='BlobProto.height', index=7, + number=3, type=5, cpp_type=1, label=1, + has_default_value=True, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='width', full_name='BlobProto.width', index=8, + number=4, type=5, cpp_type=1, label=1, + has_default_value=True, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + ], + extensions=[ + ], + nested_types=[], + enum_types=[ + ], + options=None, + is_extendable=False, + extension_ranges=[], + oneofs=[ + ], + serialized_start=49, + serialized_end=247, ) _BLOBPROTOVECTOR = _descriptor.Descriptor( - name='BlobProtoVector', - full_name='BlobProtoVector', - filename=None, - file=DESCRIPTOR, - containing_type=None, - fields=[ - _descriptor.FieldDescriptor( - name='blobs', full_name='BlobProtoVector.blobs', index=0, - number=1, type=11, cpp_type=10, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - ], - extensions=[ - ], - nested_types=[], - enum_types=[ - ], - options=None, - is_extendable=False, - extension_ranges=[], - oneofs=[ - ], - serialized_start=249, - serialized_end=293, + name='BlobProtoVector', + full_name='BlobProtoVector', + filename=None, + file=DESCRIPTOR, + containing_type=None, + fields=[ + _descriptor.FieldDescriptor( + name='blobs', full_name='BlobProtoVector.blobs', index=0, + number=1, type=11, cpp_type=10, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + ], + extensions=[ + ], + nested_types=[], + enum_types=[ + ], + options=None, + is_extendable=False, + extension_ranges=[], + oneofs=[ + ], + serialized_start=249, + serialized_end=293, ) _DATUM = _descriptor.Descriptor( - name='Datum', - full_name='Datum', - filename=None, - file=DESCRIPTOR, - containing_type=None, - fields=[ - _descriptor.FieldDescriptor( - name='channels', full_name='Datum.channels', index=0, - number=1, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='height', full_name='Datum.height', index=1, - number=2, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='width', full_name='Datum.width', index=2, - number=3, type=5, cpp_type=1, label=1, - 
has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='data', full_name='Datum.data', index=3, - number=4, type=12, cpp_type=9, label=1, - has_default_value=False, default_value=_b(""), - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='label', full_name='Datum.label', index=4, - number=5, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='float_data', full_name='Datum.float_data', index=5, - number=6, type=2, cpp_type=6, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='encoded', full_name='Datum.encoded', index=6, - number=7, type=8, cpp_type=7, label=1, - has_default_value=True, default_value=False, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - ], - extensions=[ - ], - nested_types=[], - enum_types=[ - ], - options=None, - is_extendable=False, - extension_ranges=[], - oneofs=[ - ], - serialized_start=296, - serialized_end=425, + name='Datum', + full_name='Datum', + filename=None, + file=DESCRIPTOR, + containing_type=None, + fields=[ + _descriptor.FieldDescriptor( + name='channels', full_name='Datum.channels', index=0, + number=1, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='height', full_name='Datum.height', index=1, + number=2, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='width', full_name='Datum.width', index=2, + number=3, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='data', full_name='Datum.data', index=3, + number=4, type=12, cpp_type=9, label=1, + has_default_value=False, default_value=_b(""), + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='label', full_name='Datum.label', index=4, + number=5, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='float_data', full_name='Datum.float_data', index=5, + number=6, type=2, cpp_type=6, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='encoded', full_name='Datum.encoded', index=6, + number=7, type=8, cpp_type=7, label=1, + has_default_value=True, default_value=False, + 
message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + ], + extensions=[ + ], + nested_types=[], + enum_types=[ + ], + options=None, + is_extendable=False, + extension_ranges=[], + oneofs=[ + ], + serialized_start=296, + serialized_end=425, ) _BLOBPROTO.fields_by_name['shape'].message_type = _BLOBSHAPE @@ -250,42 +247,47 @@ DESCRIPTOR.message_types_by_name['Datum'] = _DATUM BlobShape = _reflection.GeneratedProtocolMessageType('BlobShape', (_message.Message,), dict( - DESCRIPTOR = _BLOBSHAPE, - __module__ = 'caffe_tf_pb2' - # @@protoc_insertion_point(class_scope:BlobShape) - )) + DESCRIPTOR=_BLOBSHAPE, + __module__='caffe_tf_pb2' + # @@protoc_insertion_point(class_scope:BlobShape) + )) _sym_db.RegisterMessage(BlobShape) BlobProto = _reflection.GeneratedProtocolMessageType('BlobProto', (_message.Message,), dict( - DESCRIPTOR = _BLOBPROTO, - __module__ = 'caffe_tf_pb2' - # @@protoc_insertion_point(class_scope:BlobProto) - )) + DESCRIPTOR=_BLOBPROTO, + __module__='caffe_tf_pb2' + # @@protoc_insertion_point(class_scope:BlobProto) + )) _sym_db.RegisterMessage(BlobProto) BlobProtoVector = _reflection.GeneratedProtocolMessageType('BlobProtoVector', (_message.Message,), dict( - DESCRIPTOR = _BLOBPROTOVECTOR, - __module__ = 'caffe_tf_pb2' - # @@protoc_insertion_point(class_scope:BlobProtoVector) - )) + DESCRIPTOR=_BLOBPROTOVECTOR, + __module__='caffe_tf_pb2' + # @@protoc_insertion_point(class_scope:BlobProtoVector) + )) _sym_db.RegisterMessage(BlobProtoVector) Datum = _reflection.GeneratedProtocolMessageType('Datum', (_message.Message,), dict( - DESCRIPTOR = _DATUM, - __module__ = 'caffe_tf_pb2' - # @@protoc_insertion_point(class_scope:Datum) - )) + DESCRIPTOR=_DATUM, + __module__='caffe_tf_pb2' + # @@protoc_insertion_point(class_scope:Datum) + )) _sym_db.RegisterMessage(Datum) _BLOBSHAPE.fields_by_name['dim'].has_options = True -_BLOBSHAPE.fields_by_name['dim']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')) +_BLOBSHAPE.fields_by_name['dim']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), + _b('\020\001')) _BLOBPROTO.fields_by_name['data'].has_options = True -_BLOBPROTO.fields_by_name['data']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')) +_BLOBPROTO.fields_by_name['data']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), + _b('\020\001')) _BLOBPROTO.fields_by_name['diff'].has_options = True -_BLOBPROTO.fields_by_name['diff']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')) +_BLOBPROTO.fields_by_name['diff']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), + _b('\020\001')) _BLOBPROTO.fields_by_name['double_data'].has_options = True -_BLOBPROTO.fields_by_name['double_data']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')) +_BLOBPROTO.fields_by_name['double_data']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), + _b('\020\001')) _BLOBPROTO.fields_by_name['double_diff'].has_options = True -_BLOBPROTO.fields_by_name['double_diff']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')) +_BLOBPROTO.fields_by_name['double_diff']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), + _b('\020\001')) # @@protoc_insertion_point(module_scope) diff --git a/digits/tools/tensorflow/datum_pb2.py b/digits/tools/tensorflow/datum_pb2.py index bcb4d508c..9f0bc91a4 100644 --- 
a/digits/tools/tensorflow/datum_pb2.py +++ b/digits/tools/tensorflow/datum_pb2.py @@ -2,107 +2,105 @@ # source: datum.proto import sys -_b=sys.version_info[0]<3 and (lambda x:x) or (lambda x:x.encode('latin1')) + from google.protobuf import descriptor as _descriptor from google.protobuf import message as _message from google.protobuf import reflection as _reflection from google.protobuf import symbol_database as _symbol_database -from google.protobuf import descriptor_pb2 +from google.protobuf import descriptor_pb2 # noqa # @@protoc_insertion_point(imports) -_sym_db = _symbol_database.Default() - +_b = (sys.version_info[0] < 3 and (lambda x: x)) or (lambda x: x.encode('latin1')) +_sym_db = _symbol_database.Default() DESCRIPTOR = _descriptor.FileDescriptor( - name='datum.proto', - package='', - serialized_pb=_b('\n\x0b\x64\x61tum.proto\"\x81\x01\n\x05\x44\x61tum\x12\x10\n\x08\x63hannels\x18\x01 \x01(\x05\x12\x0e\n\x06height\x18\x02 \x01(\x05\x12\r\n\x05width\x18\x03 \x01(\x05\x12\x0c\n\x04\x64\x61ta\x18\x04 \x01(\x0c\x12\r\n\x05label\x18\x05 \x01(\x05\x12\x12\n\nfloat_data\x18\x06 \x03(\x02\x12\x16\n\x07\x65ncoded\x18\x07 \x01(\x08:\x05\x66\x61lse') + name='datum.proto', + package='', + serialized_pb=_b('\n\x0b\x64\x61tum.proto\"\x81\x01\n\x05\x44\x61tum\x12\x10\n\x08\x63hannels\x18\x01 \x01(\x05\x12\x0e\n\x06height\x18\x02 \x01(\x05\x12\r\n\x05width\x18\x03 \x01(\x05\x12\x0c\n\x04\x64\x61ta\x18\x04 \x01(\x0c\x12\r\n\x05label\x18\x05 \x01(\x05\x12\x12\n\nfloat_data\x18\x06 \x03(\x02\x12\x16\n\x07\x65ncoded\x18\x07 \x01(\x08:\x05\x66\x61lse') # noqa ) _sym_db.RegisterFileDescriptor(DESCRIPTOR) - - _DATUM = _descriptor.Descriptor( - name='Datum', - full_name='Datum', - filename=None, - file=DESCRIPTOR, - containing_type=None, - fields=[ - _descriptor.FieldDescriptor( - name='channels', full_name='Datum.channels', index=0, - number=1, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='height', full_name='Datum.height', index=1, - number=2, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='width', full_name='Datum.width', index=2, - number=3, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='data', full_name='Datum.data', index=3, - number=4, type=12, cpp_type=9, label=1, - has_default_value=False, default_value=_b(""), - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='label', full_name='Datum.label', index=4, - number=5, type=5, cpp_type=1, label=1, - has_default_value=False, default_value=0, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='float_data', full_name='Datum.float_data', index=5, - number=6, type=2, cpp_type=6, label=3, - has_default_value=False, default_value=[], - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - _descriptor.FieldDescriptor( - name='encoded', 
full_name='Datum.encoded', index=6, - number=7, type=8, cpp_type=7, label=1, - has_default_value=True, default_value=False, - message_type=None, enum_type=None, containing_type=None, - is_extension=False, extension_scope=None, - options=None), - ], - extensions=[ - ], - nested_types=[], - enum_types=[ - ], - options=None, - is_extendable=False, - extension_ranges=[], - oneofs=[ - ], - serialized_start=16, - serialized_end=145, + name='Datum', + full_name='Datum', + filename=None, + file=DESCRIPTOR, + containing_type=None, + fields=[ + _descriptor.FieldDescriptor( + name='channels', full_name='Datum.channels', index=0, + number=1, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='height', full_name='Datum.height', index=1, + number=2, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='width', full_name='Datum.width', index=2, + number=3, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='data', full_name='Datum.data', index=3, + number=4, type=12, cpp_type=9, label=1, + has_default_value=False, default_value=_b(""), + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='label', full_name='Datum.label', index=4, + number=5, type=5, cpp_type=1, label=1, + has_default_value=False, default_value=0, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='float_data', full_name='Datum.float_data', index=5, + number=6, type=2, cpp_type=6, label=3, + has_default_value=False, default_value=[], + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + _descriptor.FieldDescriptor( + name='encoded', full_name='Datum.encoded', index=6, + number=7, type=8, cpp_type=7, label=1, + has_default_value=True, default_value=False, + message_type=None, enum_type=None, containing_type=None, + is_extension=False, extension_scope=None, + options=None), + ], + extensions=[ + ], + nested_types=[], + enum_types=[ + ], + options=None, + is_extendable=False, + extension_ranges=[], + oneofs=[ + ], + serialized_start=16, + serialized_end=145, ) DESCRIPTOR.message_types_by_name['Datum'] = _DATUM Datum = _reflection.GeneratedProtocolMessageType('Datum', (_message.Message,), dict( - DESCRIPTOR = _DATUM, - __module__ = 'datum_pb2' - # @@protoc_insertion_point(class_scope:Datum) - )) + DESCRIPTOR=_DATUM, + __module__='datum_pb2' + # @@protoc_insertion_point(class_scope:Datum) + )) _sym_db.RegisterMessage(Datum) diff --git a/digits/tools/tensorflow/gan_grid.py b/digits/tools/tensorflow/gan_grid.py new file mode 100644 index 000000000..ddbe37071 --- /dev/null +++ b/digits/tools/tensorflow/gan_grid.py @@ -0,0 +1,815 @@ +#!/usr/bin/env python2 +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. 
+# +# This document should comply with PEP-8 Style Guide +# Linter: pylint + +""" +TensorFlow training executable for DIGITS +Defines the training procedure + +Usage: +See the self-documenting flags below. + +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import threading +import time + +import datetime +import inspect +import json +import logging +import math +import numpy as np +import os +import pickle +import time + +from six.moves import xrange # noqa +import tensorflow as tf +import tensorflow.contrib.slim as slim # noqa +from tensorflow.python.client import timeline, device_lib # noqa +from tensorflow.python.ops import template # noqa +from tensorflow.python.lib.io import file_io +from tensorflow.core.framework import summary_pb2 + + +# Local imports +import utils as digits +import lr_policy +from model import Model, Tower # noqa +from utils import model_property # noqa + +import tf_data +import gandisplay + + + +# Constants +TF_INTRA_OP_THREADS = 0 +TF_INTER_OP_THREADS = 0 +MIN_LOGS_PER_TRAIN_EPOCH = 8 # torch default: 8 + + +CELEBA_ALL_ATTRIBUTES = """ + 5_o_Clock_Shadow Arched_Eyebrows Attractive Bags_Under_Eyes Bald Bangs + Big_Lips Big_Nose Black_Hair Blond_Hair Blurry Brown_Hair Bushy_Eyebrows + Chubby Double_Chin Eyeglasses Goatee Gray_Hair Heavy_Makeup High_Cheekbones + Male Mouth_Slightly_Open Mustache Narrow_Eyes No_Beard Oval_Face Pale_Skin + Pointy_Nose Receding_Hairline Rosy_Cheeks Sideburns Smiling Straight_Hair + Wavy_Hair Wearing_Earrings Wearing_Hat Wearing_Lipstick Wearing_Necklace + Wearing_Necktie Young + """.split() + +CELEBA_EDITABLE_ATTRIBUTES = [ + 'Bald', 'Black_Hair', 'Blond_Hair', 'Eyeglasses', 'Male', 'Mustache', 'Smiling', 'Young', 'Attractive', 'Pale_Skin', 'Big_Nose' +] + +CELEBA_EDITABLE_ATTRIBUTES_IDS = [CELEBA_ALL_ATTRIBUTES.index(attr) for attr in CELEBA_EDITABLE_ATTRIBUTES] + + +logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s', + datefmt='%Y-%m-%d %H:%M:%S', + level=logging.INFO) + +FLAGS = tf.app.flags.FLAGS + +# Basic model parameters. #float, integer, boolean, string +tf.app.flags.DEFINE_integer('batch_size', 16, """Number of images to process in a batch""") +tf.app.flags.DEFINE_integer( + 'croplen', 0, """Crop (x and y). 
A zero value means no cropping will be applied""") +tf.app.flags.DEFINE_integer('epoch', 1, """Number of epochs to train, -1 for unbounded""") +tf.app.flags.DEFINE_string('inference_db', '', """Directory with inference file source""") +tf.app.flags.DEFINE_integer( + 'validation_interval', 1, """Number of train epochs to complete, to perform one validation""") +tf.app.flags.DEFINE_string('labels_list', '', """Text file listing label definitions""") +tf.app.flags.DEFINE_string('mean', '', """Mean image file""") +tf.app.flags.DEFINE_float('momentum', '0.9', """Momentum""") # Not used by DIGITS front-end +tf.app.flags.DEFINE_string('network', '', """File containing network (model)""") +tf.app.flags.DEFINE_string('networkDirectory', '', """Directory in which network exists""") +tf.app.flags.DEFINE_string('optimization', 'sgd', """Optimization method""") +tf.app.flags.DEFINE_string('save', 'results', """Save directory""") +tf.app.flags.DEFINE_integer('seed', 0, """Fixed input seed for repeatable experiments""") +tf.app.flags.DEFINE_boolean('shuffle', False, """Shuffle records before training""") +tf.app.flags.DEFINE_float( + 'snapshotInterval', 1.0, + """Specifies the training epochs to be completed before taking a snapshot""") +tf.app.flags.DEFINE_string('snapshotPrefix', '', """Prefix of the weights/snapshots""") +tf.app.flags.DEFINE_string( + 'subtractMean', 'none', + """Select mean subtraction method. Possible values are 'image', 'pixel' or 'none'""") +tf.app.flags.DEFINE_string('train_db', '', """Directory with training file source""") +tf.app.flags.DEFINE_string( + 'train_labels', '', + """Directory with an optional and separate labels file source for training""") +tf.app.flags.DEFINE_string('validation_db', '', """Directory with validation file source""") +tf.app.flags.DEFINE_string( + 'validation_labels', '', + """Directory with an optional and separate labels file source for validation""") +tf.app.flags.DEFINE_string( + 'visualizeModelPath', '', """Constructs the current model for visualization""") +tf.app.flags.DEFINE_boolean( + 'visualize_inf', False, """Will output weights and activations for an inference job.""") +tf.app.flags.DEFINE_string( + 'weights', '', """Filename for weights of a model to use for fine-tuning""") + +# @TODO(tzaman): is the bitdepth in line with the DIGITS team? +tf.app.flags.DEFINE_integer('bitdepth', 8, """Specifies an image's bitdepth""") + +# @TODO(tzaman); remove torch mentions below +tf.app.flags.DEFINE_float('lr_base_rate', '0.01', """Learning rate""") +tf.app.flags.DEFINE_string( + 'lr_policy', 'fixed', + """Learning rate policy. (fixed, step, exp, inv, multistep, poly, sigmoid)""") +tf.app.flags.DEFINE_float( + 'lr_gamma', -1, + """Required to calculate learning rate. Applies to: (step, exp, inv, multistep, sigmoid)""") +tf.app.flags.DEFINE_float( + 'lr_power', float('Inf'), + """Required to calculate learning rate. Applies to: (inv, poly)""") +tf.app.flags.DEFINE_string( + 'lr_stepvalues', '', + """Required to calculate stepsize of the learning rate. Applies to: (step, multistep, sigmoid).
+ For the 'multistep' lr_policy you can input multiple values separated by commas""") + +# Tensorflow-unique arguments for DIGITS +tf.app.flags.DEFINE_string( + 'save_vars', 'all', + """Sets the collection of variables to be saved: 'all' or only 'trainable'.""") +tf.app.flags.DEFINE_string('summaries_dir', '', """Directory of Tensorboard Summaries (logdir)""") +tf.app.flags.DEFINE_boolean( + 'serving_export', False, """Flag for exporting a Tensorflow Serving model""") +tf.app.flags.DEFINE_boolean('log_device_placement', False, """Whether to log device placement.""") +tf.app.flags.DEFINE_integer( + 'log_runtime_stats_per_step', 0, + """Logs runtime statistics for Tensorboard every x steps, defaults to 0 (off).""") + +# Augmentation +tf.app.flags.DEFINE_string( + 'augFlip', 'none', + """The flip options {none, fliplr, flipud, fliplrud} as random pre-processing augmentation""") +tf.app.flags.DEFINE_float( + 'augNoise', 0., """The stddev of Noise in AWGN as pre-processing augmentation""") +tf.app.flags.DEFINE_float( + 'augContrast', 0., """The contrast factor's bounds as sampled from a random-uniform distribution + as pre-processing augmentation""") +tf.app.flags.DEFINE_bool( + 'augWhitening', False, """Performs per-image whitening by subtracting off its own mean and + dividing by its own standard deviation.""") +tf.app.flags.DEFINE_float( + 'augHSVh', 0., """The stddev of HSV's Hue shift as pre-processing augmentation""") +tf.app.flags.DEFINE_float( + 'augHSVs', 0., """The stddev of HSV's Saturation shift as pre-processing augmentation""") +tf.app.flags.DEFINE_float( + 'augHSVv', 0., """The stddev of HSV's Value shift as pre-processing augmentation""") + +# GAN Grid +tf.app.flags.DEFINE_string('zs_file', 'zs.pkl', """Pickle file containing z vectors to use""") +tf.app.flags.DEFINE_string('attributes_file', 'attributes.pkl', """Pickle file containing attribute vectors""") + + +def save_timeline_trace(run_metadata, save_dir, step): + tl = timeline.Timeline(run_metadata.step_stats) + ctf = tl.generate_chrome_trace_format(show_memory=True) + tl_fn = os.path.join(save_dir, 'timeline_%s.json' % step) + with open(tl_fn, 'w') as f: + f.write(ctf) + logging.info('Timeline trace written to %s', tl_fn) + + +def strip_data_from_graph_def(graph_def): + strip_def = tf.GraphDef() + for n0 in graph_def.node: + n = strip_def.node.add() + n.MergeFrom(n0) + if n.op == 'Const': + tensor = n.attr['value'].tensor + if (tensor.tensor_content): + tensor.tensor_content = '' + if (tensor.string_val): + del tensor.string_val[:] + return strip_def + + +def visualize_graph(graph_def, path): + graph_def = strip_data_from_graph_def(graph_def) + logging.info('Writing Graph Definition..') + file_io.write_string_to_file(path, str(graph_def)) + logging.info('Graph Definition Written.') + + +def average_head_keys(tags, vals): + """ Averages keys with same end (head) name.
+ Example: foo1/bar=1 and foo2/bar=2 should collapse to bar=1.5 + """ + tail_tags = [w.split('/')[-1] for w in tags] + sums = {} + nums = {} + for a, b in zip(tail_tags, vals): + if a not in sums: + sums[a] = b + nums[a] = 1 + else: + sums[a] += b + nums[a] += 1 + tags_clean = sums.keys() + return tags_clean, np.asarray(sums.values())/np.asarray(nums.values()) + + +def summary_to_lists(summary_str): + """ Takes a Tensorflow stringified Summary object and returns only + the scalar values to a list of tags and a list of values + Args: + summary_str: string of a Tensorflow Summary object + Returns: + tags: list of tags + vals: list of values corresponding to the tag list + + """ + summ = summary_pb2.Summary() + summ.ParseFromString(summary_str) + tags = [] + vals = [] + for s in summ.value: + if s.HasField('simple_value'): # and s.simple_value: # Only parse scalar_summaries + if s.simple_value == float('Inf') or np.isnan(s.simple_value): + raise ValueError('Model diverged with %s = %s : Try decreasing your learning rate' % + (s.tag, s.simple_value)) + tags.append(s.tag) + vals.append(s.simple_value) + tags, vals = average_head_keys(tags, vals) + vals = np.asarray(vals) + return tags, vals + + +def print_summarylist(tags, vals): + """ Prints a nice one-line listing of tags and their values in a nice format + that corresponds to how the DIGITS regex reads it. + Args: + tags: an array of tags + vals: an array of values + Returns: + print_list: a string containing formatted tags and values + """ + print_list = '' + for i, key in enumerate(tags): + if vals[i] == float('Inf'): + raise ValueError('Infinite value %s = Inf' % key) + print_list = print_list + key + " = " + "{:.6f}".format(vals[i]) + if i < len(tags)-1: + print_list = print_list + ", " + return print_list + + +def dump(obj): + for attr in dir(obj): + print("obj.%s = %s" % (attr, getattr(obj, attr))) + + +def load_snapshot(sess, weight_path, var_candidates): + """ Loads a snapshot into a session from a weight path. Will only load the + weights that are both in the weight_path file and the passed var_candidates.""" + logging.info("Loading weights from pretrained model - %s ", weight_path) + reader = tf.train.NewCheckpointReader(weight_path) + var_map = reader.get_variable_to_shape_map() + + # Only obtain all the variables that are [in the current graph] AND [in the checkpoint] + vars_restore = [] + for vt in var_candidates: + for vm in var_map.keys(): + if vt.name.split(':')[0] == vm: + if ("global_step" not in vt.name) and not (vt.name.startswith("train/")): + vars_restore.append(vt) + logging.info('restoring %s -> %s' % (vm, vt.name)) + else: + logging.info('NOT restoring %s -> %s' % (vm, vt.name)) + + logging.info('Restoring %s variable ops.' % len(vars_restore)) + tf.train.Saver(vars_restore, max_to_keep=0, sharded=FLAGS.serving_export).restore(sess, weight_path) + logging.info('Variables restored.') + + +def save_snapshot(sess, saver, save_dir, snapshot_prefix, epoch, for_serving=False): + """ + Saves a snapshot of the current session, saving all variables previously defined + in the ctor of the saver. Also saves the flow of the graph itself (only once). + """ + number_dec = str(FLAGS.snapshotInterval-int(FLAGS.snapshotInterval))[2:] + if number_dec is '': + number_dec = '0' + epoch_fmt = "{:." 
+ number_dec + "f}" + + snapshot_file = os.path.join(save_dir, snapshot_prefix + '_' + epoch_fmt.format(epoch) + '.ckpt') + + logging.info('Snapshotting to %s', snapshot_file) + saver.save(sess, snapshot_file) + logging.info('Snapshot saved.') + + if for_serving: + # @TODO(tzaman) : we could further extend this by supporting tensorflow-serve + logging.error('NotImplementedError: Tensorflow-Serving support.') + exit(-1) + + # Past this point the graph shouldn't be changed, so saving it once is enough + filename_graph = os.path.join(save_dir, snapshot_prefix + '.graph_def') + if not os.path.isfile(filename_graph): + with open(filename_graph, 'wb') as f: + logging.info('Saving graph to %s', filename_graph) + f.write(sess.graph_def.SerializeToString()) + logging.info('Saved graph to %s', filename_graph) + # meta_graph_def = tf.train.export_meta_graph(filename='?') + + +def save_weight_visualization(w_names, a_names, w, a): + try: + import h5py + except ImportError: + logging.error("Attempt to create HDF5 Loader but h5py is not installed.") + exit(-1) + fn = os.path.join(FLAGS.save, 'vis.h5') + vis_db = h5py.File(fn, 'w') + db_layers = vis_db.create_group("layers") + + logging.info('Saving visualization to %s', fn) + for i in range(0, len(w)): + dset = db_layers.create_group(str(i)) + dset.attrs['var'] = w_names[i].name + dset.attrs['op'] = a_names[i] + if w[i].shape: + dset.create_dataset('weights', data=w[i]) + if a[i].shape: + dset.create_dataset('activations', data=a[i]) + vis_db.close() + + +def Inference(sess, model): + """ + Runs one inference (evaluation) epoch (all the files in the loader) + """ + + inference_op = model.towers[0].inference + if FLAGS.labels_list: # Classification -> assume softmax usage + # Append a softmax op + inference_op = tf.nn.softmax(inference_op) + + weight_vars = [] + activation_ops = [] + if FLAGS.visualize_inf: + trainable_weights = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES) + # Retrace the origin op of each variable + for n in tf.get_default_graph().as_graph_def().node: + for tw in trainable_weights: + tw_name_reader = tw.name.split(':')[0] + '/read' + if tw_name_reader in n.input: + node_op_name = n.name + ':0' # @TODO(tzaman) this assumes exactly 1 output - allow to be dynamic! + weight_vars.append(tw) + activation_ops.append(node_op_name) + continue + + try: + t = 0 + + with open(FLAGS.attributes_file, 'rb') as f: + attribute_zs = pickle.load(f) + + while not False: # model.queue_coord.should_stop(): + + attributes = app.GetAttributes() + + z = np.zeros(100) + + for idx, attr_scale in enumerate(attributes): + z += (attr_scale / 25. ) * attribute_zs[CELEBA_EDITABLE_ATTRIBUTES_IDS[idx]] + + feed_dict = {model.time_placeholder: float(t), + model.attribute_placeholder: z} + preds = sess.run(fetches=inference_op, feed_dict=feed_dict) + + if FLAGS.visualize_inf: + save_weight_visualization(weight_vars, activation_ops, w, a) + + # @TODO(tzaman): error on no output? + #for i in range(len(keys)): + # # for j in range(len(preds)): + # # We're allowing multiple predictions per image here. DIGITS doesnt support that iirc + # logging.info('Predictions for image ' + str(model.dataloader.get_key_index(keys[i])) + + # ': ' + json.dumps(preds[i].tolist())) + #logging.info('Predictions shape: %s' % str(preds.shape)) + app.DisplayCell(preds) + + t += 1e-5 * app.GetSpeed() * FLAGS.batch_size + + except tf.errors.OutOfRangeError: + print('Done: tf.errors.OutOfRangeError') + + +def Validation(sess, model, current_epoch): + """ + Runs one validation epoch. 
+ """ + + # @TODO(tzaman): utilize the coordinator by resetting the queue after 1 epoch. + # see https://github.com/tensorflow/tensorflow/issues/4535#issuecomment-248990633 + + print_vals_sum = 0 + steps = 0 + while (steps * model.dataloader.batch_size) < model.dataloader.get_total(): + summary_str = sess.run(model.summary) + # Parse the summary + tags, print_vals = summary_to_lists(summary_str) + print_vals_sum = print_vals + print_vals_sum + steps += 1 + + print_list = print_summarylist(tags, print_vals_sum/steps) + + logging.info("Validation (epoch " + str(current_epoch) + "): " + print_list) + + +def loadLabels(filename): + with open(filename) as f: + return f.readlines() + + +def input_generator(zs_file, batch_size): + + time_placeholder = tf.placeholder(dtype=tf.float32, shape=()) + attribute_placeholder = tf.placeholder(dtype=tf.float32, shape=(100,)) + + def l2_norm(x): + euclidean_norm = tf.sqrt(tf.reduce_sum(tf.square(x))) + return euclidean_norm + + def dot_product(x, y): + return tf.reduce_sum(tf.mul(x,y)) + + def slerp(initial, final, progress): + omega = tf.acos(dot_product(initial / l2_norm(initial), final / l2_norm(final))) + so = tf.sin(omega) + return tf.sin((1.0-progress)*omega) / so * initial + tf.sin(progress*omega)/so * final + + with open(zs_file, 'rb') as f: + zs = pickle.load(f) + img_count = len(zs) + zs = tf.constant(zs, dtype=tf.float32) + + tensors = [] + + epoch = tf.to_int32(time_placeholder) + indices = tf.range(batch_size) + indices_init = (indices * batch_size + epoch) % img_count + indices_final = (indices_init + 1) % img_count + + for i in xrange(batch_size): + z_init = zs[indices_init[i]] + z_final = zs[indices_final[i]] + + progress = tf.mod(time_placeholder, 1) + + # progress = tf.Print(progress, [progress]) + + z = slerp(z_init, z_final, progress) + + tensors.append(z) + + batch = tf.pack(tensors) + attribute_placeholder + + return batch, time_placeholder, attribute_placeholder + +def main(_): + + # Always keep the cpu as default + with tf.Graph().as_default(), tf.device('/cpu:0'): + + if FLAGS.validation_interval == 0: + FLAGS.validation_db = None + + # Set Tensorboard log directory + if FLAGS.summaries_dir: + # The following gives a nice but unrobust timestamp + FLAGS.summaries_dir = os.path.join(FLAGS.summaries_dir, datetime.datetime.now().strftime("%Y%m%d_%H%M%S")) + + if not FLAGS.train_db and not FLAGS.validation_db and not FLAGS.inference_db and not FLAGS.visualizeModelPath: + logging.error("At least one of the following file sources should be specified: " + "train_db, validation_db or inference_db") + exit(-1) + + if FLAGS.seed: + tf.set_random_seed(FLAGS.seed) + + batch_size_train = FLAGS.batch_size + batch_size_val = FLAGS.batch_size + logging.info("Train batch size is %s and validation batch size is %s", batch_size_train, batch_size_val) + + # This variable keeps track of next epoch, when to perform validation. + next_validation = FLAGS.validation_interval + logging.info("Training epochs to be completed for each validation : %s", next_validation) + + # This variable keeps track of next epoch, when to save model weights. 
+ next_snapshot_save = FLAGS.snapshotInterval + logging.info("Training epochs to be completed before taking a snapshot : %s", next_snapshot_save) + last_snapshot_save_epoch = 0 + + snapshot_prefix = FLAGS.snapshotPrefix if FLAGS.snapshotPrefix else FLAGS.network.split('.')[0] + logging.info("Model weights will be saved as %s__Model.ckpt", snapshot_prefix) + + if not os.path.exists(FLAGS.save): + os.makedirs(FLAGS.save) + logging.info("Created a directory %s to save all the snapshots", FLAGS.save) + + # Load mean variable + if FLAGS.subtractMean == 'none': + mean_loader = None + else: + if not FLAGS.mean: + logging.error("subtractMean parameter not set to 'none' yet mean image path is unset") + exit(-1) + logging.info("Loading mean tensor from %s file", FLAGS.mean) + mean_loader = tf_data.MeanLoader(FLAGS.mean, FLAGS.subtractMean, FLAGS.bitdepth) + + classes = 0 + nclasses = 0 + if FLAGS.labels_list: + logging.info("Loading label definitions from %s file", FLAGS.labels_list) + classes = loadLabels(FLAGS.labels_list) + nclasses = len(classes) + if not classes: + logging.error("Reading labels file %s failed.", FLAGS.labels_list) + exit(-1) + logging.info("Found %s classes", nclasses) + + # Create a data-augmentation dict + aug_dict = { + 'aug_flip': FLAGS.augFlip, + 'aug_noise': FLAGS.augNoise, + 'aug_contrast': FLAGS.augContrast, + 'aug_whitening': FLAGS.augWhitening, + 'aug_HSV': { + 'h': FLAGS.augHSVh, + 's': FLAGS.augHSVs, + 'v': FLAGS.augHSVv, + }, + } + + # hard-code GAN inference + FLAGS.inference_db = "grid.gan" + + # Import the network file + path_network = os.path.join(os.path.dirname(os.path.realpath(__file__)), FLAGS.networkDirectory, FLAGS.network) + exec(open(path_network).read(), globals()) + + try: + UserModel + except NameError: + logging.error("The user model class 'UserModel' is not defined.") + exit(-1) + if not inspect.isclass(UserModel): # noqa + logging.error("The user model class 'UserModel' is not a class.") + exit(-1) + # @TODO(tzaman) - add mode checks to UserModel + + if FLAGS.train_db: + with tf.name_scope(digits.STAGE_TRAIN) as stage_scope: + train_model = Model(digits.STAGE_TRAIN, FLAGS.croplen, nclasses, FLAGS.optimization, FLAGS.momentum) + train_model.create_dataloader(FLAGS.train_db) + train_model.dataloader.setup(FLAGS.train_labels, + FLAGS.shuffle, + FLAGS.bitdepth, + batch_size_train, + FLAGS.epoch, + FLAGS.seed) + train_model.dataloader.set_augmentation(mean_loader, aug_dict) + train_model.create_model(UserModel, stage_scope) # noqa + + if FLAGS.validation_db: + with tf.name_scope(digits.STAGE_VAL) as stage_scope: + val_model = Model(digits.STAGE_VAL, FLAGS.croplen, nclasses) + val_model.create_dataloader(FLAGS.validation_db) + val_model.dataloader.setup(FLAGS.validation_labels, + False, + FLAGS.bitdepth, + batch_size_val, + 1e9, + FLAGS.seed) # @TODO(tzaman): set numepochs to 1 + val_model.dataloader.set_augmentation(mean_loader) + val_model.create_model(UserModel, stage_scope) # noqa + + if FLAGS.inference_db: + with tf.name_scope(digits.STAGE_INF) as stage_scope: + inf_model = Model(digits.STAGE_INF, FLAGS.croplen, nclasses) + inf_model.create_dataloader(FLAGS.inference_db) + inf_model.dataloader.setup(None, False, FLAGS.bitdepth, FLAGS.batch_size, 1, FLAGS.seed) + inf_model.dataloader.set_augmentation(mean_loader) + + batch_x, time_placeholder, attribute_placeholder = input_generator(FLAGS.zs_file, FLAGS.batch_size) + + inf_model.create_model(UserModel, stage_scope, batch_x=batch_x) # noqa + + inf_model.time_placeholder = time_placeholder + 
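+            # Inference() feeds these placeholders every frame: 'time' drives the slerp progress
+            # through the stored z vectors, and 'attributes' adds the slider-weighted CelebA
+            # attribute directions to z inside input_generator().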
inf_model.attribute_placeholder = attribute_placeholder + + # Start running operations on the Graph. allow_soft_placement must be set to + # True to build towers on GPU, as some of the ops do not have GPU + # implementations. + sess = tf.Session(config=tf.ConfigProto( + allow_soft_placement=True, # will automatically do non-gpu supported ops on cpu + inter_op_parallelism_threads=TF_INTER_OP_THREADS, + intra_op_parallelism_threads=TF_INTRA_OP_THREADS, + log_device_placement=FLAGS.log_device_placement)) + + if FLAGS.visualizeModelPath: + visualize_graph(sess.graph_def, FLAGS.visualizeModelPath) + exit(0) + + # Saver creation. + if FLAGS.save_vars == 'all': + vars_to_save = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES) + elif FLAGS.save_vars == 'trainable': + vars_to_save = tf.all_variables() + else: + logging.error('Unknown save_var flag (%s)' % FLAGS.save_vars) + exit(-1) + saver = tf.train.Saver(vars_to_save, max_to_keep=0, sharded=FLAGS.serving_export) + + # Initialize variables + init_op = tf.group(tf.global_variables_initializer(), tf.local_variables_initializer()) + sess.run(init_op) + + # If weights option is set, preload weights from existing models appropriately + if FLAGS.weights: + load_snapshot(sess, FLAGS.weights, tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES)) + + # Tensorboard: Merge all the summaries and write them out + writer = tf.train.SummaryWriter(os.path.join(FLAGS.summaries_dir, 'tb'), sess.graph) + + # If we are inferencing, only do that. + if FLAGS.inference_db: + inf_model.start_queue_runners(sess) + Inference(sess, inf_model) + + queue_size_op = [] + for n in tf.get_default_graph().as_graph_def().node: + if '_Size' in n.name: + queue_size_op.append(n.name+':0') + + start = time.time() # @TODO(tzaman) - removeme + + # Initial Forward Validation Pass + if FLAGS.validation_db: + val_model.start_queue_runners(sess) + Validation(sess, val_model, 0) + + if FLAGS.train_db: + # During training, a log output should occur at least X times per epoch or every X images, whichever lower + train_steps_per_epoch = train_model.dataloader.get_total() / batch_size_train + if math.ceil(train_steps_per_epoch/MIN_LOGS_PER_TRAIN_EPOCH) < math.ceil(5000/batch_size_train): + logging_interval_step = int(math.ceil(train_steps_per_epoch/MIN_LOGS_PER_TRAIN_EPOCH)) + else: + logging_interval_step = int(math.ceil(5000/batch_size_train)) + logging.info("During training. details will be logged after every %s steps (batches)", + logging_interval_step) + + # epoch value will be calculated for every batch size. To maintain unique epoch value between batches, + # it needs to be rounded to the required number of significant digits. + epoch_round = 0 # holds the required number of significant digits for round function. 
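+            # Illustrative example (not from the original code): with 5,000 training images and an
+            # effective logging batch of 512 images, the loop below stops after one iteration, so
+            # epoch_round = 1 and epoch values are logged as 0.1, 0.2, ...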
+ tmp_batchsize = batch_size_train*logging_interval_step + while tmp_batchsize <= train_model.dataloader.get_total(): + tmp_batchsize = tmp_batchsize * 10 + epoch_round += 1 + logging.info("While logging, epoch value will be rounded to %s significant digits", epoch_round) + + # Create the learning rate policy + total_training_steps = train_model.dataloader.num_epochs * train_model.dataloader.get_total() / \ + train_model.dataloader.batch_size + lrpolicy = lr_policy.LRPolicy(FLAGS.lr_policy, + FLAGS.lr_base_rate, + FLAGS.lr_gamma, + FLAGS.lr_power, + total_training_steps, + FLAGS.lr_stepvalues) + train_model.start_queue_runners(sess) + + # Training + logging.info('Started training the model') + + current_epoch = 0 + try: + step = 0 + step_last_log = 0 + print_vals_sum = 0 + while not train_model.queue_coord.should_stop(): + log_runtime = FLAGS.log_runtime_stats_per_step and (step % FLAGS.log_runtime_stats_per_step == 0) + + run_options = None + run_metadata = None + if log_runtime: + # For a HARDWARE_TRACE you need NVIDIA CUPTI, a 'CUDA-EXTRA' + # SOFTWARE_TRACE HARDWARE_TRACE FULL_TRACE + run_options = tf.RunOptions(trace_level=tf.RunOptions.FULL_TRACE) + run_metadata = tf.RunMetadata() + + feed_dict = {train_model.learning_rate: lrpolicy.get_learning_rate(step)} + + if False: + for op in train_model.train: + _, summary_str, step = sess.run([op, train_model.summary, train_model.global_step], + feed_dict=feed_dict, + options=run_options, + run_metadata=run_metadata) + else: + _, summary_str, step = sess.run([train_model.train, + train_model.summary, + train_model.global_step], + feed_dict=feed_dict, + options=run_options, + run_metadata=run_metadata) + + # HACK + step = step / len(train_model.train) + + # logging.info(sess.run(queue_size_op)) # DEVELOPMENT: for checking the queue size + + if log_runtime: + writer.add_run_metadata(run_metadata, str(step)) + save_timeline_trace(run_metadata, FLAGS.save, int(step)) + + writer.add_summary(summary_str, step) + + # Parse the summary + tags, print_vals = summary_to_lists(summary_str) + + print_vals_sum = print_vals + print_vals_sum + + # @TODO(tzaman): account for variable batch_size value on very last epoch + current_epoch = round((step * batch_size_train) / train_model.dataloader.get_total(), epoch_round) + + # Start with a forward pass + if ((step % logging_interval_step) == 0): + steps_since_log = step - step_last_log + print_list = print_summarylist(tags, print_vals_sum/steps_since_log) + logging.info("Training (epoch " + str(current_epoch) + "): " + print_list) + print_vals_sum = 0 + step_last_log = step + + # Potential Validation Pass + if FLAGS.validation_db and current_epoch >= next_validation: + Validation(sess, val_model, current_epoch) + # Find next nearest epoch value that exactly divisible by FLAGS.validation_interval: + next_validation = (round(float(current_epoch)/FLAGS.validation_interval) + 1) * \ + FLAGS.validation_interval + + # Saving Snapshot + if FLAGS.snapshotInterval > 0 and current_epoch >= next_snapshot_save: + save_snapshot(sess, saver, FLAGS.save, snapshot_prefix, current_epoch, FLAGS.serving_export) + + # To find next nearest epoch value that exactly divisible by FLAGS.snapshotInterval + next_snapshot_save = (round(float(current_epoch)/FLAGS.snapshotInterval) + 1) * \ + FLAGS.snapshotInterval + last_snapshot_save_epoch = current_epoch + writer.flush() + except tf.errors.OutOfRangeError: + logging.info('Done training for epochs: tf.errors.OutOfRangeError') + except ValueError as err: + logging.error(err.args[0]) + 
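+            # A ValueError here typically comes from summary_to_lists() detecting an Inf/NaN scalar,
+            # i.e. the model diverged.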
exit(-1) # DIGITS wants a dirty error. + except (KeyboardInterrupt): + logging.info('Interrupt signal received.') + + # If required, perform final snapshot save + if FLAGS.snapshotInterval > 0 and FLAGS.epoch > last_snapshot_save_epoch: + save_snapshot(sess, saver, FLAGS.save, snapshot_prefix, FLAGS.epoch, FLAGS.serving_export) + + print('Training wall-time:', time.time()-start) # @TODO(tzaman) - removeme + + # If required, perform final Validation pass + if FLAGS.validation_db and current_epoch >= next_validation: + Validation(sess, val_model, current_epoch) + + if FLAGS.train_db: + del train_model + if FLAGS.validation_db: + del val_model + if FLAGS.inference_db: + del inf_model + + # We need to call sess.close() because we've used a with block + sess.close() + + writer.close() + logging.info('END') + exit(0) + +if __name__ == '__main__': + + app = gandisplay.DemoApp(0, + grid_size=np.sqrt(FLAGS.batch_size)*64, + attributes=CELEBA_EDITABLE_ATTRIBUTES) + + t = threading.Thread(target=tf.app.run, args=()) + t.start() + + app.MainLoop() diff --git a/digits/tools/tensorflow/gandisplay.py b/digits/tools/tensorflow/gandisplay.py new file mode 100644 index 000000000..9f8d6d8df --- /dev/null +++ b/digits/tools/tensorflow/gandisplay.py @@ -0,0 +1,259 @@ +import wxversion + +import wx +import numpy as np +import random +import time + + +# This has been set up to optionally use the wx.BufferedDC if +# USE_BUFFERED_DC is True, it will be used. Otherwise, it uses the raw +# wx.Memory DC , etc. + +#USE_BUFFERED_DC = False +USE_BUFFERED_DC = True + +myEVT = wx.NewEventType() +DISPLAY_GRID_EVT = wx.PyEventBinder(myEVT, 1) + +class MyEvent(wx.PyCommandEvent): + """Event to signal that a count value is ready""" + def __init__(self, etype, eid, value=None): + """Creates the event object""" + wx.PyCommandEvent.__init__(self, etype, eid) + self._value = value + + def GetValue(self): + """Returns the value from the event. + @return: the value of this event + + """ + return self._value + +class BufferedWindow(wx.Window): + + """ + + A Buffered window class. + + To use it, subclass it and define a Draw(DC) method that takes a DC + to draw to. In that method, put the code needed to draw the picture + you want. The window will automatically be double buffered, and the + screen will be automatically updated when a Paint event is received. + + When the drawing needs to change, you app needs to call the + UpdateDrawing() method. Since the drawing is stored in a bitmap, you + can also save the drawing to file by calling the + SaveToFile(self, file_name, file_type) method. + + """ + def __init__(self, *args, **kwargs): + # make sure the NO_FULL_REPAINT_ON_RESIZE style flag is set. + kwargs['style'] = kwargs.setdefault('style', wx.NO_FULL_REPAINT_ON_RESIZE) | wx.NO_FULL_REPAINT_ON_RESIZE + wx.Window.__init__(self, *args, **kwargs) + + wx.EVT_PAINT(self, self.OnPaint) + wx.EVT_SIZE(self, self.OnSize) + + # OnSize called to make sure the buffer is initialized. + # This might result in OnSize getting called twice on some + # platforms at initialization, but little harm done. + self.OnSize(None) + self.paint_count = 0 + + def Draw(self, dc): + ## just here as a place holder. 
+ ## This method should be over-ridden when subclassed + pass + + + def OnPaint(self, event): + # All that is needed here is to draw the buffer to screen + if USE_BUFFERED_DC: + dc = wx.BufferedPaintDC(self, self._Buffer) + else: + dc = wx.PaintDC(self) + dc.DrawBitmap(self._Buffer, 0, 0) + + def OnSize(self,event): + # The Buffer init is done here, to make sure the buffer is always + # the same size as the Window + #Size = self.GetClientSizeTuple() + Size = self.ClientSize + + # Make new offscreen bitmap: this bitmap will always have the + # current drawing in it, so it can be used to save the image to + # a file, or whatever. + self._Buffer = wx.EmptyBitmap(*Size) + self.UpdateDrawing() + + def SaveToFile(self, FileName, FileType=wx.BITMAP_TYPE_PNG): + ## This will save the contents of the buffer + ## to the specified file. See the wxWindows docs for + ## wx.Bitmap::SaveFile for the details + self._Buffer.SaveFile(FileName, FileType) + + def UpdateDrawing(self): + """ + This would get called if the drawing needed to change, for whatever reason. + + The idea here is that the drawing is based on some data generated + elsewhere in the system. If that data changes, the drawing needs to + be updated. + + This code re-draws the buffer, then calls Update, which forces a paint event. + """ + dc = wx.MemoryDC() + dc.SelectObject(self._Buffer) + self.Draw(dc) + del dc # need to get rid of the MemoryDC before Update() is called. + self.Refresh() + self.Update() + +class DrawWindow(BufferedWindow): + def __init__(self, *args, **kwargs): + ## Any data the Draw() function needs must be initialized before + ## calling BufferedWindow.__init__, as it will call the Draw + ## function. + self.DrawData = {} + BufferedWindow.__init__(self, *args, **kwargs) + + def Draw(self, dc): + dc.SetBackground( wx.Brush("White") ) + dc.Clear() # make sure you clear the bitmap! + + # Here's the actual drawing code. 
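+        # DrawData supports two keys: 'text' (a status string drawn at the origin) and 'np'
+        # (an (N, H, W, C) array that is tiled into a sqrt(N) x sqrt(N) grid of images).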
+ for key, data in self.DrawData.items(): + if key == "text": + dc.DrawText(data, 0, 0) + elif key == "np": + data = data.astype('uint8') + img_count = data.shape[0] + height = data.shape[1] + width = data.shape[2] + channels = data.shape[3] + + grid_size = int(np.sqrt(img_count)) + + size = (grid_size * width, grid_size * height) + if True: # self.size != size: + self.size = size + self.SetSize(size) + + image = wx.EmptyImage(width,height) + for i in xrange(img_count): + x = width * (i // grid_size) + y = height * (i % grid_size) + s = data[i].tostring() + image.SetData(s) + wxBitmap = image.ConvertToBitmap() # + dc.DrawBitmap(wxBitmap, x=x, y=y) + + +class TestFrame(wx.Frame): + + SLIDER_WIDTH = 100 + SLIDER_BORDER = 50 + STATUS_HEIGHT = 20 + + def __init__(self, parent=None, grid_size=640, attributes=[]): + wx.Frame.__init__(self, parent, + size = (grid_size + self.SLIDER_WIDTH + self.SLIDER_BORDER, grid_size + self.STATUS_HEIGHT), + title="GAN Demo", + style=wx.DEFAULT_FRAME_STYLE ^ wx.RESIZE_BORDER) + + ## Set up the MenuBar + MenuBar = wx.MenuBar() + + file_menu = wx.Menu() + + item = file_menu.Append(wx.ID_EXIT, text="&Exit") + self.Bind(wx.EVT_MENU, self.OnQuit, item) + MenuBar.Append(file_menu, "&File") + + self.SetMenuBar(MenuBar) + + self.statusbar = self.CreateStatusBar() + self.statusbar.SetStatusText('Initialising...') + + # Set up UI elements + panel = wx.Panel(self) + self.Window = DrawWindow(panel, size=(grid_size, grid_size)) + + hbox = wx.BoxSizer(wx.HORIZONTAL) + hbox.Add(self.Window, 1, wx.ALIGN_LEFT) + + # Sliders + vbox = wx.BoxSizer(wx.VERTICAL) + self.speed_slider = wx.Slider(panel, -1, value=5, minValue=0, maxValue=10, pos=wx.DefaultPosition, size=(self.SLIDER_WIDTH, -1), + style=wx.SL_AUTOTICKS | wx.SL_HORIZONTAL | wx.SL_LABELS) + slider_text = wx.StaticText(panel, label='Speed') + vbox.Add(slider_text, 0, wx.ALIGN_CENTRE) + vbox.Add(self.speed_slider, 0, wx.ALIGN_CENTRE) + + self.attribute_sliders = [] + for attribute in attributes: + slider_text = wx.StaticText(panel, label=attribute) + slider = wx.Slider(panel, -1, value=0, minValue=-100, maxValue=100, pos=wx.DefaultPosition, size=(self.SLIDER_WIDTH, -1), + style=wx.SL_AUTOTICKS | wx.SL_HORIZONTAL | wx.SL_LABELS) + vbox.Add(slider_text, 0, wx.ALIGN_CENTRE) + vbox.Add(slider, 0, wx.ALIGN_CENTRE) + self.attribute_sliders.append(slider) + + hbox.Add(vbox, 0, wx.ALIGN_RIGHT) + panel.SetSizer(hbox) + + self.Window.DrawData = {'text': u'Initialising...'} + self.Window.UpdateDrawing() + + # to measure frames per second + self.last_frame_timestamp = None + self.last_fps_update = None + + # add panel to frame + frameSizer = wx.BoxSizer(wx.VERTICAL) + frameSizer.Add(panel, 0, wx.EXPAND | wx.ALIGN_LEFT) + self.SetSizer(frameSizer) + + self.Show() + + self.Fit() + + self.Bind(DISPLAY_GRID_EVT, self.OnDisplayCell) + + def OnQuit(self,event): + self.Close(True) + + def OnDisplayCell(self, evt): + array = evt.GetValue() + self.Window.DrawData = {'np': array} + self.Window.UpdateDrawing() + + if self.last_frame_timestamp is not None: + fps = 1. 
/ (time.time() - self.last_frame_timestamp) + if (self.last_fps_update is None) or (time.time() - self.last_fps_update > 0.5): + self.statusbar.SetStatusText('%.1ffps' % fps) + self.last_fps_update = time.time() + self.last_frame_timestamp = time.time() + +class DemoApp(wx.App): + + def __init__(self, arg, grid_size, attributes): + self.gan_grid_size = grid_size + self.attributes = attributes + super(DemoApp, self).__init__(arg) + + def OnInit(self): + self.frame = TestFrame(grid_size=self.gan_grid_size, attributes=self.attributes) + self.SetTopWindow(self.frame) + return True + + def DisplayCell(self, array): + evt = MyEvent(myEVT, -1, array) + wx.PostEvent(self.frame, evt) + + def GetSpeed(self): + return self.frame.speed_slider.GetValue() + + def GetAttributes(self): + return [s.GetValue() for s in self.frame.attribute_sliders] diff --git a/digits/tools/tensorflow/lr_policy.py b/digits/tools/tensorflow/lr_policy.py index 3619e4006..d8221c362 100644 --- a/digits/tools/tensorflow/lr_policy.py +++ b/digits/tools/tensorflow/lr_policy.py @@ -15,7 +15,10 @@ import logging import math -logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s',datefmt='%Y-%m-%d %H:%M:%S', level=logging.INFO) +logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s', + datefmt='%Y-%m-%d %H:%M:%S', + level=logging.INFO) + class LRPolicy(object): """This class contains details of learning rate policies that are used in caffe. @@ -59,9 +62,13 @@ def __init__(self, policy, base_rate, gamma, power, max_steps, step_values): if (self.max_steps < len(self.stepvalues_list)): self.policy = 'step' self.stepvalues_list[0] = 1 - logging.info("Maximum iterations (i.e., %s) is less than provided step values count (i.e, %s), so learning rate policy is reset to (%s) policy with the step value (%s).", self.max_steps, len(self.stepvalues_list), self.policy, self.stepvalues_list[0]) - else: - # Converting stepsize percentages into values + logging.info("Maximum iterations (i.e., %s) is less than provided step values count " + "(i.e, %s), so learning rate policy is reset to (%s) policy with the " + "step value (%s).", + self.max_steps, len(self.stepvalues_list), + self.policy, + self.stepvalues_list[0]) + else: # Converting stepsize percentages into values for i in range(len(self.stepvalues_list)): self.stepvalues_list[i] = round(self.max_steps * self.stepvalues_list[i] / 100) # Avoids 'nan' values during learning rate calculation @@ -70,10 +77,10 @@ def __init__(self, policy, base_rate, gamma, power, max_steps, step_values): if (self.policy == 'step') or (self.policy == 'sigmoid'): # If the policy is not multistep, then even though multiple step values - # are provided as input, we will consider only the first value. + # are provided as input, we will consider only the first value. 
self.step_size = self.stepvalues_list[0] elif (self.policy == 'multistep'): - self.current_step = 0 # This counter is important to take arbitary steps + self.current_step = 0 # This counter is important to take arbitary steps self.stepvalue_size = len(self.stepvalues_list) def get_learning_rate(self, step): @@ -84,7 +91,7 @@ def get_learning_rate(self, step): rate: the learning rate for the requested step """ rate = 0 - progress = 100 * (step / self.max_steps) # expressed in percent units + progress = 100 * (step / self.max_steps) # expressed in percent units if self.policy == "fixed": rate = self.base_rate @@ -98,11 +105,12 @@ def get_learning_rate(self, step): elif self.policy == "multistep": if ((self.current_step < self.stepvalue_size) and (step > self.stepvalues_list[self.current_step])): self.current_step = self.current_step + 1 - rate = self.base_rate * math.pow(self.gamma, self.current_step); + rate = self.base_rate * math.pow(self.gamma, self.current_step) elif self.policy == "poly": rate = self.base_rate * math.pow(1.0 - (step / self.max_steps), self.power) elif self.policy == "sigmoid": - rate = self.base_rate * (1.0 / (1.0 + math.exp(self.gamma * (progress - 100 * self.step_size / self.max_steps)))); + rate = self.base_rate * \ + (1.0 / (1.0 + math.exp(self.gamma * (progress - 100 * self.step_size / self.max_steps)))) else: logging.error("Unknown learning rate policy: %s", self.policy) exit(-1) diff --git a/digits/tools/tensorflow/main.py b/digits/tools/tensorflow/main.py index b07ff4b30..93f0a8e09 100644 --- a/digits/tools/tensorflow/main.py +++ b/digits/tools/tensorflow/main.py @@ -20,16 +20,17 @@ import time import datetime +import inspect import json import logging import math import numpy as np import os -from six.moves import xrange # pylint: disable=redefined-builtin +from six.moves import xrange # noqa import tensorflow as tf -import tensorflow.contrib.slim as slim # pylint: disable=unused-import -from tensorflow.python.client import timeline, device_lib -from tensorflow.python.ops import template +import tensorflow.contrib.slim as slim # noqa +from tensorflow.python.client import timeline, device_lib # noqa +from tensorflow.python.ops import template # noqa from tensorflow.python.lib.io import file_io from tensorflow.core.framework import summary_pb2 @@ -37,14 +38,18 @@ # Local imports import utils as digits import lr_policy -import model +from model import Model, Tower # noqa +from utils import model_property # noqa + import tf_data # Constants -TF_INTRA_OP_TRHEADS = 6 -MIN_LOGS_PER_TRAIN_EPOCH = 8 # torch default: 8 +TF_INTRA_OP_THREADS = 0 +TF_INTER_OP_THREADS = 0 +MIN_LOGS_PER_TRAIN_EPOCH = 8 # torch default: 8 -logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s',datefmt='%Y-%m-%d %H:%M:%S', +logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s', + datefmt='%Y-%m-%d %H:%M:%S', level=logging.INFO) FLAGS = tf.app.flags.FLAGS @@ -56,10 +61,10 @@ tf.app.flags.DEFINE_integer('epoch', 1, """Number of epochs to train, -1 for unbounded""") tf.app.flags.DEFINE_string('inference_db', '', """Directory with inference file source""") tf.app.flags.DEFINE_integer( - 'interval', 1, """Number of train epochs to complete, to perform one validation""") + 'validation_interval', 1, """Number of train epochs to complete, to perform one validation""") tf.app.flags.DEFINE_string('labels_list', '', """Text file listing label definitions""") tf.app.flags.DEFINE_string('mean', '', """Mean image file""") -tf.app.flags.DEFINE_float('momentum', '0.9', 
"""Momentum""") # Not used by DIGITS front-end +tf.app.flags.DEFINE_float('momentum', '0.9', """Momentum""") # Not used by DIGITS front-end tf.app.flags.DEFINE_string('network', '', """File containing network (model)""") tf.app.flags.DEFINE_string('networkDirectory', '', """Directory in which network exists""") tf.app.flags.DEFINE_string('optimization', 'sgd', """Optimization method""") @@ -88,7 +93,7 @@ tf.app.flags.DEFINE_string( 'weights', '', """Filename for weights of a model to use for fine-tuning""") - # @TODO(tzaman): is the bitdepth in line with the DIGITS team? +# @TODO(tzaman): is the bitdepth in line with the DIGITS team? tf.app.flags.DEFINE_integer('bitdepth', 8, """Specifies an image's bitdepth""") # @TODO(tzaman); remove torch mentions below @@ -138,6 +143,7 @@ tf.app.flags.DEFINE_float( 'augHSVv', 0., """The stddev of HSV's Value shift as pre-processing augmentation""") + def save_timeline_trace(run_metadata, save_dir, step): tl = timeline.Timeline(run_metadata.step_stats) ctf = tl.generate_chrome_trace_format(show_memory=True) @@ -146,6 +152,7 @@ def save_timeline_trace(run_metadata, save_dir, step): f.write(ctf) logging.info('Timeline trace written to %s', tl_fn) + def strip_data_from_graph_def(graph_def): strip_def = tf.GraphDef() for n0 in graph_def.node: @@ -153,13 +160,13 @@ def strip_data_from_graph_def(graph_def): n.MergeFrom(n0) if n.op == 'Const': tensor = n.attr['value'].tensor - size = max(len(tensor.tensor_content), len(tensor.string_val)) if (tensor.tensor_content): tensor.tensor_content = '' if (tensor.string_val): del tensor.string_val[:] return strip_def + def visualize_graph(graph_def, path): graph_def = strip_data_from_graph_def(graph_def) logging.info('Writing Graph Definition..') @@ -167,6 +174,24 @@ def visualize_graph(graph_def, path): logging.info('Graph Definition Written.') +def average_head_keys(tags, vals): + """ Averages keys with same end (head) name. + Example: foo1/bar=1 and foo2/bar=2 should collapse to bar=1.5 + """ + tail_tags = [w.split('/')[-1] for w in tags] + sums = {} + nums = {} + for a, b in zip(tail_tags, vals): + if a not in sums: + sums[a] = b + nums[a] = 1 + else: + sums[a] += b + nums[a] += 1 + tags_clean = sums.keys() + return tags_clean, np.asarray(sums.values())/np.asarray(nums.values()) + + def summary_to_lists(summary_str): """ Takes a Tensorflow stringified Summary object and returns only the scalar values to a list of tags and a list of values @@ -182,14 +207,17 @@ def summary_to_lists(summary_str): tags = [] vals = [] for s in summ.value: - if s.HasField('simple_value'):# and s.simple_value: # Only parse scalar_summaries - if s.simple_value == float('Inf'): - raise ValueError('Model diverged with %s = %s : Try decreasing your learning rate' % (s.tag, s.simple_value)) + if s.HasField('simple_value'): # and s.simple_value: # Only parse scalar_summaries + if s.simple_value == float('Inf') or np.isnan(s.simple_value): + raise ValueError('Model diverged with %s = %s : Try decreasing your learning rate' % + (s.tag, s.simple_value)) tags.append(s.tag) vals.append(s.simple_value) + tags, vals = average_head_keys(tags, vals) vals = np.asarray(vals) return tags, vals + def print_summarylist(tags, vals): """ Prints a nice one-line listing of tags and their values in a nice format that corresponds to how the DIGITS regex reads it. 
@@ -208,10 +236,12 @@ def print_summarylist(tags, vals): print_list = print_list + ", " return print_list + def dump(obj): for attr in dir(obj): print("obj.%s = %s" % (attr, getattr(obj, attr))) + def load_snapshot(sess, weight_path, var_candidates): """ Loads a snapshot into a session from a weight path. Will only load the weights that are both in the weight_path file and the passed var_candidates.""" @@ -224,8 +254,11 @@ def load_snapshot(sess, weight_path, var_candidates): for vt in var_candidates: for vm in var_map.keys(): if vt.name.split(':')[0] == vm: - vars_restore.append(vt) - logging.info('restoring %s -> %s' % (vm, vt.name)) + if ("global_step" not in vt.name) and not (vt.name.startswith("train/")): + vars_restore.append(vt) + logging.info('restoring %s -> %s' % (vm, vt.name)) + else: + logging.info('NOT restoring %s -> %s' % (vm, vt.name)) logging.info('Restoring %s variable ops.' % len(vars_restore)) tf.train.Saver(vars_restore, max_to_keep=0, sharded=FLAGS.serving_export).restore(sess, weight_path) @@ -237,7 +270,12 @@ def save_snapshot(sess, saver, save_dir, snapshot_prefix, epoch, for_serving=Fal Saves a snapshot of the current session, saving all variables previously defined in the ctor of the saver. Also saves the flow of the graph itself (only once). """ - snapshot_file = os.path.join(save_dir, snapshot_prefix + '_' + str(epoch) + '.ckpt') + number_dec = str(FLAGS.snapshotInterval-int(FLAGS.snapshotInterval))[2:] + if number_dec is '': + number_dec = '0' + epoch_fmt = "{:." + number_dec + "f}" + + snapshot_file = os.path.join(save_dir, snapshot_prefix + '_' + epoch_fmt.format(epoch) + '.ckpt') logging.info('Snapshotting to %s', snapshot_file) saver.save(sess, snapshot_file) @@ -255,7 +293,7 @@ def save_snapshot(sess, saver, save_dir, snapshot_prefix, epoch, for_serving=Fal logging.info('Saving graph to %s', filename_graph) f.write(sess.graph_def.SerializeToString()) logging.info('Saved graph to %s', filename_graph) - #meta_graph_def = tf.train.export_meta_graph(filename='?') + # meta_graph_def = tf.train.export_meta_graph(filename='?') def save_weight_visualization(w_names, a_names, w, a): @@ -269,7 +307,7 @@ def save_weight_visualization(w_names, a_names, w, a): db_layers = vis_db.create_group("layers") logging.info('Saving visualization to %s', fn) - for i in range(0,len(w)): + for i in range(0, len(w)): dset = db_layers.create_group(str(i)) dset.attrs['var'] = w_names[i].name dset.attrs['op'] = a_names[i] @@ -279,14 +317,16 @@ def save_weight_visualization(w_names, a_names, w, a): dset.create_dataset('activations', data=a[i]) vis_db.close() + def Inference(sess, model): """ Runs one inference (evaluation) epoch (all the files in the loader) """ - if FLAGS.labels_list: # Classification -> assume softmax usage + inference_op = model.towers[0].inference + if FLAGS.labels_list: # Classification -> assume softmax usage # Append a softmax op - model.inference = tf.nn.softmax(model.inference) + inference_op = tf.nn.softmax(inference_op) weight_vars = [] activation_ops = [] @@ -297,14 +337,17 @@ def Inference(sess, model): for tw in trainable_weights: tw_name_reader = tw.name.split(':')[0] + '/read' if tw_name_reader in n.input: - node_op_name = n.name + ':0' # @TODO(tzaman) this assumes exactly 1 output - allow to be dynamic! + node_op_name = n.name + ':0' # @TODO(tzaman) this assumes exactly 1 output - allow to be dynamic! 
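+                    # n consumes '<variable>/read', i.e. n is the op fed by this trainable weight;
+                    # its first output tensor is recorded as the activation to dump alongside the weight.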
weight_vars.append(tw) activation_ops.append(node_op_name) continue try: while not model.queue_coord.should_stop(): - keys, preds, [w], [a] = sess.run([model.dataloader.batch_k, model.inference, [weight_vars], [activation_ops]]) + keys, preds, [w], [a] = sess.run([model.dataloader.batch_k, + inference_op, + [weight_vars], + [activation_ops]]) if FLAGS.visualize_inf: save_weight_visualization(weight_vars, activation_ops, w, a) @@ -313,16 +356,18 @@ def Inference(sess, model): for i in range(len(keys)): # for j in range(len(preds)): # We're allowing multiple predictions per image here. DIGITS doesnt support that iirc - logging.info('Predictions for image ' + str(model.dataloader.get_key_index(keys[i])) + ': ' + json.dumps(preds[i].tolist())) + logging.info('Predictions for image ' + str(model.dataloader.get_key_index(keys[i])) + + ': ' + json.dumps(preds[i].tolist())) except tf.errors.OutOfRangeError: print('Done: tf.errors.OutOfRangeError') + def Validation(sess, model, current_epoch): """ Runs one validation epoch. """ - ## @TODO(tzaman): utilize the coordinator by resetting the queue after 1 epoch. + # @TODO(tzaman): utilize the coordinator by resetting the queue after 1 epoch. # see https://github.com/tensorflow/tensorflow/issues/4535#issuecomment-248990633 print_vals_sum = 0 @@ -349,13 +394,17 @@ def main(_): # Always keep the cpu as default with tf.Graph().as_default(), tf.device('/cpu:0'): + if FLAGS.validation_interval == 0: + FLAGS.validation_db = None + # Set Tensorboard log directory if FLAGS.summaries_dir: # The following gives a nice but unrobust timestamp FLAGS.summaries_dir = os.path.join(FLAGS.summaries_dir, datetime.datetime.now().strftime("%Y%m%d_%H%M%S")) if not FLAGS.train_db and not FLAGS.validation_db and not FLAGS.inference_db and not FLAGS.visualizeModelPath: - logging.error("At least one of the following file sources should be specified: train_db, validation_db or inference_db") + logging.error("At least one of the following file sources should be specified: " + "train_db, validation_db or inference_db") exit(-1) if FLAGS.seed: @@ -366,9 +415,8 @@ def main(_): logging.info("Train batch size is %s and validation batch size is %s", batch_size_train, batch_size_val) # This variable keeps track of next epoch, when to perform validation. - next_validation = FLAGS.interval + next_validation = FLAGS.validation_interval logging.info("Training epochs to be completed for each validation : %s", next_validation) - last_validation_epoch = 0 # This variable keeps track of next epoch, when to save model weights. 
next_snapshot_save = FLAGS.snapshotInterval @@ -392,7 +440,6 @@ def main(_): logging.info("Loading mean tensor from %s file", FLAGS.mean) mean_loader = tf_data.MeanLoader(FLAGS.mean, FLAGS.subtractMean, FLAGS.bitdepth) - classes = 0 nclasses = 0 if FLAGS.labels_list: @@ -406,73 +453,73 @@ def main(_): # Create a data-augmentation dict aug_dict = { - 'aug_flip' : FLAGS.augFlip, - 'aug_noise' : FLAGS.augNoise, - 'aug_contrast' : FLAGS.augContrast, - 'aug_whitening' : FLAGS.augWhitening, - 'aug_HSV' : { - 'h':FLAGS.augHSVh, - 's':FLAGS.augHSVs, - 'v':FLAGS.augHSVv, - }, - } - - input_shape = [] + 'aug_flip': FLAGS.augFlip, + 'aug_noise': FLAGS.augNoise, + 'aug_contrast': FLAGS.augContrast, + 'aug_whitening': FLAGS.augWhitening, + 'aug_HSV': { + 'h': FLAGS.augHSVh, + 's': FLAGS.augHSVs, + 'v': FLAGS.augHSVv, + }, + } # Import the network file path_network = os.path.join(os.path.dirname(os.path.realpath(__file__)), FLAGS.networkDirectory, FLAGS.network) exec(open(path_network).read(), globals()) + try: - build_model + UserModel except NameError: - logging.error("The user model build function 'build_model' is not defined.") + logging.error("The user model class 'UserModel' is not defined.") exit(-1) - - if not callable(build_model): - logging.error("The user model build function 'build_model' is not callable, it is of type (%s)", type(build_model)) + if not inspect.isclass(UserModel): # noqa + logging.error("The user model class 'UserModel' is not a class.") exit(-1) - - # Create the network template - network_template = template.make_template(digits.GraphKeys.TEMPLATE, build_model) + # @TODO(tzaman) - add mode checks to UserModel if FLAGS.train_db: - #with tf.name_scope(self.stage): #@TODO(tzaman) - implement me ! - train_model = model.Model(digits.STAGE_TRAIN, FLAGS.croplen, nclasses) - train_model.create_dataloader(FLAGS.train_db) - train_model.dataloader.setup(FLAGS.train_labels, FLAGS.shuffle, FLAGS.bitdepth, batch_size_train, FLAGS.epoch, FLAGS.seed) - train_model.dataloader.set_augmentation(mean_loader, aug_dict) - train_model.init_dataloader() - input_shape = train_model.dataloader.get_shape() - train_model.set_optimizer(FLAGS.optimization, FLAGS.momentum) - train_model.create_model_from_template(network_template) + with tf.name_scope(digits.STAGE_TRAIN) as stage_scope: + train_model = Model(digits.STAGE_TRAIN, FLAGS.croplen, nclasses, FLAGS.optimization, FLAGS.momentum) + train_model.create_dataloader(FLAGS.train_db) + train_model.dataloader.setup(FLAGS.train_labels, + FLAGS.shuffle, + FLAGS.bitdepth, + batch_size_train, + FLAGS.epoch, + FLAGS.seed) + train_model.dataloader.set_augmentation(mean_loader, aug_dict) + train_model.create_model(UserModel, stage_scope) # noqa if FLAGS.validation_db: - val_model = model.Model(digits.STAGE_VAL, FLAGS.croplen, nclasses) - val_model.create_dataloader(FLAGS.validation_db) - val_model.dataloader.setup(FLAGS.validation_labels, False, FLAGS.bitdepth, batch_size_val, 1e9, FLAGS.seed) # @TODO(tzaman): set numepochs to 1 - val_model.dataloader.set_augmentation(mean_loader) - val_model.init_dataloader() - if not input_shape: - input_shape = val_model.dataloader.get_shape() - val_model.create_model_from_template(network_template) + with tf.name_scope(digits.STAGE_VAL) as stage_scope: + val_model = Model(digits.STAGE_VAL, FLAGS.croplen, nclasses) + val_model.create_dataloader(FLAGS.validation_db) + val_model.dataloader.setup(FLAGS.validation_labels, + False, + FLAGS.bitdepth, + batch_size_val, + 1e9, + FLAGS.seed) # @TODO(tzaman): set numepochs to 1 + 
val_model.dataloader.set_augmentation(mean_loader) + val_model.create_model(UserModel, stage_scope) # noqa if FLAGS.inference_db: - inf_model = model.Model(digits.STAGE_INF, FLAGS.croplen, nclasses) - inf_model.create_dataloader(FLAGS.inference_db) - inf_model.dataloader.setup(None, False, FLAGS.bitdepth, FLAGS.batch_size, 1, FLAGS.seed) - inf_model.dataloader.set_augmentation(mean_loader) - inf_model.init_dataloader() - if not input_shape: - input_shape = inf_model.dataloader.get_shape() - inf_model.create_model_from_template(network_template) + with tf.name_scope(digits.STAGE_INF) as stage_scope: + inf_model = Model(digits.STAGE_INF, FLAGS.croplen, nclasses) + inf_model.create_dataloader(FLAGS.inference_db) + inf_model.dataloader.setup(None, False, FLAGS.bitdepth, FLAGS.batch_size, 1, FLAGS.seed) + inf_model.dataloader.set_augmentation(mean_loader) + inf_model.create_model(UserModel, stage_scope) # noqa # Start running operations on the Graph. allow_soft_placement must be set to # True to build towers on GPU, as some of the ops do not have GPU # implementations. sess = tf.Session(config=tf.ConfigProto( - allow_soft_placement=True, # will automatically do non-gpu supported ops on cpu - intra_op_parallelism_threads=TF_INTRA_OP_TRHEADS, - log_device_placement=FLAGS.log_device_placement)) + allow_soft_placement=True, # will automatically do non-gpu supported ops on cpu + inter_op_parallelism_threads=TF_INTER_OP_THREADS, + intra_op_parallelism_threads=TF_INTRA_OP_THREADS, + log_device_placement=FLAGS.log_device_placement)) if FLAGS.visualizeModelPath: visualize_graph(sess.graph_def, FLAGS.visualizeModelPath) @@ -480,7 +527,7 @@ def main(_): # Saver creation. if FLAGS.save_vars == 'all': - vars_to_save = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES) + vars_to_save = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES) elif FLAGS.save_vars == 'trainable': vars_to_save = tf.all_variables() else: @@ -489,12 +536,12 @@ def main(_): saver = tf.train.Saver(vars_to_save, max_to_keep=0, sharded=FLAGS.serving_export) # Initialize variables - init_op = tf.group(tf.initialize_all_variables(), tf.initialize_local_variables()) + init_op = tf.group(tf.global_variables_initializer(), tf.local_variables_initializer()) sess.run(init_op) # If weights option is set, preload weights from existing models appropriately if FLAGS.weights: - load_snapshot(sess, FLAGS.weights, tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES)) + load_snapshot(sess, FLAGS.weights, tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES)) # Tensorboard: Merge all the summaries and write them out writer = tf.train.SummaryWriter(os.path.join(FLAGS.summaries_dir, 'tb'), sess.graph) @@ -504,37 +551,49 @@ def main(_): inf_model.start_queue_runners(sess) Inference(sess, inf_model) - start = time.time() # @TODO(tzaman) - removeme + queue_size_op = [] + for n in tf.get_default_graph().as_graph_def().node: + if '_Size' in n.name: + queue_size_op.append(n.name+':0') + + start = time.time() # @TODO(tzaman) - removeme - ## Initial Forward Validation Pass + # Initial Forward Validation Pass if FLAGS.validation_db: val_model.start_queue_runners(sess) Validation(sess, val_model, 0) - if FLAGS.train_db: - # epoch value will be calculated for every batch size. To maintain unique epoch value between batches, it needs to be rounded to the required number of significant digits. - epoch_round = 0 # holds the required number of significant digits for round function. 
- tmp_batchsize = batch_size_train - while tmp_batchsize <= train_model.dataloader.get_total(): - tmp_batchsize = tmp_batchsize * 10 - epoch_round += 1 - logging.info("While logging, epoch value will be rounded to %s significant digits", epoch_round) - # During training, a log output should occur at least X times per epoch or every X images, whichever lower train_steps_per_epoch = train_model.dataloader.get_total() / batch_size_train if math.ceil(train_steps_per_epoch/MIN_LOGS_PER_TRAIN_EPOCH) < math.ceil(5000/batch_size_train): logging_interval_step = int(math.ceil(train_steps_per_epoch/MIN_LOGS_PER_TRAIN_EPOCH)) else: logging_interval_step = int(math.ceil(5000/batch_size_train)) - logging.info("During training. details will be logged after every %s steps (batches)", logging_interval_step) + logging.info("During training. details will be logged after every %s steps (batches)", + logging_interval_step) + + # epoch value will be calculated for every batch size. To maintain unique epoch value between batches, + # it needs to be rounded to the required number of significant digits. + epoch_round = 0 # holds the required number of significant digits for round function. + tmp_batchsize = batch_size_train*logging_interval_step + while tmp_batchsize <= train_model.dataloader.get_total(): + tmp_batchsize = tmp_batchsize * 10 + epoch_round += 1 + logging.info("While logging, epoch value will be rounded to %s significant digits", epoch_round) # Create the learning rate policy - total_training_steps = train_model.dataloader.num_epochs * train_model.dataloader.get_total() / train_model.dataloader.batch_size - lrpolicy = lr_policy.LRPolicy(FLAGS.lr_policy, FLAGS.lr_base_rate, FLAGS.lr_gamma, FLAGS.lr_power, total_training_steps, FLAGS.lr_stepvalues) + total_training_steps = train_model.dataloader.num_epochs * train_model.dataloader.get_total() / \ + train_model.dataloader.batch_size + lrpolicy = lr_policy.LRPolicy(FLAGS.lr_policy, + FLAGS.lr_base_rate, + FLAGS.lr_gamma, + FLAGS.lr_power, + total_training_steps, + FLAGS.lr_stepvalues) train_model.start_queue_runners(sess) - ## Training + # Training logging.info('Started training the model') current_epoch = 0 @@ -549,15 +608,30 @@ def main(_): run_metadata = None if log_runtime: # For a HARDWARE_TRACE you need NVIDIA CUPTI, a 'CUDA-EXTRA' - run_options = tf.RunOptions(trace_level=tf.RunOptions.FULL_TRACE) # SOFTWARE_TRACE HARDWARE_TRACE FULL_TRACE + # SOFTWARE_TRACE HARDWARE_TRACE FULL_TRACE + run_options = tf.RunOptions(trace_level=tf.RunOptions.FULL_TRACE) run_metadata = tf.RunMetadata() feed_dict = {train_model.learning_rate: lrpolicy.get_learning_rate(step)} - _, summary_str, step = sess.run([train_model.train, train_model.summary, train_model.global_step], - feed_dict=feed_dict, - options=run_options, - run_metadata=run_metadata) + if False: + for op in train_model.train: + _, summary_str, step = sess.run([op, train_model.summary, train_model.global_step], + feed_dict=feed_dict, + options=run_options, + run_metadata=run_metadata) + else: + _, summary_str, step = sess.run([train_model.train, + train_model.summary, + train_model.global_step], + feed_dict=feed_dict, + options=run_options, + run_metadata=run_metadata) + + # HACK + step = step / len(train_model.train) + + # logging.info(sess.run(queue_size_op)) # DEVELOPMENT: for checking the queue size if log_runtime: writer.add_run_metadata(run_metadata, str(step)) @@ -570,11 +644,11 @@ def main(_): print_vals_sum = print_vals + print_vals_sum - # @TODO(tzaman): account for variable batch_size value on 
last epoch + # @TODO(tzaman): account for variable batch_size value on very last epoch current_epoch = round((step * batch_size_train) / train_model.dataloader.get_total(), epoch_round) # Start with a forward pass - if (step == 1) or ((step % logging_interval_step) == 0): + if ((step % logging_interval_step) == 0): steps_since_log = step - step_last_log print_list = print_summarylist(tags, print_vals_sum/steps_since_log) logging.info("Training (epoch " + str(current_epoch) + "): " + print_list) @@ -584,32 +658,32 @@ def main(_): # Potential Validation Pass if FLAGS.validation_db and current_epoch >= next_validation: Validation(sess, val_model, current_epoch) - # Find next nearest epoch value that exactly divisible by FLAGS.interval: - next_validation = (round(float(current_epoch)/FLAGS.interval) + 1) * FLAGS.interval - last_validation_epoch = current_epoch + # Find next nearest epoch value that exactly divisible by FLAGS.validation_interval: + next_validation = (round(float(current_epoch)/FLAGS.validation_interval) + 1) * \ + FLAGS.validation_interval # Saving Snapshot if FLAGS.snapshotInterval > 0 and current_epoch >= next_snapshot_save: - writer.add_summary(summary_str, step) save_snapshot(sess, saver, FLAGS.save, snapshot_prefix, current_epoch, FLAGS.serving_export) # To find next nearest epoch value that exactly divisible by FLAGS.snapshotInterval - next_snapshot_save = (round(float(current_epoch)/FLAGS.snapshotInterval) + 1) * FLAGS.snapshotInterval + next_snapshot_save = (round(float(current_epoch)/FLAGS.snapshotInterval) + 1) * \ + FLAGS.snapshotInterval last_snapshot_save_epoch = current_epoch writer.flush() except tf.errors.OutOfRangeError: logging.info('Done training for epochs: tf.errors.OutOfRangeError') except ValueError as err: logging.error(err.args[0]) - exit(-1) # DIGITS wants a dirty error. + exit(-1) # DIGITS wants a dirty error. except (KeyboardInterrupt): logging.info('Interrupt signal received.') - # If required, perform final snapshot save + # If required, perform final snapshot save if FLAGS.snapshotInterval > 0 and FLAGS.epoch > last_snapshot_save_epoch: save_snapshot(sess, saver, FLAGS.save, snapshot_prefix, FLAGS.epoch, FLAGS.serving_export) - print('Training wall-time:', time.time()-start) # @TODO(tzaman) - removeme + print('Training wall-time:', time.time()-start) # @TODO(tzaman) - removeme # If required, perform final Validation pass if FLAGS.validation_db and current_epoch >= next_validation: diff --git a/digits/tools/tensorflow/model.py b/digits/tools/tensorflow/model.py index 16343bed8..ed9ac3bb2 100644 --- a/digits/tools/tensorflow/model.py +++ b/digits/tools/tensorflow/model.py @@ -4,7 +4,7 @@ # Linter: pylint """ -Interface for setting up a model in Tensorflow. +Interface for setting up and creating a model in Tensorflow. 
""" @@ -12,286 +12,297 @@ from __future__ import division from __future__ import print_function -import functools import logging import tensorflow as tf +from tensorflow.python.framework import ops # Local imports import tf_data import utils as digits +from utils import model_property -logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s',datefmt='%Y-%m-%d %H:%M:%S', +logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s', + datefmt='%Y-%m-%d %H:%M:%S', level=logging.INFO) # Constants -OUTPUT_HISTOGRAM_SUMMARIES = False # Very heavy for the CPU - -def lazy_property(function): - # From https://danijar.com/structuring-your-tensorflow-models/ - attribute = '_cache_' + function.__name__ - @property - @functools.wraps(function) - def decorator(self): - if not hasattr(self, attribute): - setattr(self, attribute, function(self)) - return getattr(self, attribute) - return decorator - -# -- from https://github.com/tensorflow/tensorflow/blob/master/tensorflow/models/image/cifar10/cifar10_multi_gpu_train.py +SUMMARIZE_TOWER_STATS = False + + +# from +# https://github.com/tensorflow/tensorflow/blob/master/tensorflow/models/image/cifar10/cifar10_multi_gpu_train.py def average_gradients(tower_grads): - """Calculate the average gradient for each shared variable across all towers. - Note that this function provides a synchronization point across all towers. - Args: - tower_grads: List of lists of (gradient, variable) tuples. The outer list - is over individual gradients. The inner list is over the gradient - calculation for each tower. - Returns: - List of pairs of (gradient, variable) where the gradient has been averaged - across all towers. - """ - average_grads = [] - for grad_and_vars in zip(*tower_grads): - # Note that each grad_and_vars looks like the following: - # ((grad0_gpu0, var0_gpu0), ... , (grad0_gpuN, var0_gpuN)) - grads = [] - for g, _ in grad_and_vars: - # Add 0 dimension to the gradients to represent the tower. - expanded_g = tf.expand_dims(g, 0) - - # Append on a 'tower' dimension which we will average over below. - grads.append(expanded_g) - - # Average over the 'tower' dimension. - grad = tf.concat(0, grads) - grad = tf.reduce_mean(grad, 0) - - # Keep in mind that the Variables are redundant because they are shared - # across towers. So .. we will just return the first tower's pointer to - # the Variable. - v = grad_and_vars[0][1] - grad_and_var = (grad, v) - average_grads.append(grad_and_var) - return average_grads + """Calculate the average gradient for each shared variable across all towers. + Note that this function provides a synchronization point across all towers. + Args: + tower_grads: List of lists of (gradient, variable) tuples. The outer list + is over individual gradients. The inner list is over the gradient + calculation for each tower. + Returns: + List of pairs of (gradient, variable) where the gradient has been averaged + across all towers. + """ + with tf.name_scope('gradient_average'): + average_grads = [] + for grad_and_vars in zip(*tower_grads): + # Note that each grad_and_vars looks like the following: + # ((grad0_gpu0, var0_gpu0), ... , (grad0_gpuN, var0_gpuN)) + grads = [] + for g, _ in grad_and_vars: + # Add 0 dimension to the gradients to represent the tower. + expanded_g = tf.expand_dims(g, 0) + # Append on a 'tower' dimension which we will average over below. + grads.append(expanded_g) + # Average over the 'tower' dimension. 
+ grad = tf.concat(0, grads) + grad = tf.reduce_mean(grad, 0) + # Keep in mind that the Variables are redundant because they are shared + # across towers. So .. we will just return the first tower's pointer to + # the Variable. + v = grad_and_vars[0][1] + grad_and_var = (grad, v) + average_grads.append(grad_and_var) + return average_grads + class Model(object): """ @TODO(tzaman) - """ - def __init__(self, stage, croplen, nclasses): + def __init__(self, stage, croplen, nclasses, optimization=None, momentum=None): self.stage = stage self.croplen = croplen self.nclasses = nclasses self.dataloader = None - self.optimization = None - self.momentum = None - self.queue_coord = None self.queue_threads = None - self._summaries = [] - self.inference = None - self.network_loss = None - - # Define graph keys in tf convention - self.GraphKeys = {} - self.GraphKeys['QUEUE_RUNNERS'] = "queue_runner_" + self.stage - self.GraphKeys['MODEL'] = "model_" + self.stage - self.GraphKeys['LOSS'] = "loss_" + self.stage # The name-scope - self.GraphKeys['LOSSES'] = "losses" + self.stage # The collection - self.GraphKeys['LOADER'] = "data_" + self.stage + self._optimization = optimization + self._momentum = momentum + self.summaries = [] + self.towers = [] + self._train = None - # Special exception for summaries, as they need to be accesible to the user model - # in a tf compliant way - if self.stage == digits.STAGE_TRAIN: - self.GraphKeys['SUMMARIES'] = digits.GraphKeys.SUMMARIES_TRAIN - elif self.stage == digits.STAGE_VAL: - self.GraphKeys['SUMMARIES'] = digits.GraphKeys.SUMMARIES_VAL - elif self.stage == digits.STAGE_INF: - self.GraphKeys['SUMMARIES'] = digits.GraphKeys.SUMMARIES_INF + # Touch to initialize + if optimization: + self.learning_rate + self.global_step + self.optimizer def create_dataloader(self, db_path): - self.dataloader = tf_data.LoaderFactory.set_source(db_path) - self.dataloader.summaries = self._summaries + self.dataloader = tf_data.LoaderFactory.set_source(db_path, is_inference=(self.stage == digits.STAGE_INF)) + # @TODO(tzaman) communicate the dataloader summaries to our Model summary list self.dataloader.stage = self.stage self.dataloader.croplen = self.croplen self.dataloader.nclasses = self.nclasses def init_dataloader(self): with tf.device('/cpu:0'): - with tf.name_scope(self.GraphKeys['LOADER']): + with tf.name_scope(digits.GraphKeys.LOADER): self.dataloader.create_input_pipeline() - def set_optimizer(self, optimization, momentum): - self.optimization = optimization - self.momentum = momentum - # touch and initialize the optimizer and global_step - self.global_step + def create_model(self, obj_UserModel, stage_scope, batch_x=None): - def create_model_from_template(self, network_template): + if batch_x is None: + self.init_dataloader() + batch_x = self.dataloader.batch_x + if self.stage != digits.STAGE_INF: + batch_y = self.dataloader.batch_y + else: + assert self.stage == digits.STAGE_INF + batch_x = batch_x available_devices = digits.get_available_gpus() if not available_devices: available_devices.append('/cpu:0') - # Split the batch over the batch dimension over the number of available gpu's - batch_x_split = tf.split(0, len(available_devices), self.dataloader.batch_x, name='split_batch') + # available_devices = ['/gpu:0', '/gpu:1'] # DEVELOPMENT : virtual multi-gpu - if self.stage != digits.STAGE_INF: - # Inference never has labels - batch_y_split = tf.split(0, len(available_devices), self.dataloader.batch_y, name='split_batch') + # Split the batch over the batch dimension over the 
number of available gpu's + if len(available_devices) == 1: + batch_x_split = [batch_x] + if self.stage != digits.STAGE_INF: # Has no labels + batch_y_split = [batch_y] + else: + with tf.name_scope('parallelize'): + # Split them up + batch_x_split = tf.split(0, len(available_devices), batch_x, name='split_batch') + if self.stage != digits.STAGE_INF: # Has no labels + batch_y_split = tf.split(0, len(available_devices), batch_y, name='split_batch') # Run the user model through the build_model function that should be filled in grad_towers = [] - for gpu_id, gpu_device in enumerate(available_devices): - with tf.device(gpu_device): - with tf.name_scope('tower_%d' % gpu_id) as scope_tower: - with tf.name_scope(self.GraphKeys['MODEL']): - # Load the parameters to be passed to the custom user network definition - model_params = { - 'x' : batch_x_split[gpu_id], - 'input_shape' : self.dataloader.get_shape(), - 'nclasses' : self.nclasses, - 'is_training' : self.stage == digits.STAGE_TRAIN, - } - - user_network = network_template(model_params) - - # Perform checks - if not user_network.has_key('model'): - logging.error("Model definition required in model file but not supplied.") - exit(-1) - else: # Key exists, check type - if 'tensorflow' not in str(type(user_network['model'])): - logging.error("Model definition required in model is not a tf operation type, but is type(%s)", type(user_network['model'])) - exit(-1) - - if not user_network.has_key('loss'): - logging.error("Loss function definition required in model file but not supplied.") - exit(-1) - else: # Key exists, check if callable - if not callable(user_network['loss']): - logging.error("Returned loss function should be a function, but is type(%s).", type(user_network['loss'])) - exit(-1) - - self.inference = user_network['model'] + for dev_i, dev_name in enumerate(available_devices): + with tf.device(dev_name): + current_scope = stage_scope if len(available_devices) == 1 else ('tower_%d' % dev_i) + with tf.name_scope(current_scope) as scope_tower: + + if self.stage != digits.STAGE_INF: + tower_model = self.add_tower(obj_tower=obj_UserModel, + x=batch_x_split[dev_i], + y=batch_y_split[dev_i]) + else: + tower_model = self.add_tower(obj_tower=obj_UserModel, + x=batch_x_split[dev_i], + y=None) + + with tf.variable_scope(digits.GraphKeys.MODEL, reuse=dev_i > 0): + tower_model.inference # touch to initialize if self.stage == digits.STAGE_INF: # For inferencing we will only use the inference part of the graph - continue; - - with tf.name_scope(self.GraphKeys['LOSS']): - - loss_op = user_network['loss'](batch_y_split[gpu_id]) + continue - tf.add_to_collection(self.GraphKeys['LOSSES'], loss_op) - #loss_op = tf.add_n(tf.get_collection(self.GraphKeys['LOSSES']), name='total_loss') - #tf.add_to_collection('losses', loss_op) + with tf.name_scope(digits.GraphKeys.LOSS): + for loss in self.get_tower_losses(tower_model): + tf.add_to_collection(digits.GraphKeys.LOSSES, loss['loss']) - # Assemble all made within this scope so far (f.e. including potential L2-loss from user model) - total_tower_loss =tf.add_n(tf.get_collection(self.GraphKeys['LOSSES'], scope_tower), name='total_tower_loss') - - if len(available_devices) > 1: - self._summaries.append(tf.scalar_summary('loss_t_%d' % gpu_id, total_tower_loss)) + # Assemble all made within this scope so far. 
The user can add custom + # losses to the digits.GraphKeys.LOSSES collection + losses = tf.get_collection(digits.GraphKeys.LOSSES, scope=scope_tower) + losses += ops.get_collection(ops.GraphKeys.REGULARIZATION_LOSSES, scope=None) + tower_loss = tf.add_n(losses, name='loss') + self.summaries.append(tf.scalar_summary(tower_loss.op.name, tower_loss)) # Reuse the variables in this scope for the next tower/device tf.get_variable_scope().reuse_variables() if self.stage == digits.STAGE_TRAIN: - grad_tower = self.optimizer.compute_gradients(total_tower_loss) - grad_towers.append(grad_tower) - - if self.stage != digits.STAGE_INF: - with tf.name_scope(self.GraphKeys['MODEL']): - self._summaries.append(tf.scalar_summary('loss', tf.add_n(tf.get_collection(self.GraphKeys['LOSSES']))/len(available_devices))) + grad_tower_losses = [] + for loss in self.get_tower_losses(tower_model): + grad_tower_loss = self.optimizer.compute_gradients(loss['loss'], loss['vars']) + grad_tower_loss = tower_model.gradientUpdate(grad_tower_loss) + grad_tower_losses.append(grad_tower_loss) + grad_towers.append(grad_tower_losses) # Assemble and average the gradients from all towers if self.stage == digits.STAGE_TRAIN: - if len(grad_towers) == 1: - grad_avg = grad_towers[0] + n_gpus = len(available_devices) + if n_gpus == 1: + grad_averages = grad_towers[0] else: - grad_avg = average_gradients(grad_towers) - apply_gradient_op = self.optimizer.apply_gradients(grad_avg, global_step=self.global_step) - self.train = apply_gradient_op + with tf.device(available_devices[0]): + n_losses = len(grad_towers[0]) + grad_averages = [] + for loss in xrange(n_losses): + grad_averages.append(average_gradients([grad_towers[gpu][loss] for gpu in xrange(n_gpus)])) + apply_gradient_ops = [] + for grad_avg in grad_averages: + apply_gradient_ops.append(self.optimizer.apply_gradients(grad_avg, global_step=self.global_step)) + self._train = apply_gradient_ops + + def start_queue_runners(self, sess): + logging.info('Starting queue runners (%s)', self.stage) + # Distinguish the queue runner collection (for easily obtaining them by collection key) + queue_runners = tf.get_collection(tf.GraphKeys.QUEUE_RUNNERS, scope=self.stage+'.*') + for qr in queue_runners: + if self.stage in qr.name: + tf.add_to_collection(digits.GraphKeys.QUEUE_RUNNERS, qr) + + self.queue_coord = tf.train.Coordinator() + self.queue_threads = tf.train.start_queue_runners(sess=sess, coord=self.queue_coord, + collection=digits.GraphKeys.QUEUE_RUNNERS) + logging.info('Queue runners started (%s)', self.stage) + + def __del__(self): + # Destructor + if self.queue_coord: + # Close and terminate the queues + self.queue_coord.request_stop() + self.queue_coord.join(self.queue_threads) + + def add_tower(self, obj_tower, x, y): + is_training = self.stage == digits.STAGE_TRAIN + is_inference = self.stage == digits.STAGE_INF + input_shape = self.dataloader.get_shape() + tower = obj_tower(x, y, input_shape, self.nclasses, is_training, is_inference) + self.towers.append(tower) + return tower + + @model_property + def train(self): + return self._train - @lazy_property + @model_property def summary(self): """ Merge train summaries """ + for t in self.towers: + self.summaries += t.summaries - # The below get_collection() commands retrieve any summaries that have been set by the user - # in the model - self._summaries += tf.get_collection(self.GraphKeys['SUMMARIES'], - scope='.*'+self.GraphKeys['MODEL']) - self._summaries += tf.get_collection(self.GraphKeys['SUMMARIES'], - 
scope='.*'+self.GraphKeys['LOSS']) - - if not len(self._summaries): + if not len(self.summaries): logging.error("No summaries defined. Please define at least one summary.") exit(-1) - return tf.merge_summary(self._summaries) + return tf.merge_summary(self.summaries) - @lazy_property + @model_property def global_step(self): # Force global_step on the CPU, becaues the GPU's first step will end at 0 instead of 1. with tf.device('/cpu:0'): return tf.get_variable('global_step', [], initializer=tf.constant_initializer(0), trainable=False) - @lazy_property + @model_property def learning_rate(self): # @TODO(tzaman): the learning rate is a function of the global step, so we could # define it entirely in tf ops, instead of a placeholder and feeding. with tf.device('/cpu:0'): lr = tf.placeholder(tf.float32, shape=[], name='learning_rate') - self._summaries.append(tf.scalar_summary('lr', lr)) + self.summaries.append(tf.scalar_summary('lr', lr)) return lr - @lazy_property + @model_property def optimizer(self): - logging.info("Optimizer:%s", self.optimization) - if self.optimization == 'sgd': + logging.info("Optimizer:%s", self._optimization) + if self._optimization == 'sgd': return tf.train.GradientDescentOptimizer(learning_rate=self.learning_rate) - elif self.optimization == 'adadelta': + elif self._optimization == 'adadelta': return tf.train.AdadeltaOptimizer(learning_rate=self.learning_rate) - elif self.optimization == 'adagrad': + elif self._optimization == 'adagrad': return tf.train.AdagradOptimizer(learning_rate=self.learning_rate) - elif self.optimization == 'adagradda': + elif self._optimization == 'adagradda': return tf.train.AdagradDAOptimizer(learning_rate=self.learning_rate, global_step=self.global_step) - elif self.optimization == 'momentum': + elif self._optimization == 'momentum': return tf.train.MomentumOptimizer(learning_rate=self.learning_rate, - momentum=self.momentum) - elif self.optimization == 'adam': + momentum=self._momentum) + elif self._optimization == 'adam': return tf.train.AdamOptimizer(learning_rate=self.learning_rate) - elif self.optimization == 'ftrl': + elif self._optimization == 'ftrl': return tf.train.FtrlOptimizer(learning_rate=self.learning_rate) - elif self.optimization == 'rmsprop': + elif self._optimization == 'rmsprop': return tf.train.RMSPropOptimizer(learning_rate=self.learning_rate, - momentum=self.momentum) + momentum=self._momentum) else: - logging.error("Invalid optimization flag %s", self.optimization) + logging.error("Invalid optimization flag %s", self._optimization) exit(-1) - def start_queue_runners(self, sess): - logging.info('Starting queue runners (%s)', self.stage) - # Distinguish the queue runner collection (for easily obtaining them by collection key) - queue_runners = tf.get_collection(tf.GraphKeys.QUEUE_RUNNERS) - for qr in queue_runners: - if self.stage in qr.name: - tf.add_to_collection(self.GraphKeys['QUEUE_RUNNERS'], qr) + def get_tower_losses(self, tower): + """ + Return list of losses - self.queue_coord = tf.train.Coordinator() - self.queue_threads = tf.train.start_queue_runners(sess=sess, coord=self.queue_coord, - collection=self.GraphKeys['QUEUE_RUNNERS'] - ) - logging.info('Queue runners started (%s)', self.stage) + If user-defined model returns only one loss then this is encapsulated into the expected list of + dicts structure + """ + if isinstance(tower.loss, list): + return tower.loss + else: + return [{'loss': tower.loss, 'vars': tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES)}] - def __del__(self): - # Destructor - if 
self.queue_coord: - # Close and terminate the queues - self.queue_coord.request_stop() - self.queue_coord.join(self.queue_threads) + +class Tower(object): + + def __init__(self, x, y, input_shape, nclasses, is_training, is_inference): + self.input_shape = input_shape + self.nclasses = nclasses + self.is_training = is_training + self.is_inference = is_inference + self.summaries = [] + self.x = x + self.y = y + self.train = None + + def gradientUpdate(self, grad): + return grad diff --git a/digits/tools/tensorflow/tf_data.py b/digits/tools/tensorflow/tf_data.py index 5e15cd4cb..a2071bd62 100644 --- a/digits/tools/tensorflow/tf_data.py +++ b/digits/tools/tensorflow/tf_data.py @@ -20,7 +20,6 @@ import math import numpy as np import os -import sys import tensorflow as tf # Local imports @@ -29,24 +28,26 @@ # Constants MIN_FRACTION_OF_EXAMPLES_IN_QUEUE = 0.4 -MAX_ABSOLUTE_EXAMPLES_IN_QUEUE = 4096 # The queue size cannot exceed this number +MAX_ABSOLUTE_EXAMPLES_IN_QUEUE = 4096 # The queue size cannot exceed this number NUM_THREADS_DATA_LOADER = 6 -LOG_MEAN_FILE = False # Logs the mean file as loaded in TF to TB +LOG_MEAN_FILE = False # Logs the mean file as loaded in TF to TB # Supported extensions for Loaders DB_EXTENSIONS = { 'hdf5': ['.H5', '.HDF5'], 'lmdb': ['.MDB', '.LMDB'], - 'tfrecords' :['.TFRECORDS'], + 'tfrecords': ['.TFRECORDS'], 'filelist': ['.TXT'], 'file': ['.JPG', '.JPEG', '.PNG'], + 'gangrid': ['.GAN'], } -LIST_DELIMITER = ' ' # For the FILELIST format +LIST_DELIMITER = ' ' # For the FILELIST format -logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s',datefmt='%Y-%m-%d %H:%M:%S', +logging.basicConfig(format='%(asctime)s [%(levelname)s] %(message)s', datefmt='%Y-%m-%d %H:%M:%S', level=logging.INFO) + def get_backend_of_source(db_path): """ Takes a path as argument and infers the format of the data. @@ -65,7 +66,7 @@ def get_backend_of_source(db_path): files_in_path = [db_path] # Keep the below priority ordering - for db_fmt in ['hdf5', 'lmdb', 'tfrecords', 'filelist', 'file']: + for db_fmt in ['hdf5', 'lmdb', 'tfrecords', 'filelist', 'file', 'gangrid']: ext_list = DB_EXTENSIONS[db_fmt] for ext in ext_list: if any(ext in os.path.splitext(fn)[1].upper() for fn in files_in_path): @@ -74,6 +75,7 @@ def get_backend_of_source(db_path): logging.error("Cannot infer backend from db_path (%s)." % (db_path)) exit(-1) + class MeanLoader(object): """ Loads in a mean file for tensorflow. This is done through using a constant @@ -105,19 +107,20 @@ def load_mean(self): data = np.array(blob.data, dtype="float32").reshape(blob.channels, blob.height, blob.width) if blob.channels == 3: # converting from BGR to RGB - data = data[[2,1,0],...] # channel swap + data = data[[2, 1, 0], ...] 
# channel swap # convert to (height, width, channels) - data = data.transpose((1,2,0)) + data = data.transpose((1, 2, 0)) elif blob.channels == 1: # convert to (height, width) data = data[0] else: - logging.error('Unknown amount of channels (%d) in mean file (%s)' % (blob.channels, self._mean_file_path)) + logging.error('Unknown amount of channels (%d) in mean file (%s)' % + (blob.channels, self._mean_file_path)) exit(-1) - elif file_extension in IMG_FILE_EXT: - img = Image.open(self._mean_file_path) - img.load() - data = np.asarray(img, dtype="float32") + # elif file_extension in IMG_FILE_EXT: + # img = Image.open(self._mean_file_path) + # img.load() + # data = np.asarray(img, dtype="float32") else: logging.error('Failed loading mean file: Unsupported extension (%s)' % (file_extension)) exit(-1) @@ -130,11 +133,7 @@ def load_mean(self): # Explicitly add channel dim data = data[:, :, None] - # Normalize to [0:1] - if self._bitdepth == 16: - data = data / 65535 - else: - data = data / 255 + # return data in original pixel scale self.tf_mean_image = tf.constant(data, name='Const_Mean_Image') else: @@ -169,7 +168,7 @@ def __init__(self): self.batch_k = None self.stage = None self._seed = None - self.unencoded_data_format = 'whc' + self.unencoded_data_format = 'hwc' self.unencoded_channel_scheme = 'rgb' self.summaries = None self.aug_dict = {} @@ -178,7 +177,7 @@ def __init__(self): pass @staticmethod - def set_source(db_path): + def set_source(db_path, is_inference=False): """ Returns the correct backend. """ @@ -192,11 +191,14 @@ def set_source(db_path): loader = FileListLoader() elif backend == 'tfrecords': loader = TFRecordsLoader() + elif backend == 'gangrid': + loader = GanGridLoader() else: logging.error("Backend (%s) not implemented" % (backend)) exit(-1) loader.backend = backend loader.db_path = db_path + loader.is_inference = is_inference return loader def setup(self, labels_db_path, shuffle, bitdepth, batch_size, num_epochs=None, seed=None): @@ -240,7 +242,7 @@ def get_total(self): return self.total def reshape_decode(self, data, shape): - if self.float_data: #@TODO(tzaman): this is LMDB specific - Make generic! + if self.float_data: # @TODO(tzaman): this is LMDB specific - Make generic! 
data = tf.reshape(data, shape) data = digits.chw_to_hwc(data) else: @@ -255,20 +257,22 @@ def reshape_decode(self, data, shape): logging.error('Unsupported mime type (%s); cannot be decoded' % (self.data_mime)) exit(-1) else: - data = tf.decode_raw(data, self.image_dtype, name='raw_decoder') + if self.backend == 'lmdb': + data = tf.decode_raw(data, self.image_dtype, name='raw_decoder') # if data is in CHW, set the shape and convert to HWC if self.unencoded_data_format == 'chw': - data = tf.reshape(data, [shape[2],shape[0],shape[1]]) + data = tf.reshape(data, [shape[0], shape[1], shape[2]]) data = digits.chw_to_hwc(data) - else: #'hwc' + else: # 'hwc' data = tf.reshape(data, shape) if (self.channels == 3) and self.unencoded_channel_scheme == 'bgr': data = digits.bgr_to_rgb(data) # Convert to float - data = tf.image.convert_image_dtype(data, tf.float32) # Converts to [0:1) range + data = tf.to_float(data) + # data = tf.image.convert_image_dtype(data, tf.float32) # normalize to [0:1) range return data def create_input_pipeline(self): @@ -290,24 +294,25 @@ def create_input_pipeline(self): # @TODO(tzaman) the container can be used if the reset function is implemented: # see https://github.com/tensorflow/tensorflow/issues/4535#issuecomment-248990633 # - #with tf.container('queue-container'): + # with tf.container('queue-container'): key_queue = self.get_queue() single_label = None single_label_shape = None if self.stage == digits.STAGE_INF: - single_key, single_data, single_data_shape = self.get_single_data(key_queue) + single_key, single_data, single_data_shape, _, _ = self.get_single_data(key_queue) else: - single_key, single_data, single_data_shape, single_label, single_label_shape = self.get_single_data(key_queue) + single_key, single_data, single_data_shape, single_label, single_label_shape = \ + self.get_single_data(key_queue) - single_data_shape = tf.reshape(single_data_shape, [3]) # Shape the shape to have three dimensions + single_data_shape = tf.reshape(single_data_shape, [3]) # Shape the shape to have three dimensions single_data = self.reshape_decode(single_data, single_data_shape) - if self.labels_db_path: # Using a seperate label db; label can be anything + if self.labels_db_path: # Using a seperate label db; label can be anything single_label_shape = tf.reshape(single_label_shape, [3]) # Shape the shape single_label = self.labels_db.reshape_decode(single_label, single_label_shape) - elif single_label is not None: # Not using a seperate label db; label is a scalar + elif single_label is not None: # Not using a seperate label db; label is a scalar single_label = tf.reshape(single_label, []) # Mean Subtraction @@ -315,42 +320,57 @@ def create_input_pipeline(self): with tf.name_scope('mean_subtraction'): single_data = self.mean_loader.subtract_mean_op(single_data) if LOG_MEAN_FILE: - self.summaries.append(tf.image_summary('mean_image', tf.expand_dims(self.mean_loader.tf_mean_image, 0), max_images=1)) + self.summaries.append(tf.image_summary('mean_image', + tf.expand_dims(self.mean_loader.tf_mean_image, 0), + max_images=1)) # (Random) Cropping if self.croplen: with tf.name_scope('cropping'): if self.stage == digits.STAGE_TRAIN: - single_data = tf.random_crop(single_data, [self.croplen, self.croplen, self.channels], seed=self._seed) - else : # Validation or Inference + single_data = tf.random_crop(single_data, + [self.croplen, self.croplen, self.channels], + seed=self._seed) + else: # Validation or Inference single_data = tf.image.resize_image_with_crop_or_pad(single_data, self.croplen, 
self.croplen) # Data Augmentation if self.aug_dict: with tf.name_scope('augmentation'): flipflag = self.aug_dict['aug_flip'] - if flipflag == 'fliplr' or flipflag == 'fliplrud': + if flipflag == 'fliplr' or flipflag == 'fliplrud': single_data = tf.image.random_flip_left_right(single_data, seed=self._seed) - if flipflag == 'flipud' or flipflag == 'fliplrud': + if flipflag == 'flipud' or flipflag == 'fliplrud': single_data = tf.image.random_flip_up_down(single_data, seed=self._seed) noise_std = self.aug_dict['aug_noise'] if noise_std > 0.: # Note the tf.random_normal requires a static shape - single_data = tf.add(single_data, tf.random_normal(self.get_shape(), mean=0.0, stddev=noise_std, dtype=tf.float32, seed=self._seed, name='AWGN')) + single_data = tf.add(single_data, tf.random_normal(self.get_shape(), + mean=0.0, + stddev=noise_std, + dtype=tf.float32, + seed=self._seed, + name='AWGN')) contrast_fact = self.aug_dict['aug_contrast'] if contrast_fact > 0: - single_data = tf.image.random_contrast(single_data, lower=1.-contrast_fact, upper=1.+contrast_fact, seed=self._seed) + single_data = tf.image.random_contrast(single_data, + lower=1.-contrast_fact, + upper=1.+contrast_fact, + seed=self._seed) # @TODO(tzaman): rewrite the below HSV stuff entirely in a TF PR to be done in one single operation aug_hsv = self.aug_dict['aug_HSV'] if aug_hsv['h'] > 0.: single_data = tf.image.random_hue(single_data, aug_hsv['h'], seed=self._seed) if aug_hsv['s'] > 0.: - single_data = tf.image.random_saturation(single_data, 1-aug_hsv['s'], 1+aug_hsv['s'], seed=self._seed) + single_data = tf.image.random_saturation(single_data, + 1 - aug_hsv['s'], + 1 + aug_hsv['s'], + seed=self._seed) if aug_hsv['v'] > 0.: - # closely resembles V - temporary until rewritten + # closely resembles V - temporary until rewritten single_data = tf.image.random_brightness(single_data, aug_hsv['v'], seed=self._seed) # @TODO(tzaman) whitening is so invasive that we need a way to add it to the val/inf too in a @@ -359,9 +379,10 @@ def create_input_pipeline(self): if aug_whitening: # Subtract off its own mean and divide by the standard deviation of its own the pixels. with tf.name_scope('whitening'): - single_data = tf.image.per_image_whitening(single_data) # N.B. also converts to float + single_data = tf.image.per_image_standardization(single_data) # N.B. 
also converts to float - max_queue_capacity = min(math.ceil(self.total * MIN_FRACTION_OF_EXAMPLES_IN_QUEUE), MAX_ABSOLUTE_EXAMPLES_IN_QUEUE) + max_queue_capacity = min(math.ceil(self.total * MIN_FRACTION_OF_EXAMPLES_IN_QUEUE), + MAX_ABSOLUTE_EXAMPLES_IN_QUEUE) single_batch = [single_key, single_data] if single_label is not None: @@ -369,34 +390,33 @@ def create_input_pipeline(self): if self.backend == 'tfrecords' and self.shuffle: batch = tf.train.shuffle_batch( - single_batch, - batch_size=self.batch_size, - num_threads=NUM_THREADS_DATA_LOADER, - capacity=10*self.batch_size, # Max amount that will be loaded and queued - shapes=[[0], self.get_shape(), []], # Only makes sense is dynamic_pad=False #@TODO(tzaman) - FIXME - min_after_dequeue=5*self.batch_size, - allow_smaller_final_batch=True, # Happens if total%batch_size!=0 - name='batcher' - ) + single_batch, + batch_size=self.batch_size, + num_threads=NUM_THREADS_DATA_LOADER, + capacity=10*self.batch_size, # Max amount that will be loaded and queued + shapes=[[0], self.get_shape(), []], # Only makes sense is dynamic_pad=False #@TODO(tzaman) - FIXME + min_after_dequeue=5*self.batch_size, + allow_smaller_final_batch=True, # Happens if total%batch_size!=0 + name='batcher' + ) else: batch = tf.train.batch( - single_batch, - batch_size=self.batch_size, - dynamic_pad=True, # Allows us to not supply fixed shape a priori - enqueue_many=False, # Each tensor is a single example - #shapes=[[],[28,28,1],[]], # Only makes sense is dynamic_pad=False - num_threads=NUM_THREADS_DATA_LOADER, - capacity=max_queue_capacity, # Max amount that will be loaded and queued - allow_smaller_final_batch=True, # Happens if total%batch_size!=0 - name='batcher', - ) - - self.batch_k = batch[0] # Key - self.batch_x = batch[1] # Input + single_batch, + batch_size=self.batch_size, + dynamic_pad=True, # Allows us to not supply fixed shape a priori + enqueue_many=False, # Each tensor is a single example + # set number of threads to 1 for tfrecords (used for inference) + num_threads=NUM_THREADS_DATA_LOADER if not self.is_inference else 1, + capacity=max_queue_capacity, # Max amount that will be loaded and queued + allow_smaller_final_batch=True, # Happens if total%batch_size!=0 + name='batcher', + ) + + self.batch_k = batch[0] # Key + self.batch_x = batch[1] # Input if len(batch) == 3: # There's a label (unlike during inferencing) - self.batch_y = batch[2] # Output (label) - + self.batch_y = batch[2] # Output (label) class LmdbLoader(LoaderFactory): @@ -447,13 +467,13 @@ def initialize(self): def get_queue(self): return tf.train.string_input_producer( - self.keys, - num_epochs=self.num_epochs, - capacity=self.total, - shuffle=self.shuffle, - seed=self._seed, - name='input_producer' - ) + self.keys, + num_epochs=self.num_epochs, + capacity=self.total, + shuffle=self.shuffle, + seed=self._seed, + name='input_producer' + ) def get_tf_data_type(self): """Returns the type of the data, in tf format. 
@@ -495,7 +515,7 @@ def get_data_and_shape(lmdb_txn, key): data = np.asarray(datum.float_data, dtype='float32') else: data = datum.data - label = np.asarray([datum.label], dtype=np.int64) # scalar label + label = np.asarray([datum.label], dtype=np.int64) # scalar label return data, shape, label def get_data_op(key): @@ -525,7 +545,7 @@ def get_single_data(self, key_queue): Returns: key, single_data, single_data_shape, single_label, single_label_shape """ - key = key_queue.dequeue() #Operation that dequeues one key and returns a string with the key + key = key_queue.dequeue() # Operation that dequeues one key and returns a string with the key py_func_return_type = [self.get_tf_data_type(), tf.int32, self.get_tf_label_type(), tf.int32] d, ds, l, ls = tf.py_func(self.generate_data_op(), [key], py_func_return_type, name='data_reader') return key, d, ds, l, ls @@ -533,6 +553,7 @@ def get_single_data(self, key_queue): def __del__(self): self.lmdb_env.close() + class FileListLoader(LoaderFactory): """ The FileListLoader loads files from a list of string(s) pointing to (a) file(s). These files are then retrieved by their string and loaded according to their extension. @@ -560,7 +581,7 @@ def initialize(self): if len(self.keys) > 0: # Assume the first entry in the line is a pointer to the file path first_file_path = self.keys[0] - else : + else: logging.error('Filelist (%s) contains no lines.' % (self.db_path)) exit(-1) else: @@ -572,7 +593,7 @@ def initialize(self): # Check first file for statistics im = Image.open(first_file_path) self.width, self.height = im.size - self.channels = 1 if im.mode == 'L' else 3 # @TODO(tzaman): allow more channels + self.channels = 1 if im.mode == 'L' else 3 # @TODO(tzaman): allow more channels self.data_mime = magic.from_file(first_file_path, mime=True) @@ -588,13 +609,13 @@ def initialize(self): def get_queue(self): return tf.train.string_input_producer( - self.keys, - num_epochs=self.num_epochs, - capacity=self.total, - shuffle=self.shuffle, - seed=self._seed, - name='input_producer' - ) + self.keys, + num_epochs=self.num_epochs, + capacity=self.total, + shuffle=self.shuffle, + seed=self._seed, + name='input_producer' + ) def get_single_data(self, key_queue): """ @@ -602,8 +623,9 @@ def get_single_data(self, key_queue): key, single_data, single_data_shape, single_label, single_label_shape """ key, value = self.reader.read(key_queue) - shape = np.array([self.width, self.height, self.channels], dtype=np.int32) # @TODO: this is not dynamic - return key, value, shape # @TODO(tzaman) - Note: will only work for inferencing stage! + shape = np.array([self.width, self.height, self.channels], dtype=np.int32) # @TODO: this is not dynamic + return key, value, shape # @TODO(tzaman) - Note: will only work for inferencing stage! + class TFRecordsLoader(LoaderFactory): """ The TFRecordsLoader connects directly into the tensorflow graph. @@ -613,8 +635,7 @@ def __init__(self): pass def initialize(self): - self.float_data = False # For now only strings - self.keys = None # Not using keys + self.float_data = False # For now only strings self.unencoded_data_format = 'hwc' self.unencoded_channel_scheme = 'rgb' self.reader = None @@ -625,21 +646,24 @@ def initialize(self): # Count all the records @TODO(tzaman): account for shards! # Loop the records in path @TODO(tzaman) get this from a txt? 
- #self.db_path += '/test.tfrecords' # @TODO(tzaman) this is a hack + # self.db_path += '/test.tfrecords' # @TODO(tzaman) this is a hack self.shard_paths = [] - list_db_files = self.db_path + '/list.txt' + list_db_files = os.path.join(self.db_path, 'list.txt') self.total = 0 - with open(list_db_files) as f: - for line in f: - # Account for the relative path format in list.txt - shard_path = self.db_path + '/' + os.path.basename(line.strip()) - record_iter = tf.python_io.tf_record_iterator(shard_path) - for r in record_iter: - self.total += 1 - if not self.total: - raise ValueError('Database or shard contains no records (%s)' % (self.db_path)) - self.shard_paths.append(shard_path) + if os.path.exists(list_db_files): + files = [os.path.join(self.db_path, f) for f in open(list_db_files, 'r').read().splitlines()] + else: + files = [self.db_path] + for shard_path in files: + # Account for the relative path format in list.txt + record_iter = tf.python_io.tf_record_iterator(shard_path) + for r in record_iter: + self.total += 1 + if not self.total: + raise ValueError('Database or shard contains no records (%s)' % (self.db_path)) + self.shard_paths.append(shard_path) + self.keys = ['%s:0' % p for p in self.shard_paths] # Use last record read to extract some preliminary data that is sometimes needed or useful example_proto = tf.train.Example() @@ -675,25 +699,22 @@ def get_single_data(self, key_queue): key, single_data, single_data_shape, single_label, single_label_shape """ - _, serialized_example = self.reader.read(key_queue) + key, serialized_example = self.reader.read(key_queue) features = tf.parse_single_example( serialized_example, # Defaults are not specified since both keys are required. features={ - 'image_raw': tf.FixedLenFeature([], tf.string), + 'image_raw': tf.FixedLenFeature([self.height, self.width, self.channels], tf.float32), 'label': tf.FixedLenFeature([], tf.int64), }) - key = np.array([], dtype=np.int32) # @TODO: this is not dynamic d = features['image_raw'] - ds = np.array([self.width, self.height, self.channels], dtype=np.int32) # @TODO: this is not dynamic - l = features['label']#l = tf.cast(features['label'], tf.int32) - ls = np.array([], dtype=np.int32) # @TODO: this is not dynamic + ds = np.array([self.height, self.width, self.channels], dtype=np.int32) # @TODO: this is not dynamic + l = features['label'] # l = tf.cast(features['label'], tf.int32) + ls = np.array([], dtype=np.int32) # @TODO: this is not dynamic return key, d, ds, l, ls - - class Hdf5Loader(LoaderFactory): def __init__(self): @@ -707,8 +728,8 @@ def initialize(self): exit(-1) self.data_encoded = False - self.float_data = True # Always stored as float32 - self.keys = None # Not using keys + self.float_data = True # Always stored as float32 + self.keys = None # Not using keys self.h5dbs = [] self.h5dbs_endrange = [] @@ -729,7 +750,7 @@ def initialize(self): def check_hdf5_db(self, db): # Make sure we have data and labels in the db - if not "data" in db or not "label" in db: + if "data" not in db or "label" not in db: logging.error("The HDF5 loader requires both a 'data' and 'label' group in the HDF5 root.") exit(-1) @@ -743,13 +764,13 @@ def check_hdf5_db(self, db): def get_queue(self): return tf.train.range_input_producer( - self.total, - num_epochs=self.num_epochs, - capacity=self.total, - shuffle=self.shuffle, - seed=self._seed, - name='input_producer' - ) + self.total, + num_epochs=self.num_epochs, + capacity=self.total, + shuffle=self.shuffle, + seed=self._seed, + name='input_producer' + ) def 
get_tf_data_type(self): """Returns the type of the data, in tf format. @@ -781,14 +802,12 @@ def get_data_and_shape(self, sample_key): if sample_key < end_range: key_within_db = sample_key-prev_end_range data = self.h5dbs[i]['data'][key_within_db] - # Convert from CHW to HWC - data = data.transpose((1, 2, 0)).astype(np.float32)/255. shape = np.asarray(data.shape, dtype=np.int32) label = self.h5dbs[i]['label'][key_within_db].astype(np.int64) return data, shape, label prev_end_range = end_range - logging.error("Out of range") # @TODO(tzaman) out of range error + logging.error("Out of range") # @TODO(tzaman) out of range error exit(-1) def generate_data_op(self): @@ -821,11 +840,56 @@ def get_single_data(self, key_queue): Returns: key, single_data, single_data_shape, single_label, single_label_shape """ - key = key_queue.dequeue() #Operation that dequeues one key and returns a string with the key + key = key_queue.dequeue() # Operation that dequeues one key and returns a string with the key py_func_return_type = [self.get_tf_data_type(), tf.int32, self.get_tf_label_type(), tf.int32] d, ds, l, ls = tf.py_func(self.generate_data_op(), [key], py_func_return_type, name='data_reader') return key, d, ds, l, ls def __del__(self): for db in self.h5dbs: - db.close() \ No newline at end of file + db.close() + +class GanGridLoader(LoaderFactory): + """ + The GanGridLoader generates data for a GAN. + """ + def __init__(self): + pass + + def initialize(self): + self.float_data = False # For now only strings + self.keys = None # Not using keys + self.unencoded_data_format = 'hwc' + self.unencoded_channel_scheme = 'rgb' + self.reader = None + self.image_dtype = tf.float32 + + self.channels = 1 + self.height = 1 + self.width = 100 + self.data_encoded = False + + self.total = 100000 + + def get_queue(self): + return tf.train.range_input_producer( + self.total, + num_epochs=self.num_epochs, + capacity=self.total, + shuffle=self.shuffle, + seed=self._seed, + name='input_producer' + ) + + def get_single_data(self, key_queue): + """ + Returns: + key, single_data, single_data_shape, single_label, single_label_shape + """ + + key = tf.to_int32(key_queue.dequeue()) # Operation that dequeues an index + + d = key + ds = np.array([1, 1, 1], dtype=np.int32) + + return key, d, ds, None, None diff --git a/digits/tools/tensorflow/utils.py b/digits/tools/tensorflow/utils.py index 4062c8d97..495a755d0 100644 --- a/digits/tools/tensorflow/utils.py +++ b/digits/tools/tensorflow/utils.py @@ -10,23 +10,26 @@ import functools import tensorflow as tf -from tensorflow.python.client import timeline, device_lib +from tensorflow.python.client import device_lib STAGE_TRAIN = 'train' STAGE_VAL = 'val' STAGE_INF = 'inf' + class GraphKeys(object): TEMPLATE = "model" QUEUE_RUNNERS = "queue_runner" MODEL = "model" - LOSS = "loss" # The namescope - LOSSES = "losses" # The collection + LOSS = "loss" # The namescope + LOSSES = "losses" # The collection LOADER = "data" + def model_property(function): # From https://danijar.com/structuring-your-tensorflow-models/ attribute = '_cache_' + function.__name__ + @property @functools.wraps(function) def decorator(self): @@ -35,6 +38,7 @@ def decorator(self): return getattr(self, attribute) return decorator + def classification_loss(pred, y): """ Definition of the loss for regular classification @@ -42,20 +46,25 @@ def classification_loss(pred, y): ssoftmax = tf.nn.sparse_softmax_cross_entropy_with_logits(pred, y, name='cross_entropy_single') return tf.reduce_mean(ssoftmax, name='cross_entropy_batch') + 
def mse_loss(lhs, rhs): return tf.reduce_mean(tf.square(lhs - rhs)) + def constrastive_loss(lhs, rhs, y, margin=1.0): - """ Contrastive loss confirming to the Caffe definition """ - d = tf.reduce_sum(tf.square(tf.sub(lhs,rhs)), 1) + Contrastive loss confirming to the Caffe definition + """ + d = tf.reduce_sum(tf.square(tf.sub(lhs, rhs)), 1) d_sqrt = tf.sqrt(1e-6 + d) loss = (y * d) + ((1 - y) * tf.square(tf.maximum(margin - d_sqrt, 0))) - return tf.reduce_mean(loss) # Note: constant component removed (/2) + return tf.reduce_mean(loss) # Note: constant component removed (/2) + def classification_accuracy_top_n(pred, y, top_n): single_acc_t = tf.nn.in_top_k(pred, y, top_n) - return tf.reduce_mean(tf.cast(single_acc_t, tf.float32), name='accuracy_top_%d'%top_n) + return tf.reduce_mean(tf.cast(single_acc_t, tf.float32), name='accuracy_top_%d' % top_n) + def classification_accuracy(pred, y): """ @@ -65,28 +74,31 @@ def classification_accuracy(pred, y): single_acc = tf.equal(y, tf.argmax(pred, 1)) return tf.reduce_mean(tf.cast(single_acc, tf.float32), name='accuracy') + def nhwc_to_nchw(x): - #x = tf.reshape(x, [1, 3, 4, 2]) return tf.transpose(x, [0, 3, 1, 2]) + def hwc_to_chw(x): - #x = tf.reshape(x, [2, 3, 1]) return tf.transpose(x, [2, 0, 1]) + def nchw_to_nhwc(x): - #x = tf.reshape(x, [1, 2, 3, 4]) return tf.transpose(x, [0, 2, 3, 1]) + def chw_to_hwc(x): - #x = tf.reshape(x, [1, 2, 3]) return tf.transpose(x, [1, 2, 0]) + def bgr_to_rgb(x): return tf.reverse(x, [False, False, True]) + def rgb_to_bgr(x): return tf.reverse(x, [False, False, True]) + def get_available_gpus(): """ Queries the CUDA GPU devices visible to Tensorflow. diff --git a/digits/tools/torch/test.lua b/digits/tools/torch/test.lua index a8a652ae0..5a36a9b32 100644 --- a/digits/tools/torch/test.lua +++ b/digits/tools/torch/test.lua @@ -341,6 +341,7 @@ else inputs[j] = inputs[1] -- replicate the first image in entire inputs tensor end end + counter = 1 -- here counter is set, so that predictBatch() method displays only the predictions of first image predictBatch(inputs, model) if opt.visualization=='yes' then local filename = paths.concat(opt.save, 'vis.h5') diff --git a/digits/utils/__init__.py b/digits/utils/__init__.py index 9a2140360..b5db0d9e5 100644 --- a/digits/utils/__init__.py +++ b/digits/utils/__init__.py @@ -25,7 +25,7 @@ def is_url(url): def wait_time(): """Wait a random number of seconds""" - return uniform(0.3, 0.5) + return uniform(0.05, 0.1) # From http://code.activestate.com/recipes/578900-non-blocking-readlines/ diff --git a/digits/utils/forms.py b/digits/utils/forms.py index b94aae547..002eb2e1b 100644 --- a/digits/utils/forms.py +++ b/digits/utils/forms.py @@ -27,10 +27,8 @@ def _validator(form, field): if all_conditions_met: # Verify that data exists if field.data is None \ - or (isinstance(field.data, (str, unicode)) - and not field.data.strip()) \ - or (isinstance(field.data, FileStorage) - and not field.data.filename.strip()): + or (isinstance(field.data, (str, unicode)) and not field.data.strip()) \ + or (isinstance(field.data, FileStorage) and not field.data.filename.strip()): raise validators.ValidationError('This field is required.') else: # This field is not required, ignore other errors @@ -52,11 +50,9 @@ def _validator(form, field): other_field_value = getattr(form, other_field).data if other_field_value: # Verify that data exists - if field.data is None \ - or (isinstance(field.data, (str, unicode)) - and not field.data.strip()) \ - or (isinstance(field.data, FileStorage) - and not 
field.data.filename.strip()): + if field.data is None or \ + (isinstance(field.data, (str, unicode)) and not field.data.strip()) \ + or (isinstance(field.data, FileStorage) and not field.data.filename.strip()): raise validators.ValidationError('This field is required if %s is set.' % other_field) else: # This field is not required, ignore other errors diff --git a/digits/utils/lmdbreader.py b/digits/utils/lmdbreader.py index 70ce5c4ba..550a54b85 100644 --- a/digits/utils/lmdbreader.py +++ b/digits/utils/lmdbreader.py @@ -23,6 +23,8 @@ def __init__(self, location): with self._db.begin() as txn: self.total_entries = txn.stat()['entries'] + self.txn = self._db.begin() + def entries(self): """ Generator returning all entries in the DB @@ -31,3 +33,7 @@ def entries(self): cursor = txn.cursor() for item in cursor: yield item + + def entry(self, key): + """Return single entry""" + return self.txn.get(key) diff --git a/digits/views.py b/digits/views.py index b147b5ab4..44854d614 100644 --- a/digits/views.py +++ b/digits/views.py @@ -634,7 +634,6 @@ def handle_error(e): details['trace'] = trace.split('\n') return flask.jsonify({'error': details}), status_code else: - escape_message = True message = message.replace('\\n', '
<br />')
         if isinstance(e, digits.frameworks.errors.NetworkVisualizationError):
             trace = message
diff --git a/examples/gan/README.md b/examples/gan/README.md
new file mode 100644
index 000000000..e2f4bfdfa
--- /dev/null
+++ b/examples/gan/README.md
@@ -0,0 +1,373 @@
+# Using DIGITS to train a Generative Adversarial Network
+
+Table of Contents
+=================
+* [Introduction](#introduction)
+* [Preliminary installation steps](#preliminary-installation-steps)
+* [Handwritten digits](#handwritten-digits)
+  * [Creating the dataset](#creating-the-dataset)
+  * [Training the model](#training-the-model)
+  * [Sampling the model](#sampling-the-model)
+  * [Training an encoder](#training-an-encoder)
+* [Celebrity faces](#celebrity-faces)
+  * [Downloading the CelebA dataset](#downloading-the-celeba-dataset)
+  * [Creating the CelebA dataset](#creating-the-celeba-dataset)
+  * [Training the CelebA model](#training-the-celeba-model)
+  * [Training a CelebA encoder](#training-a-celeba-encoder)
+  * [Generating attribute vectors](#generating-attribute-vectors)
+  * [Sampling the CelebA model](#sampling-the-celeba-model)
+    * [Setting image attributes](#setting-image-attributes)
+    * [Analogy grid](#analogy-grid)
+  * [Embeddings visualization](#embeddings-visualization)
+
+**Disclaimer:**
+This walk-through makes use of experimental features in DIGITS.
+Please do not report issues on the main DIGITS fork.
+
+## Introduction
+
+Generative Adversarial Networks (GAN) were introduced by Ian Goodfellow in [Generative Adversarial Networks](https://arxiv.org/abs/1406.2661), Goodfellow, 2014.
+GANs learn a data probability distribution through unsupervised learning.
+In practice, a GAN learns to draw samples from the dataset's probability distribution in order to generate data.
+To this end, a GAN comprises two pieces: a Generator that generates data and a Discriminator that learns to discriminate between "real" data (from the dataset) and "fake" data (those that were generated).
+A latent representation of the data is learnt by way of a feature vector called `z`.
+Through a number of fully-connected and transpose convolutional layers, the generator learns to generate images from `z`.
+During training, `z` is sampled from a random distribution.
+During inference, `z` may be specified to generate images with carefully chosen attributes.
+
+The typical training loop comprises the following phases:
+- optimize the discriminator on real samples (make it classify them as such),
+- draw `z` from a random distribution and have the generator create the corresponding image,
+- optimize the discriminator on generated samples (make it classify them as such),
+- optimize the generator (make it fool the discriminator).
+
+Other papers of interest:
+- [Unsupervised Representation Learning with Deep Convolutional Generative Adversarial Networks](https://arxiv.org/abs/1511.06434), Radford, 2015.
+- [Sampling Generative Networks](https://arxiv.org/abs/1609.04468), White, 2016.
+
+## Preliminary installation steps
+
+You will need a version of DIGITS that includes this document.
+
+Tensorflow may be installed as follows (refer to the Tensorflow homepage for more up-to-date install instructions):
+
+```sh
+$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow_gpu-0.12.1-cp27-none-linux_x86_64.whl
+$ pip install --upgrade $TF_BINARY_URL
+```
+
+If you haven't done so already, install the top-level DIGITS module:
+```sh
+$ pip install -e $DIGITS_ROOT
+```
+
+The GAN data and visualization plugins for DIGITS may be installed by doing:
+```sh
+$ pip install -e $DIGITS_ROOT/plugins/data/gan/
+$ pip install -e $DIGITS_ROOT/plugins/view/gan/
+```
+
+## Handwritten digits
+
+Here we will use the MNIST dataset. You don't need labels to train a GAN; however, if you do have labels, as is the case for MNIST, you can use them to train a **conditional** GAAN.
+In this example, we will condition our GAN on the class labels.
+Conditioning a GAN in this way is useful because it allows us to dissociate classes from the other learnable features that define the "style" of images.
+In practice, in our network we will concatenate a one-hot representation of the labels to the activations of every layer in both the generator and the discriminator.
+
+### Creating the dataset
+
+If you already followed the [GettingStarted](../../docs/GettingStarted.md) example, you should already have a classification dataset for MNIST.
+We will reuse the LMDB files that were created for the MNIST classification dataset to create a new generic dataset.
+Creating a generic dataset is required here because GANs do not fall into the category of classification datasets and require specific plug-ins.
+
+Open the classification dataset page and make a note of the job directory of your MNIST classification dataset:
+
+![mnist classification dataset](mnist-classification-dataset.png)
+
+On the home page, click `New Dataset>Images>Other`.
+Then specify the path to the training images LMDB and the path to the mean image protobuf file:
+
+![create generic MNIST](create-mnist-generic-dataset.png)
+
+Give your dataset a name and click `Create`.
+
+### Training the model
+
+On the home page, click `New Model>Images>Other`.
+- select your dataset,
+- set the number of epochs to 60,
+- set mean subtraction to `None`,
+- select the `ADAM` solver,
+- set the learning rate to `2e-4`,
+- use only 1 GPU for this model.
+
+In the `custom network` tab, select `Tensorflow` and copy-paste this [network definition](./network-mnist.py).
+
+You can click `Visualize` to browse the model graph (this only works in Chrome):
+
+![mnist graph](mnist-graph.png)
+
+Name your model `GAN-MNIST` and click `Create`.
+
+> Note: when training a neural network it is typical to expect the loss to go down and to see in this an indication that the model is learning well.
+This is not the case in a typical GAN.
+If the loss of the discriminator is very low, this means that the generator is not doing a good job at fooling the discriminator.
+Conversely, if the loss of the generator is too low, this means the discriminator is not doing a good job at detecting fake samples.
+In a balanced set-up, equilibrium is reached when the generator can fool the discriminator in 50% of cases.
+From the definition of the cross-entropy loss this corresponds to a loss value of `-math.log(0.5)=0.69`.
+
+![mnist loss](mnist-loss.png)
+
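+As a quick sanity check of that equilibrium value (a back-of-the-envelope calculation, not part of the DIGITS code):
+
+```python
+import math
+
+# At equilibrium the discriminator assigns probability 0.5 to both real and
+# generated samples, so the binary cross-entropy loss settles around -log(0.5).
+print(-math.log(0.5))  # ~0.693
+```
+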
+Also note that we've added a metric in this model to track the `Chi-square` distance between the histogram of real pixel values and the histogram of generated pixel values.
+This is used as a proxy indication that the generator has learnt a good probability distribution.
+Getting this distance to go down is a necessary yet not sufficient condition.
+Note however how the `Chi-square` metric is going down below:
+
+![mnist chi square](mnist-chi-square.png)
+
+You can also open Tensorboard and point it to the `tb` sub-folder of the job directory to see samples of generated and real images (under the `images` tab).
+
+To start Tensorboard:
+
+```sh
+$ tensorboard --logdir <job_dir>/tb/
+```
+
+To open Tensorboard in a browser, open `http://localhost:6006`.
+
+In the image below, the first row shows generated images.
+The second row shows real images (from the dataset).
+This is updated periodically during training so you can monitor how well the network is doing.
+
+![MNIST TB samples](mnist-tb-samples.png)
+
+### Sampling the model
+
+We will see how to sample `z` to produce images.
+On the model page, select the `GAN` inference method and the `GAN` inference form.
+In the inference form, select the `MNIST Class sweep` task.
+
+![MNIST class sweep inference form](mnist-inference-form-class-sweep.png)
+
+Click `Test`.
+This shows a grid of digits, all of which were sampled using the same randomly generated `z`.
+The `z` vector is then concatenated with various shades of labels, using spherical interpolation.
+Every column shows how a digit slowly morphs into the next digit:
+
+![MNIST class sweep](mnist-class-sweep.png)
+
+This can also be visualized with an animated gif:
+
+![MNIST Animated](mnist-animated.gif)
+
+Now in the inference form, select `MNIST Style sweep` and click `Test`.
+This shows a new grid of digits.
+Every column shows how a digit slowly morphs from one "style" (i.e. one randomly generated `z` vector) into another style:
+
+![MNIST style sweep](mnist-style-sweep.png)
+
+### Training an encoder
+
+In order to avoid picking `z` randomly, we can train an encoder to generate the `z` vector, given an input image.
+Here we will fine-tune the discriminator such that it becomes an encoder:
+- we replace the last layer of the discriminator with a fully-connected layer that has as many neurons as there are elements in `z` (100 in our case),
+- we reverse the order of things in our GAN: the output of the discriminator/encoder is now connected to the input of the generator,
+- we change the loss function: we are now using the L2 distance between the generated image and the image in the dataset.
+
+> Note: the parameters of the generator must be frozen when training the encoder.
+
+To train the encoder, do this:
+- clone the `GAN-MNIST` model,
+- in the `Previous networks` tab, select the GAN model, select the last epoch then click `Customize`,
+- use this [network description](./network-mnist-encoder.py).
+
+Name your model `GAN-MNIST-Encoder` and click `Create`.
+
+Notice that the loss converges smoothly towards a low plateau:
+
+![MNIST encoder loss](mnist-encoder-loss.png)
+
+Now that we have an encoder, we can encode an image and find the corresponding `z` vector.
+On the `GAN-MNIST-Encoder` page,
+- select the `GAN` visualization method and the `MNIST encoder` task,
+- upload an image of a `3`,
+- click `Test One`.
+
+![MNIST encode image form](mnist-encode-image-form.png)
+
+>Note: in this GAN-encoder, class "3" is hard-coded in the encoder model **during inference**.
+If you want to encode another class, you will need to manually update this line in the model description: `self.y = tf.to_int32(3*tf.ones(shape=[self.batch_size]))`
+
+On the resulting page, you can see the input image (left), the reconstructed image (middle), and the corresponding `z` vector (right):
+
+![MNIST encode image](mnist-encode-image.png)
+
+Now that we have a `z` vector, we can do a class sweep for that particular "style":
+- copy the encoded `z` vector from the encoder,
+- move to the `GAN-MNIST` model page,
+- select the `GAN` visualization method and the `Grid` task,
+- select the `GAN` inference form and the `Class sweep` task,
+- paste the encoded `z` vector into the field:
+
+![MNIST styled class sweep form](mnist-styled-class-sweep-form.png)
+
+Now click `Test` and you will see a class sweep using the particular style that you specified:
+
+![MNIST styled class sweep](mnist-styled-class-sweep.png)
+
+## Celebrity faces
+
+### Downloading the CelebA dataset
+
+The Celebrity Faces (a.k.a. "CelebA") dataset may be downloaded from this [Dropbox account](https://www.dropbox.com/sh/8oqt9vytwxb3s4r/AAB06FXaQRUNtjW9ntaoPGvCa?dl=0).
+Download `img/img_align_celeba.zip` and `Anno/list_attr_celeba.txt`.
+Extract the ZIP file into a local folder.
+
+### Creating the CelebA dataset
+
+On the home page, click `New dataset>Images>GAN`.
+Specify the location of the attributes and images:
+
+![celeba dataset creation](celeba-dataset-form.png)
+
+Leave the other settings in their default state, name your dataset `CelebA-64` then click `Create`.
+
+You can explore the dataset using the `Explore` button on the dataset page.
+See below for some image samples:
+
+![celeba samples](exploring-celeba.png)
+
+### Training the CelebA model
+
+This model is very similar to the MNIST one but differs slightly:
+- it receives 64x64 colour images,
+- it has a few more layers,
+- it is not conditioned on labels.
+
+On the home page, click `New Model>Images>Other`.
+- select your dataset,
+- set the number of epochs to 60,
+- set the batch size to 64,
+- set mean subtraction to `None`,
+- select the `ADAM` solver,
+- set the learning rate to `5e-4`,
+- use only 1 GPU for this model.
+
+In the `custom network` tab, select `Tensorflow` and copy-paste this [network definition](./network-celebA.py).
+
+Name your model `GAN-CelebA` then click `Create`.
+
+You may notice that the learning curves don't converge towards 0.69 as smoothly as in the MNIST case.
+This is because the generator is overpowered by the discriminator.
+This is not necessarily an issue, as we will see later.
+
+![CelebA loss](celeba-loss.png)
+
+### Training a CelebA encoder
+
+Proceed as in the MNIST example but use this [network description](./network-celebA-encoder.py).
+
+### Generating attribute vectors
+
+The CelebA dataset comes with 40 different attributes for each image.
+We can use these labels to generate a characteristic `z` vector for each attribute.
+A way to do this is to compute the average `z` vector for images that have the attribute and subtract the average `z` vector for images that do not have the attribute.
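+For illustration, the per-attribute computation boils down to something like the following sketch (`zs` and `labels` are illustrative names for the encoded vectors and the +1/-1 attribute annotations):
+
+```python
+import numpy as np
+
+def attribute_vector(zs, labels, attribute_idx):
+    # zs: (n_images, 100) array of encoded z vectors
+    # labels: (n_images, n_attributes) CelebA annotations in {-1, +1}
+    has_attr = labels[:, attribute_idx] > 0
+    # average z of images with the attribute minus average z of images without it
+    return zs[has_attr].mean(axis=0) - zs[~has_attr].mean(axis=0)
+```
+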
+In DIGITS this can be done for all 40 attributes with the `gan_features.py` script:
+
+```sh
+$ export DIGITS_JOBS_DIR=/path/to/digits/jobs
+$ export GAN_ENCODER_JOB_ID=20170202-100209-72af # replace this with the Job ID of your GAN-CelebA-Encoder
+$ ./examples/gan/gan_features.py -j $DIGITS_JOBS_DIR $GAN_ENCODER_JOB_ID -g 0
+```
+
+Running the above command will sweep through the 200k images in the dataset and create a file named `attributes_z.pkl` that includes the 40 characteristic `z` vectors.
+
+### Sampling the CelebA model
+
+#### Setting image attributes
+
+You can find `z` vectors by encoding images from the dataset through the GAN-CelebA-Encoder model:
+- move to the model page for your `GAN-CelebA-Encoder`,
+- select the `GAN` visualization method, select the `CelebA Encoder` task,
+- select the `GAN` inference form, select the `Encode list` task,
+- specify the path to your attributes text file and the path to the image folder.
+
+![CelebA encode list form](celeba-encode-list-form.png)
+
+Click `Test`. You may see something like:
+
+![CelebA encode list](celeba-encode-list.png)
+
+Every row shows the input image (left), the reconstructed image (center) and the corresponding `z` vector (right).
+
+Now if you pick a `z` vector, you can add or remove attributes for that image:
+- open the `GAN-CelebA` model page,
+- select the `Image output` visualization method and set the `Data order` to `HWC`:
+
+![CelebA select image output](celeba-select-image-output.png)
+
+- select the `GAN` inference form and select the `CelebA - add/remove attributes` task,
+- specify the location of the attributes file you created with `gan_features.py`,
+- paste the `z` vector you found when using the `Encode list` task above,
+- click `Add row` a number of times to create new rows.
+Each row will generate an image with the corresponding attributes.
+If you leave all cells in a row blank, you will get the original image.
+If you set `Black Hair` to `+1` and `Blond Hair` to `-1`, this will transform a blond person into a person with dark hair.
+If you set `Smiling` to `-1` this will make a smiling person... not smile.
+
+See for example:
+
+![CelebA set attributes form](celeba-set-attributes-form.png)
+
+This will generate these images:
+
+![CelebA attributes](celeba-set-attributes.png)
+
+#### Analogy grid
+
+If you pick three `z` vectors you can generate an analogy similar to `king - man + woman = queen`.
+To experience this:
+- select the `GAN` visualization method, select the `Grid` task,
+- select the `GAN` inference form, select the `CelebA - analogy` task,
+- set the `source`, `sink 1` and `sink 2` vectors.
+
+This will create a grid with the following analogy: `destination = sink 1 + sink 2 - source` with:
+- `source` in the top-left corner,
+- `sink 1` in the top-right corner,
+- `sink 2` in the bottom-left corner,
+- `destination` in the bottom-right corner.
+
+![CelebA analogy form](celeba-analogy-form.png)
+
+This might result in a grid like this:
+
+```
+  man with blond hair looking straight
++ woman with dark hair looking to her left
+- woman with blond hair looking straight
+= man with dark hair looking slightly to his left
+```
+
+Pretty good, heh?
+
+![CelebA analogy](celeba-analogy.png)
+
+The grid can also be visualized through an animated image:
+
+![animated grid](gan-grid-animated.gif)
+
+### Embeddings visualization
+
+You might have noticed another byproduct of the `gan_features.py` script: a file named `embeddings.pkl`.
+This file contains `z` vectors for the first 10k images in the CelebA dataset.
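+The pickle itself is simply a dictionary holding an `images` array and a matching `zs` array; this is what the `gan_embeddings.py` script (added in this example) reads back:
+
+```python
+import pickle
+
+with open('embeddings.pkl', 'rb') as f:
+    embeddings = pickle.load(f)
+
+print(embeddings['images'].shape)  # sample images, e.g. (10000, 64, 64, 3) for CelebA-64
+print(embeddings['zs'].shape)      # corresponding z vectors, e.g. (10000, 100)
+```
+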
+We can use this to display image embeddings in Tensorboard: + +```sh +$ ./gan_embeddings.py embeddings.pkl +$ tensorboard --logdir ./gan-tb/ +``` + +Now open a browser on `http://localhost:6006`. +In the `Embeddings` tab you will see something similar to this: + +![animated embeddings](celeba-embeddings.gif) diff --git a/examples/gan/celeba-analogy-form.png b/examples/gan/celeba-analogy-form.png new file mode 100644 index 000000000..4cf71077c Binary files /dev/null and b/examples/gan/celeba-analogy-form.png differ diff --git a/examples/gan/celeba-analogy.png b/examples/gan/celeba-analogy.png new file mode 100644 index 000000000..8ffbf4272 Binary files /dev/null and b/examples/gan/celeba-analogy.png differ diff --git a/examples/gan/celeba-dataset-form.png b/examples/gan/celeba-dataset-form.png new file mode 100644 index 000000000..1d1b4ebd3 Binary files /dev/null and b/examples/gan/celeba-dataset-form.png differ diff --git a/examples/gan/celeba-embeddings.gif b/examples/gan/celeba-embeddings.gif new file mode 100644 index 000000000..f303e29e6 Binary files /dev/null and b/examples/gan/celeba-embeddings.gif differ diff --git a/examples/gan/celeba-encode-list-form.png b/examples/gan/celeba-encode-list-form.png new file mode 100644 index 000000000..ab0f95b1b Binary files /dev/null and b/examples/gan/celeba-encode-list-form.png differ diff --git a/examples/gan/celeba-encode-list.png b/examples/gan/celeba-encode-list.png new file mode 100644 index 000000000..900a83364 Binary files /dev/null and b/examples/gan/celeba-encode-list.png differ diff --git a/examples/gan/celeba-loss.png b/examples/gan/celeba-loss.png new file mode 100644 index 000000000..cb2ed81dd Binary files /dev/null and b/examples/gan/celeba-loss.png differ diff --git a/examples/gan/celeba-select-image-output.png b/examples/gan/celeba-select-image-output.png new file mode 100644 index 000000000..2b932a79a Binary files /dev/null and b/examples/gan/celeba-select-image-output.png differ diff --git a/examples/gan/celeba-set-attributes-form.png b/examples/gan/celeba-set-attributes-form.png new file mode 100644 index 000000000..6dbc9d401 Binary files /dev/null and b/examples/gan/celeba-set-attributes-form.png differ diff --git a/examples/gan/celeba-set-attributes.png b/examples/gan/celeba-set-attributes.png new file mode 100644 index 000000000..8ce31fd5d Binary files /dev/null and b/examples/gan/celeba-set-attributes.png differ diff --git a/examples/gan/create-mnist-generic-dataset.png b/examples/gan/create-mnist-generic-dataset.png new file mode 100644 index 000000000..020fea509 Binary files /dev/null and b/examples/gan/create-mnist-generic-dataset.png differ diff --git a/examples/gan/create-mnist-model.png b/examples/gan/create-mnist-model.png new file mode 100644 index 000000000..1f7927586 Binary files /dev/null and b/examples/gan/create-mnist-model.png differ diff --git a/examples/gan/exploring-celeba.png b/examples/gan/exploring-celeba.png new file mode 100644 index 000000000..721495afd Binary files /dev/null and b/examples/gan/exploring-celeba.png differ diff --git a/examples/gan/gan-grid-animated.gif b/examples/gan/gan-grid-animated.gif new file mode 100644 index 000000000..d38d53cc7 Binary files /dev/null and b/examples/gan/gan-grid-animated.gif differ diff --git a/examples/gan/gan_embeddings.py b/examples/gan/gan_embeddings.py new file mode 100755 index 000000000..9d4d89f4b --- /dev/null +++ b/examples/gan/gan_embeddings.py @@ -0,0 +1,86 @@ +#!/usr/bin/env python2 +# Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. 
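+#
+# Helper script for the GAN example: loads an embeddings pickle file (as
+# produced by gan_features.py), writes a sprite image of the sample images and
+# a TensorBoard projector configuration so that the z vectors can be browsed
+# in the TensorBoard "Embeddings" tab.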
+ +import argparse +import os +import pickle +import shutil + +import numpy as np +import PIL.Image +import tensorflow as tf +from tensorflow.contrib.tensorboard.plugins import projector + +TB_DIR = os.path.join(os.getcwd(), "gan-tb") +SPRITE_IMAGE_FILENAME = os.path.join(TB_DIR, "sprite.png") + +def save_tb_embeddings(embeddings_filename): + f = open(embeddings_filename, 'rb') + embeddings = pickle.load(f) + + images = embeddings['images'] + zs = embeddings['zs'] + + # overwrite Tensorboard log dir if necessary + if os.path.exists(TB_DIR): + shutil.rmtree(TB_DIR) + os.makedirs(TB_DIR) + + # create grid image + img_width, img_height = save_sprite_image(images) + + with tf.device('cpu:0'): + # create embedding var + embedding_var = tf.Variable(initial_value=zs) + + # save projector config + summary_writer = tf.summary.FileWriter(TB_DIR) + config = projector.ProjectorConfig() + embedding = config.embeddings.add() + embedding.tensor_name = embedding_var.name + embedding.sprite.image_path = SPRITE_IMAGE_FILENAME + embedding.sprite.single_image_dim.extend([img_width, img_height]) + projector.visualize_embeddings(summary_writer, config) + + # save embeddings + sess=tf.Session() + sess.run(embedding_var.initializer) + saver = tf.train.Saver([embedding_var]) + saver.save(sess, os.path.join(TB_DIR, 'model.ckpt')) + +def save_sprite_image(images): + n_embeddings = images.shape[0] + grid_cols = int(np.sqrt(n_embeddings)) + grid_rows = int(np.ceil(float(n_embeddings) / grid_cols)) + img_height, img_width, img_channels = images[0].shape + grid_image = np.empty((img_height * grid_rows, img_width * grid_cols, img_channels)) + for i, image in enumerate(images): + row = i / grid_cols + col = i % grid_cols + x = img_width * col + y = img_height * row + grid_image[y:y + img_height, x:x + img_width] = image + grid_image = PIL.Image.fromarray(grid_image.astype('uint8')) + grid_image.save(SPRITE_IMAGE_FILENAME) + return img_width, img_height + + +if __name__ == '__main__': + + parser = argparse.ArgumentParser(description='Inference tool - DIGITS') + + # Positional arguments + + parser.add_argument( + 'embeddings_file', + help='Embeddings pickle file') + + args = vars(parser.parse_args()) + + try: + save_tb_embeddings( + args['embeddings_file'], + ) + except Exception as e: + print('%s: %s' % (type(e).__name__, e.message)) + raise diff --git a/examples/gan/gan_features.py b/examples/gan/gan_features.py new file mode 100755 index 000000000..40702a43a --- /dev/null +++ b/examples/gan/gan_features.py @@ -0,0 +1,247 @@ +#!/usr/bin/env python2 +# Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. 
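+#
+# Helper script for the GAN example: runs the images of a dataset through a
+# trained GAN encoder model, accumulates the encoded z vectors for each
+# attribute label and saves attributes_z.pkl (one characteristic z vector per
+# attribute) as well as embeddings.pkl (images and z vectors for TensorBoard).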
+ +import argparse +import logging +import numpy as np +import pickle +import PIL.Image +import os +import sys +try: + from cStringIO import StringIO +except ImportError: + from StringIO import StringIO + +# Add path for DIGITS package +sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))) +import digits.config # noqa +from digits import utils, log # noqa +from digits.inference.errors import InferenceError # noqa +from digits.job import Job # noqa +from digits.utils.lmdbreader import DbReader # noqa + +# Import digits.config before caffe to set the path +import caffe_pb2 # noqa + +logger = logging.getLogger('digits.tools.inference') + +# number of image embeddings to store +N_EMBEDDINGS = 10000 + + +def parse_datum(value): + """ + Parse a Caffe datum + """ + datum = caffe_pb2.Datum() + datum.ParseFromString(value) + if datum.encoded: + s = StringIO() + s.write(datum.data) + s.seek(0) + img = PIL.Image.open(s) + img = np.array(img) + else: + import caffe.io + arr = caffe.io.datum_to_array(datum) + # CHW -> HWC + arr = arr.transpose((1, 2, 0)) + if arr.shape[2] == 1: + # HWC -> HW + arr = arr[:, :, 0] + elif arr.shape[2] == 3: + # BGR -> RGB + # XXX see issue #59 + arr = arr[:, :, [2, 1, 0]] + img = arr + return img + + +def save_attributes(attributes): + """ + Save attribute vectors + """ + zs = np.zeros(attributes['positive_attribute_z'].shape) + for i in xrange(attributes['n_attributes']): + zs[i] = attributes['positive_attribute_z'][i] / attributes['positive_count'][i] \ + - attributes['negative_attribute_z'][i] / attributes['negative_count'][i] + output = open('attributes_z.pkl', 'wb') + pickle.dump(zs, output) + + +def save_embeddings(embeddings): + filename = 'embeddings.pkl' + logger.info('Saving embeddings to %s...' 
% filename) + output = open(filename, 'wb') + pickle.dump(embeddings, output) + + +def infer(jobs_dir, + model_id, + epoch, + batch_size, + gpu): + """ + Perform inference on a list of images using the specified model + """ + # job directory defaults to that defined in DIGITS config + if jobs_dir == 'none': + jobs_dir = digits.config.config_value('jobs_dir') + + # load model job + model_dir = os.path.join(jobs_dir, model_id) + assert os.path.isdir(model_dir), "Model dir %s does not exist" % model_dir + model = Job.load(model_dir) + + # load dataset job + dataset_dir = os.path.join(jobs_dir, model.dataset_id) + assert os.path.isdir(dataset_dir), "Dataset dir %s does not exist" % dataset_dir + dataset = Job.load(dataset_dir) + for task in model.tasks: + task.dataset = dataset + + # retrieve snapshot file + task = model.train_task() + snapshot_filename = None + epoch = float(epoch) + if epoch == -1 and len(task.snapshots): + # use last epoch + epoch = task.snapshots[-1][1] + snapshot_filename = task.snapshots[-1][0] + else: + for f, e in task.snapshots: + if e == epoch: + snapshot_filename = f + break + if not snapshot_filename: + raise InferenceError("Unable to find snapshot for epoch=%s" % repr(epoch)) + + input_data = [] # sample data + input_labels = [] # sample labels + + # load images from database + feature_db_path = dataset.get_feature_db_path(utils.constants.TRAIN_DB) + feature_reader = DbReader(feature_db_path) + + label_db_path = dataset.get_label_db_path(utils.constants.TRAIN_DB) + label_reader = DbReader(label_db_path) + + embeddings = {'count': 0, 'images': None, 'zs': None} + + def aggregate(images, labels, attributes, embeddings): + # perform inference + outputs = model.train_task().infer_many( + images, + snapshot_epoch=epoch, + gpu=gpu, + resize=False) + z_vectors = outputs['output'][:, :100] + for image, label, z in zip(images, labels, z_vectors): + if embeddings['images'] is None: + embeddings['images'] = np.empty((N_EMBEDDINGS,) + image.shape) + if embeddings['zs'] is None: + embeddings['zs'] = np.empty((N_EMBEDDINGS,) + z.shape) + if embeddings['count'] < N_EMBEDDINGS: + embeddings['images'][embeddings['count']] = image + embeddings['zs'][embeddings['count']] = z + embeddings['count'] += 1 + if embeddings['count'] == N_EMBEDDINGS: + save_embeddings(embeddings) + + for attribute in range(attributes['n_attributes']): + if label[attribute] > 0: + attributes['positive_attribute_z'][attribute] += z + attributes['positive_count'][attribute] += 1 + else: + attributes['negative_attribute_z'][attribute] += z + attributes['negative_count'][attribute] += 1 + # save + save_attributes(attributes) + + n_input_samples = 0 + label_len = None + z_dim = 100 + for key, value in feature_reader.entries(): + img = parse_datum(value) + label = parse_datum(label_reader.entry(key))[0] + if label_len is None: + label_len = len(label) + attributes = { + 'n_attributes': label_len, + 'negative_count': np.zeros(label_len), + 'positive_count': np.zeros(label_len), + 'negative_attribute_z': np.zeros((label_len, z_dim)), + 'positive_attribute_z': np.zeros((label_len, z_dim)), + } + elif label_len != len(label): + raise ValueError("label len differs: %d vs %d" % (label_len, len(label))) + input_data.append(img) + input_labels.append(label) + n_input_samples = n_input_samples + 1 + if n_input_samples % batch_size == 0: + aggregate(input_data, input_labels, attributes, embeddings) + print("######## %d processed ########" % n_input_samples) + input_data = [] # sample data + input_labels = [] # sample labels 
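+
+    # flush whatever is left over after the loop when the sample count is not
+    # an exact multiple of the batch size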
+ + if n_input_samples % batch_size != 0: + aggregate(input_data, input_labels, attributes, embeddings) + print("######## %d processed ########" % n_input_samples) + +if __name__ == '__main__': + + parser = argparse.ArgumentParser(description='Inference tool - DIGITS') + + # Positional arguments + + parser.add_argument( + 'model', + help='Model ID') + + # Optional arguments + parser.add_argument( + '-e', + '--epoch', + default='-1', + help="Epoch (-1 for last)" + ) + + parser.add_argument( + '-j', + '--jobs_dir', + default='none', + help='Jobs directory (default: from DIGITS config)', + ) + + parser.add_argument( + '-b', + '--batch_size', + type=int, + default=1024, + help='Batch size', + ) + + parser.add_argument( + '-g', + '--gpu', + type=int, + default=None, + help='GPU to use (as in nvidia-smi output, default: None)', + ) + + parser.set_defaults(resize=True) + + args = vars(parser.parse_args()) + + try: + infer( + args['jobs_dir'], + args['model'], + args['epoch'], + args['batch_size'], + args['gpu'], + ) + except Exception as e: + logger.error('%s: %s' % (type(e).__name__, e.message)) + raise diff --git a/examples/gan/mnist-animated.gif b/examples/gan/mnist-animated.gif new file mode 100644 index 000000000..d1719763f Binary files /dev/null and b/examples/gan/mnist-animated.gif differ diff --git a/examples/gan/mnist-chi-square.png b/examples/gan/mnist-chi-square.png new file mode 100644 index 000000000..af19cb4a3 Binary files /dev/null and b/examples/gan/mnist-chi-square.png differ diff --git a/examples/gan/mnist-class-sweep.png b/examples/gan/mnist-class-sweep.png new file mode 100644 index 000000000..4e47d8dab Binary files /dev/null and b/examples/gan/mnist-class-sweep.png differ diff --git a/examples/gan/mnist-classification-dataset.png b/examples/gan/mnist-classification-dataset.png new file mode 100644 index 000000000..045ac1e5f Binary files /dev/null and b/examples/gan/mnist-classification-dataset.png differ diff --git a/examples/gan/mnist-encode-image-form.png b/examples/gan/mnist-encode-image-form.png new file mode 100644 index 000000000..2e28dc948 Binary files /dev/null and b/examples/gan/mnist-encode-image-form.png differ diff --git a/examples/gan/mnist-encode-image.png b/examples/gan/mnist-encode-image.png new file mode 100644 index 000000000..d8493e95b Binary files /dev/null and b/examples/gan/mnist-encode-image.png differ diff --git a/examples/gan/mnist-encoder-loss.png b/examples/gan/mnist-encoder-loss.png new file mode 100644 index 000000000..1065b9497 Binary files /dev/null and b/examples/gan/mnist-encoder-loss.png differ diff --git a/examples/gan/mnist-graph.png b/examples/gan/mnist-graph.png new file mode 100644 index 000000000..197b30e9a Binary files /dev/null and b/examples/gan/mnist-graph.png differ diff --git a/examples/gan/mnist-inference-form-class-sweep.png b/examples/gan/mnist-inference-form-class-sweep.png new file mode 100644 index 000000000..7dd6e2dc8 Binary files /dev/null and b/examples/gan/mnist-inference-form-class-sweep.png differ diff --git a/examples/gan/mnist-loss.png b/examples/gan/mnist-loss.png new file mode 100644 index 000000000..f6cb49bf6 Binary files /dev/null and b/examples/gan/mnist-loss.png differ diff --git a/examples/gan/mnist-style-sweep.png b/examples/gan/mnist-style-sweep.png new file mode 100644 index 000000000..ea4fc8a52 Binary files /dev/null and b/examples/gan/mnist-style-sweep.png differ diff --git a/examples/gan/mnist-styled-class-sweep-form.png b/examples/gan/mnist-styled-class-sweep-form.png new file mode 100644 index 
000000000..1b85912d6 Binary files /dev/null and b/examples/gan/mnist-styled-class-sweep-form.png differ diff --git a/examples/gan/mnist-styled-class-sweep.png b/examples/gan/mnist-styled-class-sweep.png new file mode 100644 index 000000000..fb2112663 Binary files /dev/null and b/examples/gan/mnist-styled-class-sweep.png differ diff --git a/examples/gan/mnist-tb-samples.png b/examples/gan/mnist-tb-samples.png new file mode 100644 index 000000000..5d70bf67f Binary files /dev/null and b/examples/gan/mnist-tb-samples.png differ diff --git a/examples/gan/network-celebA-encoder.py b/examples/gan/network-celebA-encoder.py new file mode 100644 index 000000000..605b4fde3 --- /dev/null +++ b/examples/gan/network-celebA-encoder.py @@ -0,0 +1,407 @@ +# The MIT License (MIT) +# +# Original work Copyright (c) 2016 Taehoon Kim +# Modified work Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: +# +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. +# +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import math +import numpy as np +import tensorflow as tf + +from tensorflow.python.framework import ops + +image_summary = tf.summary.image +scalar_summary = tf.summary.scalar +histogram_summary = tf.summary.histogram +merge_summary = tf.summary.merge +SummaryWriter = tf.summary.FileWriter + + +class batch_norm(object): + """ + This class creates an op that composes the specified tensor with a batch + normalization layer. + """ + + def __init__(self, epsilon=1e-5, momentum=0.9, name="batch_norm"): + """Instance initialization""" + with tf.variable_scope(name): + self.epsilon = epsilon + self.momentum = momentum + self.name = name + + def __call__(self, x, train=True): + """ + Functional interface + + Args: + x: tensor to compose + train: set to True during training and False otherwise + """ + return tf.contrib.layers.batch_norm(x, + decay=self.momentum, + updates_collections=None, + epsilon=self.epsilon, + scale=True, + is_training=train, + scope=self.name) + + +def conv2d(input_, output_dim, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="conv2d"): + """ + Compose specified symbol with 2D convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_dim: number of output features maps + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. 
+ """ + with tf.variable_scope(name): + w = tf.get_variable('w', [k_h, k_w, input_.get_shape()[-1], output_dim], + initializer=tf.truncated_normal_initializer(stddev=stddev)) + conv = tf.nn.conv2d(input_, w, strides=[1, d_h, d_w, 1], padding='SAME') + + biases = tf.get_variable('biases', [output_dim], initializer=tf.constant_initializer(0.0)) + conv = tf.nn.bias_add(conv, biases) + + return conv + + +def deconv2d(input_, output_shape, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="deconv2d", with_w=False): + """ + Compose specified symbol with 2D *transpose* convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_shape: output shape + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. + """ + with tf.variable_scope(name): + # filter : [height, width, output_channels, in_channels] + w = tf.get_variable('w', + [k_h, k_w, output_shape[-1], + input_.get_shape()[-1]], + initializer=tf.random_normal_initializer(stddev=stddev)) + deconv = tf.nn.conv2d_transpose(input_, w, + output_shape=output_shape, + strides=[1, d_h, d_w, 1]) + + biases = tf.get_variable('biases', [output_shape[-1]], initializer=tf.constant_initializer(0.0)) + deconv = tf.reshape(tf.nn.bias_add(deconv, biases), output_shape) + + if with_w: + return deconv, w, biases + else: + return deconv + + +def lrelu(x, leak=0.2, name="lrelu"): + """Compose specified tensor with leaky Rectifier Linear Unit""" + return tf.maximum(x, leak*x) + + +def linear(input_, output_size, scope=None, stddev=0.02, bias_start=0.0, with_w=False): + """ + Compose specified tensor with linear (fully-connected) layer + + Args: + input_: tensor to compose. Shape: [N, M] + output_size: number of output neurons + scope: name scope + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + with_w: whether to also return parameter variables + + Returns: + Composed tensor. Shape: [N, output_size] + """ + shape = input_.get_shape().as_list() + + with tf.variable_scope(scope or "Linear"): + matrix = tf.get_variable("Matrix", [shape[1], output_size], tf.float32, + tf.random_normal_initializer(stddev=stddev)) + bias = tf.get_variable("bias", [output_size], + initializer=tf.constant_initializer(bias_start)) + if with_w: + return tf.matmul(input_, matrix) + bias, matrix, bias + else: + return tf.matmul(input_, matrix) + bias + + +class UserModel(Tower): + """ + User Model definition + + DIGITS creates an instance of this class for every tower it needs + to create. This includes: + - one for training, + - one for validation, + - one for testing. + + In the case of multi-GPU training, one training instance is created + for every GPU. DIGITS takes care of doing the gradient averaging + across GPUs so this class only needs to define the inference op + and desired loss/cost function. + """ + + def __init__(self, *args, **kwargs): + """ + Identify the correct input nodes. + + In the parent class, DIGITS conveniently sets the following fields: + - self.is_training: whether this is a training graph + - self.is_inference: whether this graph is created for inference/testing + - self.x: input node. Shape: [N, H, W, C] + - self.y: label. Shape: [N] for scalar labels, [N, H, W, C] otherwise. 
+ Only defined if self._is_training is True + """ + super(UserModel, self).__init__(*args, **kwargs) + + image_size = 64 + output_size = 64 + c_dim = 3 + z_dim = 100 + + self.dcgan_init(image_size=image_size, + output_size=output_size, + c_dim=c_dim, + z_dim=z_dim, + ) + + @model_property + def inference(self): + """ op to use for inference """ + + # scale back to [0, 255] range + images = (self.G * 127) + 128 + images_flat = tf.reshape(images, [self.batch_size, self.image_size * self.image_size * self.c_dim]) + # concatenate encoded z and generated image into a single flat structure + zgen_flat = tf.reshape(self.DzGEN, [self.batch_size, self.z_dim]) + return tf.concat(1, [zgen_flat, images_flat]) + + @model_property + def loss(self): + """ + Loss function + + Returns either an op or a list of dicts. + If the returned value is an op then DIGITS will optimize against this op + with respect to all trainable variables. + If the returned value is a list then DIGITS will optimize against each + loss in the list with respect to the specified variables. + """ + + # here we are returning a list because we want to alternately optimize the + # discriminator and the generator. + + losses = [ + {'loss': self.dzgen_loss, 'vars': self.d_vars}, + ] + return losses + + def dcgan_init(self, + image_size, + output_size, + z_dim, + c_dim, + gf_dim=64, + df_dim=64, + gfc_dim=1024, + dfc_dim=1024, + ): + """ + + Args: + output_size: (optional) The resolution in pixels of the images. [64] + z_dim: (optional) Dimension of dim for Z. [100] + gf_dim: (optional) Dimension of gen filters in first conv layer. [64] + df_dim: (optional) Dimension of discrim filters in first conv layer. [64] + gfc_dim: (optional) Dimension of gen units for for fully connected layer. [1024] + dfc_dim: (optional) Dimension of discrim units for fully connected layer. [1024] + c_dim: (optional) Dimension of image color. For grayscale input, set to 1. [3] + """ + self.image_size = image_size + self.output_size = output_size + + self.z_dim = z_dim + + self.gf_dim = gf_dim + self.df_dim = df_dim + + self.gfc_dim = gfc_dim + self.dfc_dim = dfc_dim + + self.c_dim = c_dim + + self.batch_size = tf.shape(self.x)[0] + + self.soft_label_margin = 0.1 + + # batch normalization : deals with poor initialization helps gradient flow + self.d_bn1 = batch_norm(name='d_bn1') + self.d_bn2 = batch_norm(name='d_bn2') + self.d_bn3 = batch_norm(name='d_bn3') + + self.g_bn0 = batch_norm(name='g_bn0') + self.g_bn1 = batch_norm(name='g_bn1') + self.g_bn2 = batch_norm(name='g_bn2') + self.g_bn3 = batch_norm(name='g_bn3') + + self.build_model() + + def build_model(self): + + # reshape/rescale x + self.images = (tf.reshape(self.x, + shape=[self.batch_size, + self.image_size, + self.image_size, + self.c_dim], + name='x_reshaped') - 128)/ 127. 
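+        # (this maps byte values in [0, 255] to roughly [-1, 1], the same
+        # range as the tanh output of the generator that the L2 loss below
+        # compares against)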
+ + # create discriminator/encoder + self.DzGEN, self.D_logits = self.discriminator(self.images, reuse=False) + # create generator + self.G = self.generator(self.DzGEN) + # loss is now L2 distance between input image and generator output + self.dzgen_loss = tf.reduce_mean(tf.square(self.G - self.images), name="loss_DzGEN") + + # debug + self.summaries.append(image_summary("G", self.G, max_outputs=3)) + self.summaries.append(image_summary("X", self.images, max_outputs=3)) + self.summaries.append(histogram_summary("G_hist", self.G)) + self.summaries.append(histogram_summary("X_hist", self.images)) + self.summaries.append(scalar_summary("DzGen_loss", self.dzgen_loss)) + + # all trainable variables + t_vars = tf.trainable_variables() + # d variables + self.d_vars = [var for var in t_vars if 'd_' in var.name] + + def discriminator(self, image, y=None, reuse=False): + """ + Create the discriminator + + This creates a string of layers: + - input - [N, 64, 64, 3] + - conv layer with 64 5x5 kernels and 2x2 stride - [N, 32, 32, 64] + - leaky relu - [N, 32, 32, 64] + - conv layer with 128 5x5 kernels and 2x2 stride - [N, 16, 16, 32] + - batch norm - [N, 16, 16, 32] + - leaky relu - [N, 16, 16, 32] + - conv layer with 256 5x5 kernels and 2x2 stride - [N, 8, 8, 256] + - batch norm - [N, 8, 8, 256] + - leaky relu - [N, 8, 8, 256] + - conv layer with 256 5x5 kernels and 2x2 stride - [N, 4, 4, 512] + - batch norm - [N, 4, 4, 512] + - leaky relu - [N, 4, 4, 512] + - flatten - [N, 8192] + - linear layer with 1 output neurons - [N, 1] + - sigmoid - [N,1] + + Args: + image: batch of input images - shape: [N, H, W, C] + y: batch of one-hot encoded labels - shape: [N, K] + reuse: whether to re-use previously created variables + """ + + # NOTE: although we are really creating an encoder here we need to re-use the same + # variable scope (i.e. 
"discriminator") as in the original GAN so we can re-use + # learned parameters + with tf.variable_scope("discriminator") as scope: + if reuse: + scope.reuse_variables() + + h0 = lrelu(conv2d(image, self.df_dim, name='d_h0_conv')) + h1 = lrelu(self.d_bn1(conv2d(h0, self.df_dim*2, name='d_h1_conv'), train=self.is_training)) + h2 = lrelu(self.d_bn2(conv2d(h1, self.df_dim*4, name='d_h2_conv'), train=self.is_training)) + h3 = lrelu(self.d_bn3(conv2d(h2, self.df_dim*8, name='d_h3_conv'), train=self.is_training)) + h3_size = ((self.output_size // 16) ** 2) * self.df_dim * 8 + h4 = linear(tf.reshape(h3, [self.batch_size, h3_size]), self.z_dim, 'd_h3_lin_retrain') + return h4, h4 + + def generator(self, z, y=None): + """ + Create the generator + + This creates a string of layers: + - input - [N, 100] + - linear layer with 8192 output neurons - [N, 8192] + - reshape - [N, 4, 4, 512] + - batch norm - [N, 4, 4, 512] + - relu - [N, 4, 4, 512] + - transpose convolution with 256 filters and stride 2 - [N, 8, 8, 256] + - batch norm - [N, 8, 8, 256] + - relu - [N, 8, 8, 256] + - transpose convolution with 128 filters and stride 2 - [N, 16, 16, 128] + - batch norm - [N, 16, 16, 128] + - relu - [N, 16, 16, 128] + - transpose convolution with 64 filters and stride 2 - [N, 32, 32, 64] + - batch norm - [N, 32, 32, 64] + - relu - [N, 32, 32, 64] + - transpose convolution with 3 filters and stride 2 - [N, 64, 64, 3] + - tanh - [N, 64, 64, 3] + """ + with tf.variable_scope("generator") as scope: + s = self.output_size + s2, s4, s8, s16 = int(s/2), int(s/4), int(s/8), int(s/16) + + # project `z` and reshape + self.z_, self.h0_w, self.h0_b = linear(z, self.gf_dim*8*s16*s16, 'g_h0_lin', with_w=True) + + self.h0 = tf.reshape(self.z_, [-1, s16, s16, self.gf_dim * 8]) + h0 = tf.nn.relu(self.g_bn0(self.h0, train=False)) + + self.h1, self.h1_w, self.h1_b = deconv2d(h0, + [self.batch_size, s8, s8, self.gf_dim*4], name='g_h1', with_w=True) + h1 = tf.nn.relu(self.g_bn1(self.h1, train=False)) + + h2, self.h2_w, self.h2_b = deconv2d(h1, + [self.batch_size, s4, s4, self.gf_dim*2], name='g_h2', with_w=True) + h2 = tf.nn.relu(self.g_bn2(h2, train=False)) + + h3, self.h3_w, self.h3_b = deconv2d(h2, + [self.batch_size, s2, s2, self.gf_dim*1], name='g_h3', with_w=True) + h3 = tf.nn.relu(self.g_bn3(h3, train=False)) + + h4, self.h4_w, self.h4_b = deconv2d(h3, + [self.batch_size, s, s, self.c_dim], name='g_h4', with_w=True) + + return tf.nn.tanh(h4) diff --git a/examples/gan/network-celebA.py b/examples/gan/network-celebA.py new file mode 100644 index 000000000..8e454b5bb --- /dev/null +++ b/examples/gan/network-celebA.py @@ -0,0 +1,447 @@ +# The MIT License (MIT) +# +# Original work Copyright (c) 2016 Taehoon Kim +# Modified work Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: +# +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. 
+# +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import math +import numpy as np +import tensorflow as tf + +from tensorflow.python.framework import ops + +image_summary = tf.summary.image +scalar_summary = tf.summary.scalar +histogram_summary = tf.summary.histogram +merge_summary = tf.summary.merge +SummaryWriter = tf.summary.FileWriter + + +class batch_norm(object): + """ + This class creates an op that composes the specified tensor with a batch + normalization layer. + """ + + def __init__(self, epsilon=1e-5, momentum=0.9, name="batch_norm"): + """Instance initialization""" + with tf.variable_scope(name): + self.epsilon = epsilon + self.momentum = momentum + self.name = name + + def __call__(self, x, train=True): + """ + Functional interface + + Args: + x: tensor to compose + train: set to True during training and False otherwise + """ + return tf.contrib.layers.batch_norm(x, + decay=self.momentum, + updates_collections=None, + epsilon=self.epsilon, + scale=True, + is_training=train, + scope=self.name) + + +def conv2d(input_, output_dim, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="conv2d"): + """ + Compose specified symbol with 2D convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_dim: number of output features maps + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. + """ + with tf.variable_scope(name): + w = tf.get_variable('w', [k_h, k_w, input_.get_shape()[-1], output_dim], + initializer=tf.truncated_normal_initializer(stddev=stddev)) + conv = tf.nn.conv2d(input_, w, strides=[1, d_h, d_w, 1], padding='SAME') + + biases = tf.get_variable('biases', [output_dim], initializer=tf.constant_initializer(0.0)) + conv = tf.nn.bias_add(conv, biases) + + return conv + + +def deconv2d(input_, output_shape, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="deconv2d", with_w=False): + """ + Compose specified symbol with 2D *transpose* convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_shape: output shape + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. 
+ """ + with tf.variable_scope(name): + # filter : [height, width, output_channels, in_channels] + w = tf.get_variable('w', + [k_h, k_w, output_shape[-1], + input_.get_shape()[-1]], + initializer=tf.random_normal_initializer(stddev=stddev)) + deconv = tf.nn.conv2d_transpose(input_, w, + output_shape=output_shape, + strides=[1, d_h, d_w, 1]) + + biases = tf.get_variable('biases', [output_shape[-1]], initializer=tf.constant_initializer(0.0)) + deconv = tf.reshape(tf.nn.bias_add(deconv, biases), output_shape) + + if with_w: + return deconv, w, biases + else: + return deconv + + +def lrelu(x, leak=0.2, name="lrelu"): + """Compose specified tensor with leaky Rectifier Linear Unit""" + return tf.maximum(x, leak*x) + + +def linear(input_, output_size, scope=None, stddev=0.02, bias_start=0.0, with_w=False): + """ + Compose specified tensor with linear (fully-connected) layer + + Args: + input_: tensor to compose. Shape: [N, M] + output_size: number of output neurons + scope: name scope + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + with_w: whether to also return parameter variables + + Returns: + Composed tensor. Shape: [N, output_size] + """ + shape = input_.get_shape().as_list() + + with tf.variable_scope(scope or "Linear"): + matrix = tf.get_variable("Matrix", [shape[1], output_size], tf.float32, + tf.random_normal_initializer(stddev=stddev)) + bias = tf.get_variable("bias", [output_size], + initializer=tf.constant_initializer(bias_start)) + if with_w: + return tf.matmul(input_, matrix) + bias, matrix, bias + else: + return tf.matmul(input_, matrix) + bias + + +class UserModel(Tower): + """ + User Model definition + + DIGITS creates an instance of this class for every tower it needs + to create. This includes: + - one for training, + - one for validation, + - one for testing. + + In the case of multi-GPU training, one training instance is created + for every GPU. DIGITS takes care of doing the gradient averaging + across GPUs so this class only needs to define the inference op + and desired loss/cost function. + """ + + def __init__(self, *args, **kwargs): + """ + Identify the correct input nodes. + + In the parent class, DIGITS conveniently sets the following fields: + - self.is_training: whether this is a training graph + - self.is_inference: whether this graph is created for inference/testing + - self.x: input node. Shape: [N, H, W, C] + - self.y: label. Shape: [N] for scalar labels, [N, H, W, C] otherwise. + Only defined if self._is_training is True + """ + super(UserModel, self).__init__(*args, **kwargs) + + image_size = 64 + output_size = 64 + c_dim = 3 + z_dim = 100 + + self.dcgan_init(image_size=image_size, + output_size=output_size, + c_dim=c_dim, + z_dim=z_dim, + ) + + @model_property + def inference(self): + """op to use for inference""" + + # scale back to [0, 255] range + return tf.to_int32((self.G+127) * 128) + + @model_property + def loss(self): + """ + Loss function + + Returns either an op or a list of dicts. + If the returned value is an op then DIGITS will optimize against this op + with respect to all trainable variables. + If the returned value is a list then DIGITS will optimize against each + loss in the list with respect to the specified variables. + """ + + # here we are returning a list because we want to alternately optimize the + # discriminator and the generator. 
+ + losses = [ + {'loss': self.d_loss, 'vars': self.d_vars}, + {'loss': self.g_loss, 'vars': self.g_vars} + ] + return losses + + def dcgan_init(self, + image_size, + output_size, + z_dim, + c_dim, + gf_dim=64, + df_dim=64, + gfc_dim=1024, + dfc_dim=1024, + ): + """ + + Args: + output_size: (optional) The resolution in pixels of the images. [64] + z_dim: (optional) Dimension of dim for Z. [100] + gf_dim: (optional) Dimension of gen filters in first conv layer. [64] + df_dim: (optional) Dimension of discrim filters in first conv layer. [64] + gfc_dim: (optional) Dimension of gen units for for fully connected layer. [1024] + dfc_dim: (optional) Dimension of discrim units for fully connected layer. [1024] + c_dim: (optional) Dimension of image color. For grayscale input, set to 1. [3] + """ + self.image_size = image_size + self.output_size = output_size + + self.z_dim = z_dim + + self.gf_dim = gf_dim + self.df_dim = df_dim + + self.gfc_dim = gfc_dim + self.dfc_dim = dfc_dim + + self.c_dim = c_dim + + self.batch_size = tf.shape(self.x)[0] + + self.soft_label_margin = 0.1 + + # batch normalization : deals with poor initialization helps gradient flow + self.d_bn1 = batch_norm(name='d_bn1') + self.d_bn2 = batch_norm(name='d_bn2') + self.d_bn3 = batch_norm(name='d_bn3') + + self.g_bn0 = batch_norm(name='g_bn0') + self.g_bn1 = batch_norm(name='g_bn1') + self.g_bn2 = batch_norm(name='g_bn2') + self.g_bn3 = batch_norm(name='g_bn3') + + self.build_model() + + def build_model(self): + + if not self.is_inference: + # create both the generator and the discriminator + # self.x is a batch of images - shape: [N, H, W, C] + # self.y is a vector of labels - shape: [N] + + # sample z from a normal distribution + self.z = tf.random_normal(shape=[self.batch_size, self.z_dim], dtype=tf.float32, seed=None, name='z') + + # scale input to [-1, +1] range + self.images = (tf.reshape(self.x, + shape=[self.batch_size, + self.image_size, + self.image_size, + self.c_dim], + name='x_reshaped') - 128)/ 127. + + # create generator + self.G = self.generator(self.z) + # create an instance of the discriminator (real samples) + self.D, self.D_logits = self.discriminator(self.images, reuse=False) + # create another identical instance of the discriminator (fake samples) + # NOTE: we are re-using variables here to share weights between the two + # instances of the discriminator + self.D_, self.D_logits_ = self.discriminator(self.G, reuse=True) + + # we are using the cross entropy loss for all these losses + # note the use of the soft label smoothing here to prevent D from getting overly confident + # on real samples + self.d_loss_real = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(self.D_logits, + tf.ones_like(self.D) - self.soft_label_margin, + name="loss_D_real")) + self.d_loss_fake = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(self.D_logits_, + tf.zeros_like(self.D_), + name="loss_D_fake")) + self.d_loss = (self.d_loss_real + self.d_loss_fake) / 2. 
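+            # with the soft labels above, D is trained towards
+            # (1 - soft_label_margin) on real images and towards 0 on
+            # generated images
+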
+ # the typical GAN set-up is that of a minimax game where D is trying to minimize its own error and G is trying to maximize D's error + # however note how we are flipping G labels here: instead of maximizing D's error, we are minimizing D's error on the 'wrong' label + # this trick helps produce a stronger gradient + self.g_loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(self.D_logits_, + tf.ones_like(self.D_) + self.soft_label_margin, + name="loss_G")) + + # debug + self.summaries.append(image_summary("G", self.G, max_outputs=3)) + self.summaries.append(image_summary("X", self.images, max_outputs=3)) + self.summaries.append(histogram_summary("G_hist", self.G)) + self.summaries.append(histogram_summary("X_hist", self.images)) + self.summaries.append(scalar_summary("d_loss_real", self.d_loss_real)) + self.summaries.append(scalar_summary("d_loss_fake", self.d_loss_fake)) + self.summaries.append(scalar_summary("g_loss", self.g_loss)) + self.summaries.append(scalar_summary("d_loss", self.d_loss)) + + # all trainable variables + t_vars = tf.trainable_variables() + # G variables + self.g_vars = [var for var in t_vars if 'g_' in var.name] + # D variables + self.d_vars = [var for var in t_vars if 'd_' in var.name] + + # Extra hook for debug: log chi-square distance between G's output histogram and the dataset's histogram + value_range = [0.0, 1.0] + nbins = 100 + hist_g = tf.histogram_fixed_width(self.G, value_range, nbins=nbins, dtype=tf.float32) / nbins + hist_images = tf.histogram_fixed_width(self.images, value_range, nbins=nbins, dtype=tf.float32) / nbins + chi_square = tf.reduce_mean(tf.div(tf.square(hist_g - hist_images), hist_g + hist_images + 1e-5)) + self.summaries.append(scalar_summary("chi_square", chi_square)) + else: + # Create only the generator + self.x = tf.reshape(self.x, shape=[self.batch_size, self.z_dim]) + self.z = self.x[:, :self.z_dim] + self.G = self.generator(self.z) + + def discriminator(self, image, y=None, reuse=False): + """ + Create the discriminator + + This creates a string of layers: + - input - [N, 64, 64, 3] + - conv layer with 64 5x5 kernels and 2x2 stride - [N, 32, 32, 64] + - leaky relu - [N, 32, 32, 64] + - conv layer with 128 5x5 kernels and 2x2 stride - [N, 16, 16, 32] + - batch norm - [N, 16, 16, 32] + - leaky relu - [N, 16, 16, 32] + - conv layer with 256 5x5 kernels and 2x2 stride - [N, 8, 8, 256] + - batch norm - [N, 8, 8, 256] + - leaky relu - [N, 8, 8, 256] + - conv layer with 256 5x5 kernels and 2x2 stride - [N, 4, 4, 512] + - batch norm - [N, 4, 4, 512] + - leaky relu - [N, 4, 4, 512] + - flatten - [N, 8192] + - linear layer with 1 output neurons - [N, 1] + - sigmoid - [N,1] + + Args: + image: batch of input images - shape: [N, H, W, C] + y: batch of one-hot encoded labels - shape: [N, K] + reuse: whether to re-use previously created variables + """ + with tf.variable_scope("discriminator") as scope: + if reuse: + scope.reuse_variables() + + h0 = lrelu(conv2d(image, self.df_dim, name='d_h0_conv')) + h1 = lrelu(self.d_bn1(conv2d(h0, self.df_dim * 2, name='d_h1_conv'), train=self.is_training)) + h2 = lrelu(self.d_bn2(conv2d(h1, self.df_dim * 4, name='d_h2_conv'), train=self.is_training)) + h3 = lrelu(self.d_bn3(conv2d(h2, self.df_dim * 8, name='d_h3_conv'), train=self.is_training)) + h3_size = ((self.output_size // 16) ** 2) * self.df_dim * 8 + h4 = linear(tf.reshape(h3, [self.batch_size, h3_size]), 1, 'd_h3_lin') + + return tf.nn.sigmoid(h4), h4 + + def generator(self, z, y=None): + """ + Create the generator + + This creates a string 
of layers: + - input - [N, 100] + - linear layer with 8192 output neurons - [N, 8192] + - reshape - [N, 4, 4, 512] + - batch norm - [N, 4, 4, 512] + - relu - [N, 4, 4, 512] + - transpose convolution with 256 filters and stride 2 - [N, 8, 8, 256] + - batch norm - [N, 8, 8, 256] + - relu - [N, 8, 8, 256] + - transpose convolution with 128 filters and stride 2 - [N, 16, 16, 128] + - batch norm - [N, 16, 16, 128] + - relu - [N, 16, 16, 128] + - transpose convolution with 64 filters and stride 2 - [N, 32, 32, 64] + - batch norm - [N, 32, 32, 64] + - relu - [N, 32, 32, 64] + - transpose convolution with 3 filters and stride 2 - [N, 64, 64, 3] + - tanh - [N, 64, 64, 3] + """ + with tf.variable_scope("generator") as scope: + + s = self.output_size + s2, s4, s8, s16 = int(s // 2), int(s // 4), int(s // 8), int(s // 16) + + # project `z` and reshape + self.z_, self.h0_w, self.h0_b = linear(z, self.gf_dim * 8 * s16 * s16, 'g_h0_lin', with_w=True) + + self.h0 = tf.reshape(self.z_, [-1, s16, s16, self.gf_dim * 8]) + h0 = tf.nn.relu(self.g_bn0(self.h0, train=self.is_training)) + + self.h1, self.h1_w, self.h1_b = deconv2d(h0, + [self.batch_size, s8, s8, self.gf_dim * 4], name='g_h1', with_w=True) + h1 = tf.nn.relu(self.g_bn1(self.h1, train=self.is_training)) + + h2, self.h2_w, self.h2_b = deconv2d(h1, + [self.batch_size, s4, s4, self.gf_dim * 2], name='g_h2', with_w=True) + h2 = tf.nn.relu(self.g_bn2(h2, train=self.is_training)) + + h3, self.h3_w, self.h3_b = deconv2d(h2, + [self.batch_size, s2, s2, self.gf_dim * 1], name='g_h3', with_w=True) + h3 = tf.nn.relu(self.g_bn3(h3, train=self.is_training)) + + h4, self.h4_w, self.h4_b = deconv2d(h3, + [self.batch_size, s, s, self.c_dim], name='g_h4', with_w=True) + + return tf.nn.tanh(h4) diff --git a/examples/gan/network-mnist-encoder.py b/examples/gan/network-mnist-encoder.py new file mode 100644 index 000000000..2567aaa9f --- /dev/null +++ b/examples/gan/network-mnist-encoder.py @@ -0,0 +1,432 @@ +# The MIT License (MIT) +# +# Original work Copyright (c) 2016 Taehoon Kim +# Modified work Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: +# +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. +# +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. 
+ +import math +import numpy as np +import tensorflow as tf + +from tensorflow.python.framework import ops + +image_summary = tf.summary.image +scalar_summary = tf.summary.scalar +histogram_summary = tf.summary.histogram +merge_summary = tf.summary.merge +SummaryWriter = tf.summary.FileWriter + + +class batch_norm(object): + """ + This class creates an op that composes the specified tensor with a batch + normalization layer. + """ + + def __init__(self, epsilon=1e-5, momentum=0.9, name="batch_norm"): + """Instance initialization""" + with tf.variable_scope(name): + self.epsilon = epsilon + self.momentum = momentum + self.name = name + + def __call__(self, x, train=True): + """ + Functional interface + + Args: + x: tensor to compose + train: set to True during training and False otherwise + """ + return tf.contrib.layers.batch_norm(x, + decay=self.momentum, + updates_collections=None, + epsilon=self.epsilon, + scale=True, + is_training=train, + scope=self.name) + + +def conv_cond_concat(x, y): + """ + Concatenate conditioning matrix across channel axis. + + The specified input tensor is concatenated with K feature maps (K = number of classes) + across the channel dimension. Each of the K feature maps is set to all-zeros except for + the one whose index matches the target class (which is set to all-ones). + + Args: + x: non-conditioned tensor. Shape: [N, H, W, C] + y: one-hot encoded conditioning matrix. Shape: [N, K] + + Returns: + conditioned feature map. Shape: [N, H, W, C + K] + """ + x_shapes = x.get_shape() + y_shapes = y.get_shape() + batch_size = tf.shape(x)[0] + return tf.concat(3, [x, y * tf.ones([batch_size, int(x_shapes[1]), int(x_shapes[2]), int(y_shapes[3])])]) + + +def conv2d(input_, output_dim, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="conv2d"): + """ + Compose specified symbol with 2D convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_dim: number of output features maps + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. + """ + with tf.variable_scope(name): + w = tf.get_variable('w', [k_h, k_w, input_.get_shape()[-1], output_dim], + initializer=tf.truncated_normal_initializer(stddev=stddev)) + conv = tf.nn.conv2d(input_, w, strides=[1, d_h, d_w, 1], padding='SAME') + + biases = tf.get_variable('biases', [output_dim], initializer=tf.constant_initializer(0.0)) + conv = tf.nn.bias_add(conv, biases) + + return conv + + +def deconv2d(input_, output_shape, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="deconv2d", with_w=False): + """ + Compose specified symbol with 2D *transpose* convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_shape: output shape + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. 
+ """ + with tf.variable_scope(name): + # filter : [height, width, output_channels, in_channels] + w = tf.get_variable('w', + [k_h, k_w, output_shape[-1], + input_.get_shape()[-1]], + initializer=tf.random_normal_initializer(stddev=stddev)) + deconv = tf.nn.conv2d_transpose(input_, w, + output_shape=output_shape, + strides=[1, d_h, d_w, 1]) + + biases = tf.get_variable('biases', [output_shape[-1]], initializer=tf.constant_initializer(0.0)) + deconv = tf.reshape(tf.nn.bias_add(deconv, biases), output_shape) + + if with_w: + return deconv, w, biases + else: + return deconv + + +def lrelu(x, leak=0.2, name="lrelu"): + """Compose specified tensor with leaky Rectifier Linear Unit""" + return tf.maximum(x, leak*x) + + +def linear(input_, output_size, scope=None, stddev=0.02, bias_start=0.0, with_w=False): + """ + Compose specified tensor with linear (fully-connected) layer + + Args: + input_: tensor to compose. Shape: [N, M] + output_size: number of output neurons + scope: name scope + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + with_w: whether to also return parameter variables + + Returns: + Composed tensor. Shape: [N, output_size] + """ + shape = input_.get_shape().as_list() + + with tf.variable_scope(scope or "Linear"): + matrix = tf.get_variable("Matrix", [shape[1], output_size], tf.float32, + tf.random_normal_initializer(stddev=stddev)) + bias = tf.get_variable("bias", [output_size], + initializer=tf.constant_initializer(bias_start)) + if with_w: + return tf.matmul(input_, matrix) + bias, matrix, bias + else: + return tf.matmul(input_, matrix) + bias + + +class UserModel(Tower): + """ + User Model definition + + DIGITS creates an instance of this class for every tower it needs + to create. This includes: + - one for training, + - one for validation, + - one for testing. + + In the case of multi-GPU training, one training instance is created + for every GPU. DIGITS takes care of doing the gradient averaging + across GPUs so this class only needs to define the inference op + and desired loss/cost function. + """ + + def __init__(self, *args, **kwargs): + """ + Identify the correct input nodes. + + In the parent class, DIGITS conveniently sets the following fields: + - self.is_training: whether this is a training graph + - self.is_inference: whether this graph is created for inference/testing + - self.x: input node. Shape: [N, H, W, C] + - self.y: label. Shape: [N] for scalar labels, [N, H, W, C] otherwise. + Only defined if self._is_training is True + """ + super(UserModel, self).__init__(*args, **kwargs) + + # initialize graph with parameters for MNIST + self.dcgan_init(image_size=28, + y_dim=10, + output_size=28, + c_dim=1, + ) + + @model_property + def inference(self): + """ op to use for inference """ + # rescale + images = self.G * 255 + # flatten G output + images_flat = tf.reshape(images, [self.batch_size, self.image_size * self.image_size * self.c_dim]) + # now return encoded z concatenated with G output + # during inference the visualization script will need to extract + # both z and the generated image to display them separately + zgen_flat = tf.reshape(self.DzGEN, [self.batch_size, self.z_dim]) + return tf.concat(1, [zgen_flat, images_flat]) + + @model_property + def loss(self): + """ + Loss function + + Returns either an op or a list of dicts. + If the returned value is an op then DIGITS will optimize against this op + with respect to all trainable variables. 
+ If the returned value is a list then DIGITS will optimize against each + loss in the list with respect to the specified variables. + """ + + # here we are returning a list because we want to alternately optimize the + # discriminator on real samples, the discriminator on fake samples and the + # generator. + losses = [ + {'loss': self.dzgen_loss, 'vars': self.d_vars}, + ] + return losses + + def dcgan_init(self, image_size=108, + output_size=64, y_dim=None, z_dim=100, gf_dim=64, df_dim=64, + gfc_dim=1024, dfc_dim=1024, c_dim=3): + """ + Create the model + + Args: + output_size: (optional) The resolution in pixels of the images. [64] + y_dim: (optional) Dimension of dim for y. [None] + z_dim: (optional) Dimension of dim for Z. [100] + gf_dim: (optional) Dimension of gen filters in first conv layer. [64] + df_dim: (optional) Dimension of discrim filters in first conv layer. [64] + gfc_dim: (optional) Dimension of gen units for for fully connected layer. [1024] + dfc_dim: (optional) Dimension of discrim units for fully connected layer. [1024] + c_dim: (optional) Dimension of image color. For grayscale input, set to 1. [3] + """ + self.image_size = image_size + self.output_size = output_size + + self.y_dim = y_dim + self.z_dim = z_dim + + self.gf_dim = gf_dim + self.df_dim = df_dim + + self.gfc_dim = gfc_dim + self.dfc_dim = dfc_dim + + self.c_dim = c_dim + + self.batch_size = tf.shape(self.x)[0] + + # batch normalization : deals with poor initialization helps gradient flow + self.d_bn1 = batch_norm(name='d_bn1') + self.d_bn2 = batch_norm(name='d_bn2') + + self.g_bn0 = batch_norm(name='g_bn0') + self.g_bn1 = batch_norm(name='g_bn1') + self.g_bn2 = batch_norm(name='g_bn2') + + self.build_model() + + def build_model(self): + """Create the main ops""" + + if self.is_inference: + # HACK: we are hard-coding class 3 during inference + # TODO: find way to pass this from UI + self.y = tf.to_int32(3*tf.ones(shape=[self.batch_size])) + + # create both the generator and the discriminator/encoder + # self.x is a batch of images - shape: [N, H, W, C] + # self.y is a vector of labels - shape: [N] + + # rescale to [0,1] range + x_reshaped = tf.reshape(self.x, shape=[self.batch_size, self.image_size, self.image_size, self.c_dim], name='x_reshaped') + self.images = x_reshaped / 255. 
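+        # (pixels now lie in [0, 1], the same range as the sigmoid output of
+        # the generator that the L2 loss below compares against)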
+ + # one-hot encode y - shape: [N] -> [N, self.y_dim] + self.y = tf.one_hot(self.y, self.y_dim, name='y_onehot') + + # create discriminator/encoder + self.DzGEN, self.D_logits = self.discriminator(self.images, self.y, reuse=False) + + # create generator + self.G = self.generator(self.DzGEN, self.y) + + # we only have one loss function here (L2 distance between input image and generator output) + self.dzgen_loss = tf.reduce_mean(tf.square(self.G - self.images), name="loss_DzGEN") + + # debug + self.summaries.append(image_summary("G", self.G, max_outputs=5)) + self.summaries.append(image_summary("X", self.images, max_outputs=5)) + self.summaries.append(histogram_summary("G_hist", self.G)) + self.summaries.append(histogram_summary("X_hist", self.images)) + self.summaries.append(scalar_summary("DzGen_loss", self.dzgen_loss)) + + # all trainable variables + t_vars = tf.trainable_variables() + # D variables + self.d_vars = [var for var in t_vars if 'd_' in var.name] + + def discriminator(self, image, y=None, reuse=False): + """ + Create the discriminator/encoder + + This creates a string of layers: + - input - [N, 28, 28, 1] + - concat conditioning - [N, 28, 28, 11] + - conv layer with 11 5x5 kernels and 2x2 stride - [N, 14, 14, 11] + - leaky relu - [N, 14, 14, 11] + - concat conditioning - [N, 14, 14, 21] + - conv layer with 74 5x5 kernels and 2x2 stride - [N, 7, 7, 74] + - batch norm - [N, 14, 14, 64] + - leaky relu - [N, 14, 14, 64] + - flatten - [N, 3626] + - concat conditioning - [N, 3636] + - linear layer with 1014 output neurons - [N, 1024] + - batch norm - [N, 1024] + - leaky relu - [N, 1024] + - concat conditioning - [N, 1034] + - linear layer with 1 output neuron - [N, z_dim] + + Args: + image: batch of input images - shape: [N, H, W, C] + y: batch of one-hot encoded labels - shape: [N, K] + reuse: whether to re-use previously created variables + """ + + # NOTE: although we are really creating an encoder here we need to re-use the same + # variable scope (i.e. 
"discriminator") as in the original GAN so we can re-use + # learned parameters + with tf.variable_scope("discriminator") as scope: + if reuse: + # re-use (share) variables + scope.reuse_variables() + + yb = tf.reshape(y, [self.batch_size, 1, 1, self.y_dim]) + x = conv_cond_concat(image, yb) + + h0 = lrelu(conv2d(x, self.c_dim + self.y_dim, name='d_h0_conv')) + h0 = conv_cond_concat(h0, yb) + + h1 = lrelu(self.d_bn1(conv2d(h0, self.df_dim + self.y_dim, name='d_h1_conv'), train=self.is_training)) + sz = h1.get_shape() + h1 = tf.reshape(h1, [self.batch_size, int(sz[1] * sz[2] * sz[3])]) + h1 = tf.concat(1, [h1, y]) + + h2 = lrelu(self.d_bn2(linear(h1, self.dfc_dim, 'd_h2_lin'), train=self.is_training)) + h2 = tf.concat(1, [h2, y]) + + h3 = linear(h2, self.z_dim, 'd_h3_lin_retrain') + return h3, h3 + + + def generator(self, z, y=None): + """ + Create the generator + + This creates a string of layers: + - input - [N, 100] + - concatenate conditioning - [N, 110] + - linear layer with 1024 output neurons - [N, 1024] + - batch norm - [N, 1024] + - relu - [N, 1024] + - concatenate conditioning - [N, 1034] + - linear layer with 7*7*128=6272 output neurons - [N, 6272] + - reshape 7x7 feature maps - [N, 7, 7, 128] + - concatenate conditioning - [N, 7, 7, 138] + - transpose convolution with 128 filters and stride 2 - [N, 14, 14, 128] + - batch norm - [N, 14, 14, 128] + - relu - [N, 14, 14, 128] + - concatenate conditioing - [N, 14, 14, 138] + - transpose convolution with 1 filter and stride 2 - [N, 28, 28, 1] + """ + with tf.variable_scope("generator") as scope: + s = self.output_size + s2, s4 = int(s/2), int(s/4) + + # yb = tf.expand_dims(tf.expand_dims(y, 1),2) + yb = tf.reshape(y, [self.batch_size, 1, 1, self.y_dim]) + z = tf.concat(1, [z, y]) + + h0 = tf.nn.relu(self.g_bn0(linear(z, self.gfc_dim, 'g_h0_lin'), train=False)) + h0 = tf.concat(1, [h0, y]) + + h1 = tf.nn.relu(self.g_bn1(linear(h0, self.gf_dim*2*s4*s4, 'g_h1_lin'), train=False)) + h1 = tf.reshape(h1, [self.batch_size, s4, s4, self.gf_dim * 2]) + + h1 = conv_cond_concat(h1, yb) + + h2 = tf.nn.relu(self.g_bn2(deconv2d(h1, [self.batch_size, s2, s2, self.gf_dim * 2], name='g_h2'), train=False)) + h2 = conv_cond_concat(h2, yb) + + return tf.nn.sigmoid(deconv2d(h2, [self.batch_size, s, s, self.c_dim], name='g_h3')) diff --git a/examples/gan/network-mnist.py b/examples/gan/network-mnist.py new file mode 100644 index 000000000..458ae6acc --- /dev/null +++ b/examples/gan/network-mnist.py @@ -0,0 +1,464 @@ +# The MIT License (MIT) +# +# Original work Copyright (c) 2016 Taehoon Kim +# Modified work Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: +# +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. +# +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import math +import numpy as np +import tensorflow as tf + +from tensorflow.python.framework import ops + +image_summary = tf.summary.image +scalar_summary = tf.summary.scalar +histogram_summary = tf.summary.histogram +merge_summary = tf.summary.merge +SummaryWriter = tf.summary.FileWriter + + +class batch_norm(object): + """ + This class creates an op that composes the specified tensor with a batch + normalization layer. + """ + + def __init__(self, epsilon=1e-5, momentum=0.9, name="batch_norm"): + """Instance initialization""" + with tf.variable_scope(name): + self.epsilon = epsilon + self.momentum = momentum + self.name = name + + def __call__(self, x, train=True): + """ + Functional interface + + Args: + x: tensor to compose + train: set to True during training and False otherwise + """ + return tf.contrib.layers.batch_norm(x, + decay=self.momentum, + updates_collections=None, + epsilon=self.epsilon, + scale=True, + is_training=train, + scope=self.name) + + +def conv_cond_concat(x, y): + """ + Concatenate conditioning matrix across channel axis. + + The specified input tensor is concatenated with K feature maps (K = number of classes) + across the channel dimension. Each of the K feature maps is set to all-zeros except for + the one whose index matches the target class (which is set to all-ones). + + Args: + x: non-conditioned tensor. Shape: [N, H, W, C] + y: one-hot encoded conditioning matrix. Shape: [N, K] + + Returns: + conditioned feature map. Shape: [N, H, W, C + K] + """ + x_shapes = x.get_shape() + y_shapes = y.get_shape() + batch_size = tf.shape(x)[0] + return tf.concat(3, [x, y * tf.ones([batch_size, int(x_shapes[1]), int(x_shapes[2]), int(y_shapes[3])])]) + + +def conv2d(input_, output_dim, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="conv2d"): + """ + Compose specified symbol with 2D convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_dim: number of output features maps + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. + """ + with tf.variable_scope(name): + w = tf.get_variable('w', [k_h, k_w, input_.get_shape()[-1], output_dim], + initializer=tf.truncated_normal_initializer(stddev=stddev)) + conv = tf.nn.conv2d(input_, w, strides=[1, d_h, d_w, 1], padding='SAME') + + biases = tf.get_variable('biases', [output_dim], initializer=tf.constant_initializer(0.0)) + conv = tf.nn.bias_add(conv, biases) + + return conv + + +def deconv2d(input_, output_shape, + k_h=5, k_w=5, d_h=2, d_w=2, stddev=0.02, + name="deconv2d", with_w=False): + """ + Compose specified symbol with 2D *transpose* convolution layer + + Args: + input_: tensor to compose. Shape: [N, H, W, C] + output_shape: output shape + k_h: kernel height + k_w: kernel width + d_h: horizontal stride + d_w: vertical stride + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + + Returns: + Composed tensor. 
+ """ + with tf.variable_scope(name): + # filter : [height, width, output_channels, in_channels] + w = tf.get_variable('w', + [k_h, k_w, output_shape[-1], + input_.get_shape()[-1]], + initializer=tf.random_normal_initializer(stddev=stddev)) + deconv = tf.nn.conv2d_transpose(input_, w, + output_shape=output_shape, + strides=[1, d_h, d_w, 1]) + + biases = tf.get_variable('biases', [output_shape[-1]], initializer=tf.constant_initializer(0.0)) + deconv = tf.reshape(tf.nn.bias_add(deconv, biases), output_shape) + + if with_w: + return deconv, w, biases + else: + return deconv + + +def lrelu(x, leak=0.2, name="lrelu"): + """Compose specified tensor with leaky Rectifier Linear Unit""" + return tf.maximum(x, leak*x) + + +def linear(input_, output_size, scope=None, stddev=0.02, bias_start=0.0, with_w=False): + """ + Compose specified tensor with linear (fully-connected) layer + + Args: + input_: tensor to compose. Shape: [N, M] + output_size: number of output neurons + scope: name scope + stddev: standard deviation of gaussian distribution to use for random weight initialization + name: name scope + with_w: whether to also return parameter variables + + Returns: + Composed tensor. Shape: [N, output_size] + """ + shape = input_.get_shape().as_list() + + with tf.variable_scope(scope or "Linear"): + matrix = tf.get_variable("Matrix", [shape[1], output_size], tf.float32, + tf.random_normal_initializer(stddev=stddev)) + bias = tf.get_variable("bias", [output_size], + initializer=tf.constant_initializer(bias_start)) + if with_w: + return tf.matmul(input_, matrix) + bias, matrix, bias + else: + return tf.matmul(input_, matrix) + bias + + +class UserModel(Tower): + """ + User Model definition + + DIGITS creates an instance of this class for every tower it needs + to create. This includes: + - one for training, + - one for validation, + - one for testing. + + In the case of multi-GPU training, one training instance is created + for every GPU. DIGITS takes care of doing the gradient averaging + across GPUs so this class only needs to define the inference op + and desired loss/cost function. + """ + + def __init__(self, *args, **kwargs): + """ + Identify the correct input nodes. + + In the parent class, DIGITS conveniently sets the following fields: + - self.is_training: whether this is a training graph + - self.is_inference: whether this graph is created for inference/testing + - self.x: input node. Shape: [N, H, W, C] + - self.y: label. Shape: [N] for scalar labels, [N, H, W, C] otherwise. + Only defined if self._is_training is True + """ + super(UserModel, self).__init__(*args, **kwargs) + + # initialize graph with parameters for MNIST + self.dcgan_init(image_size=28, + y_dim=10, + output_size=28, + c_dim=1, + ) + + @model_property + def inference(self): + """op to use for inference""" + + # inference op is the output of the generator after rescaling + # to the 8-bit range + return tf.to_int32(self.G * 255) + + @model_property + def loss(self): + """ + Loss function + + Returns either an op or a list of dicts. + If the returned value is an op then DIGITS will optimize against this op + with respect to all trainable variables. + If the returned value is a list then DIGITS will optimize against each + loss in the list with respect to the specified variables. + """ + + # here we are returning a list because we want to alternately optimize the + # discriminator on real samples, the discriminator on fake samples and the + # generator. 
+ losses = [ + {'loss': self.d_loss_real, 'vars': self.d_vars}, + {'loss': self.d_loss_fake, 'vars': self.d_vars}, + {'loss': self.g_loss, 'vars': self.g_vars} + ] + return losses + + def dcgan_init(self, image_size=108, + output_size=64, y_dim=None, z_dim=100, gf_dim=64, df_dim=64, + gfc_dim=1024, dfc_dim=1024, c_dim=3): + """ + Create the model + + Args: + image_size: (optional) Size of the input images in pixels. [108] + output_size: (optional) The resolution in pixels of the images. [64] + y_dim: (optional) Dimension of the condition vector y. [None] + z_dim: (optional) Dimension of the latent vector z. [100] + gf_dim: (optional) Dimension of gen filters in first conv layer. [64] + df_dim: (optional) Dimension of discrim filters in first conv layer. [64] + gfc_dim: (optional) Dimension of gen units for fully connected layer. [1024] + dfc_dim: (optional) Dimension of discrim units for fully connected layer. [1024] + c_dim: (optional) Dimension of image color. For grayscale input, set to 1. [3] + """ + self.image_size = image_size + self.output_size = output_size + + self.y_dim = y_dim + self.z_dim = z_dim + + self.gf_dim = gf_dim + self.df_dim = df_dim + + self.gfc_dim = gfc_dim + self.dfc_dim = dfc_dim + + self.c_dim = c_dim + + self.batch_size = tf.shape(self.x)[0] + + # batch normalization: deals with poor initialization and helps gradient flow + self.d_bn1 = batch_norm(name='d_bn1') + self.d_bn2 = batch_norm(name='d_bn2') + + self.g_bn0 = batch_norm(name='g_bn0') + self.g_bn1 = batch_norm(name='g_bn1') + self.g_bn2 = batch_norm(name='g_bn2') + + self.build_model() + + def build_model(self): + """Create the main ops""" + + if not self.is_inference: + # create both the generator and the discriminator + # self.x is a batch of images - shape: [N, H, W, C] + # self.y is a vector of labels - shape: [N] + + # sample z from a normal distribution + self.z = tf.random_normal(shape=[self.batch_size, self.z_dim], dtype=tf.float32, seed=None, name='z') + + # rescale x to [0, 1] + x_reshaped = tf.reshape(self.x, shape=[self.batch_size, self.image_size, self.image_size, self.c_dim], name='x_reshaped') + self.images = x_reshaped / 255. + + # one hot encode the label - shape: [N] -> [N, self.y_dim] + self.y = tf.one_hot(self.y, self.y_dim, name='y_onehot') + + # create the generator + self.G = self.generator(self.z, self.y) + + # create one instance of the discriminator for real images (the input is + # images from the dataset) + self.D, self.D_logits = self.discriminator(self.images, self.y, reuse=False) + + # create another instance of the discriminator for fake images (the input is + # the output of the generator). Note how we are reusing variables to share weights between + # both instances of the discriminator + self.D_, self.D_logits_ = self.discriminator(self.G, self.y, reuse=True) + + # aggregate losses across batch + + # we are using the cross entropy loss for all these losses + self.d_loss_real = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(self.D_logits, tf.ones_like(self.D), name="loss_D_real")) + self.d_loss_fake = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(self.D_logits_, tf.zeros_like(self.D_), name="loss_D_fake")) + self.d_loss = (self.d_loss_real + self.d_loss_fake) / 2.
+ # the typical GAN set-up is that of a minimax game where D is trying to minimize its own error and G is trying to maximize D's error + # however, note how we are flipping G's labels here: instead of maximizing D's error, we are minimizing D's error on the 'wrong' label + # this trick helps produce a stronger gradient + self.g_loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(self.D_logits_, tf.ones_like(self.D_), name="loss_G")) + + # create some summaries for debug and monitoring + self.summaries.append(histogram_summary("z", self.z)) + self.summaries.append(histogram_summary("d", self.D)) + self.summaries.append(histogram_summary("d_", self.D_)) + self.summaries.append(image_summary("G", self.G, max_outputs=5)) + self.summaries.append(image_summary("X", self.images, max_outputs=5)) + self.summaries.append(histogram_summary("G_hist", self.G)) + self.summaries.append(histogram_summary("X_hist", self.images)) + self.summaries.append(scalar_summary("d_loss_real", self.d_loss_real)) + self.summaries.append(scalar_summary("d_loss_fake", self.d_loss_fake)) + self.summaries.append(scalar_summary("g_loss", self.g_loss)) + self.summaries.append(scalar_summary("d_loss", self.d_loss)) + + # all trainable variables + t_vars = tf.trainable_variables() + # G's variables + self.g_vars = [var for var in t_vars if 'g_' in var.name] + # D's variables + self.d_vars = [var for var in t_vars if 'd_' in var.name] + + # Extra hook for debug: log chi-square distance between G's output histogram and the dataset's histogram + value_range = [0.0, 1.0] + nbins = 100 + hist_g = tf.histogram_fixed_width(self.G, value_range, nbins=nbins, dtype=tf.float32) / nbins + hist_images = tf.histogram_fixed_width(self.images, value_range, nbins=nbins, dtype=tf.float32) / nbins + chi_square = tf.reduce_mean(tf.div(tf.square(hist_g - hist_images), hist_g + hist_images)) + self.summaries.append(scalar_summary("chi_square", chi_square)) + else: + # Create only the generator + + # self.x is the conditioned latent representation - shape: [self.batch_size, 1, self.z_dim + self.y_dim] + self.x = tf.reshape(self.x, shape=[self.batch_size, self.z_dim + self.y_dim]) + # extract z and y + self.y = self.x[:, self.z_dim:self.z_dim + self.y_dim] + self.z = self.x[:, :self.z_dim] + # create an instance of the generator + self.G = self.generator(self.z, self.y) + + def discriminator(self, image, y=None, reuse=False): + """ + Create the discriminator + + This creates a string of layers: + - input - [N, 28, 28, 1] + - concat conditioning - [N, 28, 28, 11] + - conv layer with 11 5x5 kernels and 2x2 stride - [N, 14, 14, 11] + - leaky relu - [N, 14, 14, 11] + - concat conditioning - [N, 14, 14, 21] + - conv layer with 74 5x5 kernels and 2x2 stride - [N, 7, 7, 74] + - batch norm - [N, 7, 7, 74] + - leaky relu - [N, 7, 7, 74] + - flatten - [N, 3626] + - concat conditioning - [N, 3636] + - linear layer with 1024 output neurons - [N, 1024] + - batch norm - [N, 1024] + - leaky relu - [N, 1024] + - concat conditioning - [N, 1034] + - linear layer with 1 output neuron - [N, 1] + + Args: + image: batch of input images - shape: [N, H, W, C] + y: batch of one-hot encoded labels - shape: [N, K] + reuse: whether to re-use previously created variables + """ + with tf.variable_scope("discriminator") as scope: + if reuse: + # re-use (share) variables + scope.reuse_variables() + + yb = tf.reshape(y, [self.batch_size, 1, 1, self.y_dim]) + x = conv_cond_concat(image, yb) + + h0 = lrelu(conv2d(x, self.c_dim + self.y_dim, name='d_h0_conv')) + h0 =
conv_cond_concat(h0, yb) + + h1 = lrelu(self.d_bn1(conv2d(h0, self.df_dim + self.y_dim, name='d_h1_conv'), train=self.is_training)) + sz = h1.get_shape() + h1 = tf.reshape(h1, [self.batch_size, int(sz[1] * sz[2] * sz[3])]) + h1 = tf.concat(1, [h1, y]) + + h2 = lrelu(self.d_bn2(linear(h1, self.dfc_dim, 'd_h2_lin'), train=self.is_training)) + h2 = tf.concat(1, [h2, y]) + + h3 = linear(h2, 1, 'd_h3_lin') + + return tf.nn.sigmoid(h3), h3 + + def generator(self, z, y=None): + """ + Create the generator + + This creates a string of layers: + - input - [N, 100] + - concatenate conditioning - [N, 110] + - linear layer with 1024 output neurons - [N, 1024] + - batch norm - [N, 1024] + - relu - [N, 1024] + - concatenate conditioning - [N, 1034] + - linear layer with 7*7*128=6272 output neurons - [N, 6272] + - reshape 7x7 feature maps - [N, 7, 7, 128] + - concatenate conditioning - [N, 7, 7, 138] + - transpose convolution with 128 filters and stride 2 - [N, 14, 14, 128] + - batch norm - [N, 14, 14, 128] + - relu - [N, 14, 14, 128] + - concatenate conditioing - [N, 14, 14, 138] + - transpose convolution with 1 filter and stride 2 - [N, 28, 28, 1] + """ + with tf.variable_scope("generator") as scope: + + s = self.output_size + s2, s4 = int(s/2), int(s/4) + + yb = tf.reshape(y, [self.batch_size, 1, 1, self.y_dim]) + z = tf.concat(1, [z, y]) + + h0 = tf.nn.relu(self.g_bn0(linear(z, self.gfc_dim, 'g_h0_lin'), train=self.is_training)) + h0 = tf.concat(1, [h0, y]) + + h1 = tf.nn.relu(self.g_bn1(linear(h0, self.gf_dim*2*s4*s4, 'g_h1_lin'), train=self.is_training)) + h1 = tf.reshape(h1, [self.batch_size, s4, s4, self.gf_dim * 2]) + + h1 = conv_cond_concat(h1, yb) + + h2 = tf.nn.relu(self.g_bn2(deconv2d(h1, [self.batch_size, s2, s2, self.gf_dim * 2], name='g_h2'), train=self.is_training)) + h2 = conv_cond_concat(h2, yb) + + return tf.nn.sigmoid(deconv2d(h2, [self.batch_size, s, s, self.c_dim], name='g_h3')) diff --git a/examples/question-answering/memn2n.py b/examples/question-answering/memn2n.py new file mode 100644 index 000000000..914afecfe --- /dev/null +++ b/examples/question-answering/memn2n.py @@ -0,0 +1,134 @@ +class UserModel(Tower): + + @model_property + def inference(self): + + def position_encoding(sentence_size, embedding_size): + """ + Position Encoding described in section 4.1 [1] + """ + encoding = np.ones((embedding_size, sentence_size), dtype=np.float32) + ls = sentence_size+1 + le = embedding_size+1 + for i in range(1, le): + for j in range(1, ls): + encoding[i-1, j-1] = (i - (le-1)/2) * (j - (ls-1)/2) + encoding = 1 + 4 * encoding / embedding_size / sentence_size + return np.transpose(encoding) + + def memn2n(x, embeddings, weights, encoding, hops): + """ + Create model + """ + + with tf.variable_scope("memn2n"): + # x has shape [batch_size, story_size, sentence_size, 2] + # unpack along last dimension to extract stories and questions + stories, questions = tf.unpack(x, axis=3) + + self.summaries.append(tf.histogram_summary("stories_hist", stories)) + self.summaries.append(tf.histogram_summary("questions_hist", questions)) + + # assume single sentence in question + questions = questions[:, 0, :] + + self.summaries.append(tf.histogram_summary("question_hist", questions)) + + q_emb = tf.nn.embedding_lookup(embeddings['B'], questions, name='q_emb') + u_0 = tf.reduce_sum(q_emb * encoding, 1) + u = [u_0] + for _ in xrange(hops): + m_emb = tf.nn.embedding_lookup(embeddings['A'], stories, name='m_emb') + m = tf.reduce_sum(m_emb * encoding, 2) + weights['TA'] + # hack to get around no reduce_dot + 
u_temp = tf.transpose(tf.expand_dims(u[-1], -1), [0, 2, 1]) + dotted = tf.reduce_sum(m * u_temp, 2) + + # Calculate probabilities + probs = tf.nn.softmax(dotted) + + probs_temp = tf.transpose(tf.expand_dims(probs, -1), [0, 2, 1]) + c_temp = tf.transpose(m, [0, 2, 1]) + o_k = tf.reduce_sum(c_temp * probs_temp, 2) + + u_k = tf.matmul(u[-1], weights['H']) + o_k + + if self.is_training: + u_k = tf.nn.dropout(u_k, 0.75) + + u.append(u_k) + + o = tf.matmul(u_k, weights['W']) + if self.is_training: + o = tf.nn.dropout(o, 0.75) + return o + + # configuration + sentence_size = self.input_shape[1] + story_size = self.input_shape[0] + embedding_size = 25 + hops = 3 + dict_size = 40 + encoding = tf.constant(position_encoding(sentence_size, embedding_size), name="encoding") + x = tf.to_int32(tf.reshape(self.x, shape=[-1, story_size, sentence_size, 2]), name='x_int') + + # model parameters + initializer = tf.random_normal_initializer(stddev=0.1) + embeddings = { + 'A': tf.get_variable('A', [dict_size, embedding_size], initializer=initializer), + 'B': tf.get_variable('B', [dict_size, embedding_size], initializer=initializer), + } + weights = { + 'TA': tf.get_variable('TA', [story_size, embedding_size], initializer=initializer), + 'H': tf.get_variable('H', [embedding_size, embedding_size], initializer=initializer), + 'W': tf.get_variable('W', [embedding_size, dict_size], initializer=initializer), + } + + self._nil_vars = [embeddings['A'].name, embeddings['B'].name] + + self.summaries.append(tf.histogram_summary("A_hist", embeddings['A'])) + self.summaries.append(tf.histogram_summary("B_hist", embeddings['B'])) + self.summaries.append(tf.histogram_summary("TA_hist", weights['TA'])) + self.summaries.append(tf.histogram_summary("H_hist", weights['H'])) + self.summaries.append(tf.histogram_summary("W_hist", weights['W'])) + self.summaries.append(tf.histogram_summary("X_hist", x)) + + # create model + model = memn2n(x, embeddings, weights, encoding, hops) + + return model + + @model_property + def loss(self): + # label has shape [batch_size, 1, story_size, sentence_size] + # assume single-word labels + y = tf.to_int64(self.y[:, 0, 0, 0], name='y_int') + self.summaries.append(tf.histogram_summary("Y_hist", y)) + loss = digits.classification_loss(self.inference, y) + accuracy = digits.classification_accuracy(self.inference, y) + self.summaries.append(tf.scalar_summary(accuracy.op.name, accuracy)) + return loss + + def gradientUpdate(self, grads_and_vars): + def add_gradient_noise(t, stddev=1e-3, name=None): + t = tf.convert_to_tensor(t, name="t") + gn = tf.random_normal(tf.shape(t), stddev=stddev) + return tf.add(t, gn, name=name) + def zero_nil_slot(t, name=None): + t = tf.convert_to_tensor(t, name="t") + s = tf.shape(t)[1] + z = tf.zeros(tf.pack([1, s])) + return tf.concat(0, [z, tf.slice(t, [1, 0], [-1, -1])], name=name) + max_grad_norm=40.0 + grads_and_vars = [(tf.clip_by_norm(g, max_grad_norm), v) for g,v in grads_and_vars] + grads_and_vars = [(add_gradient_noise(g), v) for g,v in grads_and_vars] + nil_grads_and_vars = [] + for g, v in grads_and_vars: + if v.name in self._nil_vars: + print("grad zero nil slot") + g = zero_nil_slot(g) + g = tf.Print(g, [g], message="This is g: ", first_n=10, summarize=100) + nil_grads_and_vars.append((g, v)) + else: + nil_grads_and_vars.append((g, v)) + return nil_grads_and_vars diff --git a/plugins/data/bAbI/MANIFEST.in b/plugins/data/bAbI/MANIFEST.in new file mode 100644 index 000000000..28ff74ce9 --- /dev/null +++ b/plugins/data/bAbI/MANIFEST.in @@ -0,0 +1 @@ 
+recursive-include digitsDataPluginBAbI *.html diff --git a/plugins/data/bAbI/README b/plugins/data/bAbI/README new file mode 100644 index 000000000..bb61cde0d --- /dev/null +++ b/plugins/data/bAbI/README @@ -0,0 +1,2 @@ +This DIGITS plug-in demonstrates how to load data from the bAbI dataset. +The dataset may be found at https://research.facebook.com/research/babi/ diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/__init__.py b/plugins/data/bAbI/digitsDataPluginBAbI/__init__.py new file mode 100644 index 000000000..79071170e --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/__init__.py @@ -0,0 +1,6 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +from .data import DataIngestion + +__all__ = ['DataIngestion'] diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/data.py b/plugins/data/bAbI/digitsDataPluginBAbI/data.py new file mode 100644 index 000000000..0ba2a2813 --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/data.py @@ -0,0 +1,113 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +import os + +from digits.utils import subclass, override, constants +from digits.extensions.data.interface import DataIngestionInterface +from .forms import DatasetForm, InferenceForm +from . import utils + + +DATASET_TEMPLATE = "templates/dataset_template.html" +INFERENCE_TEMPLATE = "templates/inference_template.html" + + +@subclass +class DataIngestion(DataIngestionInterface): + """ + A data ingestion extension for the bAbI dataset + """ + + def __init__(self, is_inference_db=False, **kwargs): + super(DataIngestion, self).__init__(**kwargs) + + self.userdata['is_inference_db'] = is_inference_db + + if 'train_text_data' not in self.userdata: + # get task ID + try: + task_id = int(self.task_id) + except: + task_id = None + self.userdata['task_id'] = task_id + + # get data - this doesn't scale well to huge datasets but this makes it + # straightforward to create a mapping of words to indices and figure out max + # dimensions of stories and sentences + self.userdata['train_text_data'] = utils.parse_folder_phase( + self.story_folder, task_id, train=True) + self.userdata['stats'] = utils.get_stats(self.userdata['train_text_data']) + + @override + def encode_entry(self, entry): + stats = self.userdata['stats'] + return utils.encode_sample(entry, stats['word_map'], stats['sentence_size'], stats['story_size']) + + @staticmethod + @override + def get_category(): + return "Text" + + @staticmethod + @override + def get_id(): + return "text-babi" + + @staticmethod + @override + def get_dataset_form(): + return DatasetForm() + + @staticmethod + @override + def get_dataset_template(form): + """ + parameters: + - form: form returned by get_dataset_form(). This may be populated + with values if the job was cloned + return: + - (template, context) tuple + - template is a Jinja template to use for rendering dataset creation + options + - context is a dictionary of context variables to use for rendering + the form + """ + extension_dir = os.path.dirname(os.path.abspath(__file__)) + template = open(os.path.join(extension_dir, DATASET_TEMPLATE), "r").read() + context = {'form': form} + return (template, context) + + @override + def get_inference_form(self): + return InferenceForm() + + @staticmethod + @override + def get_inference_template(form): + extension_dir = os.path.dirname(os.path.abspath(__file__)) + template = open(os.path.join(extension_dir, INFERENCE_TEMPLATE), "r").read() + context = {'form': form} + return (template, context) + + @staticmethod + @override + def get_title(): + return "bAbI" + + @override + def itemize_entries(self, stage): + entries = [] + if not self.userdata['is_inference_db']: + data = self.userdata['train_text_data'] + n_val_entries = int(len(data)*self.pct_val/100) + if stage == constants.TRAIN_DB: + entries = data[n_val_entries:] + elif stage == constants.VAL_DB: + entries = data[:n_val_entries] + elif stage == constants.TEST_DB: + if not bool(self.snippet): + raise ValueError("You must write a story and a question") + entries = utils.parse_lines(str(self.snippet).splitlines()) + + return entries diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/forms.py b/plugins/data/bAbI/digitsDataPluginBAbI/forms.py new file mode 100644 index 000000000..90f66b745 --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/forms.py @@ -0,0 +1,99 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +import os + +from digits import utils +from digits.utils import subclass +from flask.ext.wtf import Form +from wtforms import validators + + +@subclass +class DatasetForm(Form): + """ + A form used to create a bAbI dataset + """ + + def validate_folder_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) or not os.path.isdir(field.data): + raise validators.ValidationError( + 'Folder does not exist or is not reachable') + else: + return True + + story_folder = utils.forms.StringField( + u'Story folder', + validators=[ + validators.DataRequired(), + validate_folder_path, + ], + tooltip="Specify the path to a folder of stories - filenames are " + "expected to have this format: qa[1-N]*[train|test].txt" + ) + + task_id = utils.forms.SelectField( + 'Task ID', + choices=[ + ('all', 'All'), + ('1', '1'), + ('2', '2'), + ('3', '3'), + ('4', '4'), + ('5', '5'), + ('6', '6'), + ('7', '7'), + ('8', '8'), + ('9', '9'), + ('10', '10'), + ('11', '11'), + ('12', '12'), + ('13', '13'), + ('14', '14'), + ('15', '15'), + ('16', '16'), + ('17', '17'), + ('18', '18'), + ('19', '19'), + ('20', '20'), + ], + default='1', + tooltip="Select a task to train on or 'all' to train a joint model " + "on all tasks." + ) + + pct_val = utils.forms.IntegerField( + u'% for validation', + default=10, + validators=[ + validators.NumberRange(min=0, max=100) + ], + tooltip="You can choose to set apart a certain percentage of the " + "training samples for the validation set."
+ ) + + +@subclass +class InferenceForm(Form): + + def validate_file_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) and not os.path.isdir(field.data): + raise validators.ValidationError( + 'File does not exist or is not reachable') + else: + return True + """ + A form used to perform inference on a text classification dataset + """ + snippet = utils.forms.TextAreaField( + u'Story/Question', + tooltip="Write all sentences there and end with a question" + ) diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/templates/dataset_template.html b/plugins/data/bAbI/digitsDataPluginBAbI/templates/dataset_template.html new file mode 100644 index 000000000..529dadbde --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/templates/dataset_template.html @@ -0,0 +1,23 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +
+ {{ form.story_folder.label }} + {{ form.story_folder.tooltip }} + {{ form.story_folder(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.task_id.label }} + {{ form.task_id.tooltip }} + {{ form.task_id(class='form-control') }} +
+ +
+ {{ form.pct_val.label }} + {{ form.pct_val.tooltip }} + {{ form.pct_val(class='form-control') }} +
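The three fields above map one-to-one onto the DatasetForm fields in forms.py, and the validation percentage is applied in DataIngestion.itemize_entries by slicing the parsed sample list. A minimal sketch of that split, with illustrative stand-in values rather than the plug-in's own objects:

# mirrors the split in digitsDataPluginBAbI/data.py (itemize_entries)
data = list(range(1000))   # stand-in for the parsed bAbI samples
pct_val = 10               # value of the '% for validation' field
n_val_entries = int(len(data) * pct_val / 100)
val_entries = data[:n_val_entries]      # first 10% feed the validation DB
train_entries = data[n_val_entries:]    # remaining 90% feed the training DB
assert len(val_entries) == 100 and len(train_entries) == 900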
diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/templates/inference_template.html b/plugins/data/bAbI/digitsDataPluginBAbI/templates/inference_template.html new file mode 100644 index 000000000..37761c76a --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/templates/inference_template.html @@ -0,0 +1,18 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +
+
+

Test a story/question

+
+
+ {{ form.snippet.label }} + {{ form.snippet.tooltip }} + {{ form.snippet(class='form-control', placeholder='image file') }} +
+
+
+
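The Story/Question text area above is handed to utils.parse_lines, so it should follow the plain bAbI layout: numbered statements followed by a line containing a question mark. A minimal sketch, assuming the plug-in package is importable as digitsDataPluginBAbI:

from digitsDataPluginBAbI import utils

snippet = "\n".join([
    "1 Mary moved to the bathroom.",
    "2 John went to the hallway.",
    "3 Where is Mary?",
])
samples = utils.parse_lines(snippet.splitlines())
# one sample is produced, roughly:
# {'story': [['mary', 'moved', 'to', 'the', 'bathroom'],
#            ['john', 'went', 'to', 'the', 'hallway']],
#  'question': [['where', 'is', 'mary']],
#  'answer': [[]]}   # empty because inference snippets carry no answer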
diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/templates/template.html b/plugins/data/bAbI/digitsDataPluginBAbI/templates/template.html new file mode 100644 index 000000000..2b8cf6067 --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/templates/template.html @@ -0,0 +1,37 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +{{ form.data_stage(class='form-control') }} + +
+ {{ form.train_data_file.label }} + {{ form.train_data_file.tooltip }} + {{ form.train_data_file(class='form-control autocomplete_path', placeholder='.csv file') }} +
+ +
+ {{ form.val_data_file.label }} + {{ form.val_data_file.tooltip }} + {{ form.val_data_file(class='form-control autocomplete_path', placeholder='.csv file') }} +
+ +
+ {{ form.alphabet.label }} + {{ form.alphabet.tooltip }} + {{ form.alphabet(class='form-control') }} +
+ +
+ {{ form.class_labels_file.label }} + {{ form.class_labels_file.tooltip }} + {{ form.class_labels_file(class='form-control autocomplete_path', placeholder='.txt file') }} +
+ +
+ {{ form.max_chars_per_sample.label }} + {{ form.max_chars_per_sample.tooltip }} + {{ form.max_chars_per_sample(class='form-control') }} +
diff --git a/plugins/data/bAbI/digitsDataPluginBAbI/utils.py b/plugins/data/bAbI/digitsDataPluginBAbI/utils.py new file mode 100644 index 000000000..08783c4a1 --- /dev/null +++ b/plugins/data/bAbI/digitsDataPluginBAbI/utils.py @@ -0,0 +1,143 @@ + +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +import copy +import os +import string + +import numpy as np + + +def encode_field(field, word_map, sentence_size, story_size): + """ + return a 2-D array with shape (story_size, sentence_size) + """ + x = np.zeros((story_size, sentence_size)) + for i, sentence in enumerate(field): + if i >= story_size: + raise ValueError("Field '%s' is longer than max (%d)" % + (field, story_size)) + for j, word in enumerate(sentence): + if j >= sentence_size: + raise ValueError("Sentence '%s' is longer than max (%d)" % + (field, sentence_size)) + try: + idx = word_map[word] + except: + # assign to last index + idx = len(word_map) + 1 + x[i, j] = idx + return x + + +def encode_sample(sample, word_map, sentence_size, story_size): + """ + return an encoded (feature, label) tuple + """ + story = encode_field(sample['story'], word_map, sentence_size, story_size) + question = encode_field(sample['question'], word_map, sentence_size, story_size) + answer = encode_field(sample['answer'], word_map, sentence_size, story_size) + + feature = np.zeros((2, story_size, sentence_size)) + feature[0] = story + feature[1] = question + + label = answer[np.newaxis, :] + + return feature, label + + +def find_files(path, task_id, train): + """ + Find files in specified path with filenames that + match {task}*{phase}.txt where: + task="qa{task_id}_" or "" if task_id==None + phase="train" if train==True or "test" otherwise + """ + task = "qa{}_".format(task_id) if task_id else "" + phase = "train" if train else "test" + + files = [] + for dirpath, dirnames, filenames in os.walk(path, followlinks=True): + for filename in filenames: + if task in filename and phase in filename: + files.append(os.path.join(dirpath, filename)) + + return files + + +def get_stats(dataset): + """ + return dataset statistics + """ + fields = [field for sample in dataset for field in sample.values()] + sentences = [sentence for field in fields for sentence in field] + words = sorted(set([word for sentence in sentences for word in sentence])) + + return {'word_map': dict((word, i) for i, word in enumerate(words, start=1)), + 'sentence_size': max([len(sentence) for sentence in sentences]), + 'story_size': max([len(story) for story in fields])} + + +def parse_folder_phase(path, task_id, train): + """ + Returns a list of samples for a phase by aggregating all samples + from matching files + """ + phase_data = [] + files = find_files(path, task_id, train) + for file in files: + phase_data.extend(parse_file(file)) + return phase_data + + +def parse_file(filename): + with open(filename) as f: + return parse_lines(f.readlines()) + + +def parse_lines(lines): + """ + Returns a list of samples from a collection of lines where each sample + is a dictionary with 'story', 'question', 'answer' keys. Every key + value is a list of words without punctuation. 
+ """ + data = [] + story = None + for line in lines: + # convert to lower case + line = line.lower() + # find line ID (new stories start with line ID = 1) + line_id, line = line.split(' ', 1) + try: + if int(line_id) == 1: + # new story + story = [] + except: + if not story: + story = [] + # this isn't a line id, re-integrate it into the line + line = "%s %s" % (line_id, line) + # is this a question? + if '?' in line: + items = remove_punctuation(line).split('\t') + question = items[0] + if len(items) > 1: + answer = items[1] + else: + answer = '' + # add to data + data.append({ + 'story': copy.copy(story), + 'question': [question.split()], + 'answer': [answer.split()], + }) + else: + story.append(remove_punctuation(line).split()) + return data + + +def remove_punctuation(s): + return s.translate(string.maketrans("", ""), string.punctuation) diff --git a/plugins/data/bAbI/setup.py b/plugins/data/bAbI/setup.py new file mode 100644 index 000000000..40b266e00 --- /dev/null +++ b/plugins/data/bAbI/setup.py @@ -0,0 +1,27 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. + +import os +from setuptools import setup, find_packages + +from digits.extensions.data import GROUP as DIGITS_PLUGIN_GROUP + + +# Utility function to read the README file. +def read(fname): + return open(os.path.join(os.path.dirname(__file__), fname)).read() + + +setup( + name="digits_bAbI_data_plugin", + version="0.0.1", + author="Greg Heinrich", + description=("A data ingestion plugin for the bAbI dataset"), + long_description=read('README'), + license="Apache", + packages=find_packages(), + entry_points={ + DIGITS_PLUGIN_GROUP: [ + 'class=digitsDataPluginBAbI:DataIngestion', + ]}, + include_package_data=True, +) diff --git a/plugins/data/gan/MANIFEST.in b/plugins/data/gan/MANIFEST.in new file mode 100644 index 000000000..7a2811778 --- /dev/null +++ b/plugins/data/gan/MANIFEST.in @@ -0,0 +1 @@ +recursive-include digitsDataPluginGan *.html diff --git a/plugins/data/gan/README b/plugins/data/gan/README new file mode 100644 index 000000000..e654df110 --- /dev/null +++ b/plugins/data/gan/README @@ -0,0 +1 @@ +This DIGITS plug-in demonstrates how to load data for a Generative Adversarial Network. diff --git a/plugins/data/gan/digitsDataPluginGan/__init__.py b/plugins/data/gan/digitsDataPluginGan/__init__.py new file mode 100644 index 000000000..79071170e --- /dev/null +++ b/plugins/data/gan/digitsDataPluginGan/__init__.py @@ -0,0 +1,6 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +from .data import DataIngestion + +__all__ = ['DataIngestion'] diff --git a/plugins/data/gan/digitsDataPluginGan/data.py b/plugins/data/gan/digitsDataPluginGan/data.py new file mode 100644 index 000000000..50d12c84d --- /dev/null +++ b/plugins/data/gan/digitsDataPluginGan/data.py @@ -0,0 +1,312 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved.
+from __future__ import absolute_import + +import os +import pickle + +import numpy as np + +from digits.utils import constants, override, image, subclass +from digits.extensions.data.interface import DataIngestionInterface +from .forms import DatasetForm, InferenceForm + + +DATASET_TEMPLATE = "templates/dataset_template.html" +INFERENCE_TEMPLATE = "templates/inference_template.html" + +CELEBA_ALL_ATTRIBUTES = """ + 5_o_Clock_Shadow Arched_Eyebrows Attractive Bags_Under_Eyes Bald Bangs + Big_Lips Big_Nose Black_Hair Blond_Hair Blurry Brown_Hair Bushy_Eyebrows + Chubby Double_Chin Eyeglasses Goatee Gray_Hair Heavy_Makeup High_Cheekbones + Male Mouth_Slightly_Open Mustache Narrow_Eyes No_Beard Oval_Face Pale_Skin + Pointy_Nose Receding_Hairline Rosy_Cheeks Sideburns Smiling Straight_Hair + Wavy_Hair Wearing_Earrings Wearing_Hat Wearing_Lipstick Wearing_Necklace + Wearing_Necktie Young + """.split() + +CELEBA_EDITABLE_ATTRIBUTES = [ + 'Bald', 'Black_Hair', 'Blond_Hair', 'Male', 'Smiling', 'Wearing_Lipstick', 'Young' +] + +CELEBA_EDITABLE_ATTRIBUTES_IDS = [CELEBA_ALL_ATTRIBUTES.index(attr) for attr in CELEBA_EDITABLE_ATTRIBUTES] + + +def one_hot(val, depth): + x = np.zeros(depth) + x[val] = 1 + return x + + +def slerp(val, low, high): + """Spherical interpolation. val has a range of 0 to 1.""" + if val <= 0: + return low + elif val >= 1: + return high + omega = np.arccos(np.dot(low/np.linalg.norm(low), high/np.linalg.norm(high))) + so = np.sin(omega) + return np.sin((1.0-val)*omega) / so * low + np.sin(val*omega)/so * high + + +def parse_lines_of_floats(s): + return [[float(val) for val in line.split()] for line in s.splitlines()] + + +@subclass +class DataIngestion(DataIngestionInterface): + """ + A data ingestion extension for GANs + """ + + # CONFIG = "mnist" + CONFIG = "celeba" + # CONFIG = "celeba_cond" + + def __init__(self, is_inference_db=False, **kwargs): + super(DataIngestion, self).__init__(**kwargs) + + if 'dataset_type' in self.userdata: + self.CONFIG = self.userdata['dataset_type'] + + self.z_dim = 100 + if self.CONFIG == "mnist": + self.y_dim = 10 + elif self.CONFIG == "celeba": + self.y_dim = 0 + elif self.CONFIG == "celeba_cond": + self.y_dim = 40 + + self.userdata['is_inference_db'] = is_inference_db + + self.input_dim = self.z_dim + self.y_dim + + @override + def encode_entry(self, entry): + if not self.userdata['is_inference_db']: + filename = entry[0] + label = entry[1] + feature = self.scale_image(filename) + label = np.array(label).reshape(1, 1, len(label)) + else: + if self.userdata['task_id'] in ['style', + 'class', + 'genimg', + 'attributes', + 'analogy', + 'animation']: + feature = entry + label = np.array([0]) + elif self.userdata['task_id'] == 'enclist': + filename = entry[0] + label = entry[1] + feature = self.scale_image(filename) + label = np.array(label).reshape(1, 1, len(label)) + else: + raise NotImplementedError + return feature, label + + def encode_PIL_Image(self, image): + # convert to numpy array + image = np.array(image) + # add channel axis if input is grayscale image + if image.ndim == 2: + image = image[..., np.newaxis] + elif image.ndim != 3: + raise ValueError("Unhandled number of channels: %d" % image.ndim) + # transpose to CHW + image = image.transpose(2, 0, 1) + return image + + @staticmethod + @override + def get_category(): + return "Images" + + @staticmethod + @override + def get_id(): + return "image-gan" + + @staticmethod + @override + def get_dataset_form(): + return DatasetForm() + + @staticmethod + @override + def 
get_dataset_template(form): + """ + parameters: + - form: form returned by get_dataset_form(). This may be populated + with values if the job was cloned + return: + - (template, context) tuple + - template is a Jinja template to use for rendering dataset creation + options + - context is a dictionary of context variables to use for rendering + the form + """ + extension_dir = os.path.dirname(os.path.abspath(__file__)) + template = open(os.path.join(extension_dir, DATASET_TEMPLATE), "r").read() + context = {'form': form} + return (template, context) + + @override + def get_inference_form(self): + return InferenceForm(CELEBA_ALL_ATTRIBUTES, CELEBA_EDITABLE_ATTRIBUTES_IDS) + + @staticmethod + @override + def get_inference_template(form): + extension_dir = os.path.dirname(os.path.abspath(__file__)) + template = open(os.path.join(extension_dir, INFERENCE_TEMPLATE), "r").read() + context = {'form': form} + return (template, context) + + @staticmethod + @override + def get_title(): + return "GAN" + + @override + def itemize_entries(self, stage): + entries = [] + if not self.userdata['is_inference_db']: + if stage == constants.TRAIN_DB: + # read file list + with open(self.userdata['file_list']) as f: + lines = f.read().splitlines() + # skip first 2 lines (header) + for line in lines[2:]: + fields = line.split() + filename = fields[0] + # add full path + filename = os.path.join(self.userdata['image_folder'], filename) + label = [int(field) for field in fields[1:]] + entries.append((filename, label)) + elif stage == constants.TEST_DB: + if self.userdata['task_id'] == 'style': + if self.userdata['style_z1_vector']: + z1 = np.array([float(v) for v in self.userdata['style_z1_vector'].split()]) + else: + z1 = np.random.normal(size=(100,)) + if self.userdata['style_z2_vector']: + z2 = np.array([float(v) for v in self.userdata['style_z2_vector'].split()]) + else: + z2 = np.random.normal(size=(100,)) + for val in np.linspace(0, 1, self.userdata['row_count']): + for c in range(10): + z_ = slerp(val, z1, z2) + feature = np.append(z_, one_hot(c, self.y_dim)).reshape((1, 1, self.input_dim)) + entries.append(feature) + elif self.userdata['task_id'] == 'class': + if self.userdata['class_z_vector']: + z = np.array([float(v) for v in self.userdata['class_z_vector'].split()]) + else: + z = np.random.normal(size=(100,)) + for val in np.linspace(0, 1, self.userdata['row_count']): + for i in range(10): + c_0 = i + c_1 = (i + 1) % 10 + feature_0 = np.append(z, one_hot(c_0, self.y_dim)) + feature_1 = np.append(z, one_hot(c_1, self.y_dim)) + feature = slerp(val, feature_0, feature_1).reshape((1, 1, self.input_dim)) + entries.append(feature) + elif self.userdata['task_id'] == 'genimg': + c = int(self.userdata['genimg_class_id']) + if self.userdata['genimg_z_vector']: + z = np.array([float(v) for v in self.userdata['genimg_z_vector'].split()]) + else: + z = np.random.normal(size=(100,)) + if self.y_dim > 0: + z = np.append(z, one_hot(c, self.y_dim)) + feature = z.reshape((1, 1, self.input_dim)) + entries.append(feature) + elif self.userdata['task_id'] == 'attributes': + if self.userdata['attributes_z_vector']: + z = np.array([float(v) for v in self.userdata['attributes_z_vector'].split()]) + else: + z = np.random.normal(size=(100,)) + with open(self.userdata['attributes_file'], 'rb') as f: + attributes_z = pickle.load(f) + params = parse_lines_of_floats(self.userdata['attributes_params']) + for img_params in params: + z_img = np.copy(z) + for i, coeff in enumerate(img_params): + z_img += coeff * 
attributes_z[CELEBA_EDITABLE_ATTRIBUTES_IDS[i]] + entries.append(z_img.reshape((1, 1, self.input_dim))) + elif self.userdata['task_id'] == 'enclist': + with open(self.userdata['enc_file_list']) as f: + lines = f.read().splitlines() + # skip first 2 lines (header) + max_images = self.userdata['enc_num_images'] + for line in lines[2:max_images + 2]: + fields = line.split() + filename = fields[0] + # add full path + filename = os.path.join(self.userdata['enc_image_folder'], filename) + label = [int(field) for field in fields[1:]] + entries.append((filename, label)) + elif self.userdata['task_id'] == 'analogy': + if self.userdata['attributes_z1_vector']: + z1 = np.array([float(v) for v in self.userdata['attributes_z1_vector'].split()]) + else: + z1 = np.random.normal(size=(100,)) + if self.userdata['attributes_z2_vector']: + z2 = np.array([float(v) for v in self.userdata['attributes_z2_vector'].split()]) + else: + z2 = np.random.normal(size=(100,)) + if self.userdata['attributes_z3_vector']: + z3 = np.array([float(v) for v in self.userdata['attributes_z3_vector'].split()]) + else: + z3 = np.random.normal(size=(100,)) + + # create analogy vector + z4 = z2 + z3 - z1 + + grid_size = self.userdata['row_count'] + + # now interpolate across columns + for row in xrange(grid_size): + row_k = row / float(grid_size - 1) + z_left = slerp(row_k, z1, z3) + z_right = slerp(row_k, z2, z4) + entries.append(z_left.reshape((1, 1, self.input_dim))) + for col in xrange(1, grid_size - 1): + col_k = col / float(grid_size - 1) + z = slerp(col_k, z_left, z_right) + entries.append(z.reshape((1, 1, self.input_dim))) + entries.append(z_right.reshape((1, 1, self.input_dim))) + elif self.userdata['task_id'] == 'animation': + zs = parse_lines_of_floats(self.userdata['animation_z_vectors']) + zs = [np.array(z) for z in zs] + num_transitions = self.userdata['animation_num_transitions'] + for i, z in enumerate(zs): + z_next = zs[(i + 1) % len(zs)] + for k in xrange(num_transitions): + z_ = slerp(float(k) / num_transitions, z, z_next) + entries.append(z_.reshape((1, 1, self.input_dim))) + else: + raise ValueError("Unknown task: %s" % self.userdata['task_id']) + return entries + + def scale_image(self, filename): + im = np.array(image.load_image(filename)) + + # center crop + if self.userdata['center_crop_size']: + crop_size = int(self.userdata['center_crop_size']) + width, height = im.shape[0:2] + i = (width // 2) - crop_size // 2 + j = (height // 2) - crop_size // 2 + im = im[i:i + crop_size, j:j + crop_size, :] + + # resize + if self.userdata['resize']: + resize = int(self.userdata['resize']) + im = image.resize_image(im, resize, resize, resize_mode='squash') + + # transpose to CHW + feature = im.transpose(2, 0, 1) + + return feature diff --git a/plugins/data/gan/digitsDataPluginGan/forms.py b/plugins/data/gan/digitsDataPluginGan/forms.py new file mode 100644 index 000000000..97f38c0b3 --- /dev/null +++ b/plugins/data/gan/digitsDataPluginGan/forms.py @@ -0,0 +1,228 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. 
+from __future__ import absolute_import + +import os + +from flask.ext.wtf import Form +from wtforms import HiddenField, TextAreaField, validators + +from digits import utils +from digits.utils import subclass + + +@subclass +class DatasetForm(Form): + """ + A form used to create a GAN dataset + """ + + def validate_file_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) and not os.path.isdir(field.data): + raise validators.ValidationError( + 'File does not exist or is not reachable') + else: + return True + + def validate_folder_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) or not os.path.isdir(field.data): + raise validators.ValidationError( + 'Folder does not exist or is not reachable') + else: + return True + + file_list = utils.forms.StringField( + u'File list (with attributes) in CelebA format', + validators=[ + validate_file_path, + ], + tooltip="Provide file list in CelebA format" + ) + + image_folder = utils.forms.StringField( + u'Image folder', + validators=[ + validators.DataRequired(), + validate_folder_path, + ], + tooltip="Specify the path to a folder of images." + ) + + center_crop_size = utils.forms.IntegerField( + u'Center crop size', + default=108, + validators=[ + validators.NumberRange(min=0) + ], + tooltip="Specify center crop." + ) + + resize = utils.forms.IntegerField( + u'Resize after crop', + default=64, + tooltip="Resize after crop." + ) + + +@subclass +class InferenceForm(Form): + """ + A form used to perform inference on a GAN dataset + """ + + def __init__(self, attributes, editable_attribute_ids, **kwargs): + super(InferenceForm, self).__init__(**kwargs) + self.attributes = attributes + self.editable_attribute_ids = editable_attribute_ids + + def validate_file_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) and not os.path.isdir(field.data): + raise validators.ValidationError( + 'File does not exist or is not reachable') + else: + return True + + def validate_folder_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) or not os.path.isdir(field.data): + raise validators.ValidationError( + 'Folder does not exist or is not reachable') + else: + return True + + row_count = utils.forms.IntegerField( + u'Rows', + default=10, + validators=[ + validators.NumberRange(min=1) + ], + tooltip="Rows to generate in output grid." + ) + + dataset_type = utils.forms.SelectField( + 'Dataset', + choices=[ + ('mnist', 'MNIST'), + ('celeba', 'CelebA'), + ], + default='celeba', + tooltip="Select a dataset." + ) + + task_id = utils.forms.SelectField( + 'Task ID', + choices=[ + ('class', 'MNIST - Class sweep'), + ('style', 'MNIST - Style sweep'), + ('genimg', 'Generate single image'), + ('attributes', 'CelebA - add/remove attributes'), + ('enclist', 'CelebA - Encode list of images'), + ('analogy', 'CelebA - Analogy'), + ('animation', 'CelebA - Animation'), + ], + default='class', + tooltip="Select a task to execute."
+ ) + + class_z_vector = utils.forms.StringField( + u'Z vector (leave blank for random)', + ) + + style_z1_vector = utils.forms.StringField( + u'Z1 vector (leave blank for random)', + ) + + style_z2_vector = utils.forms.StringField( + u'Z2 vector (leave blank for random)', + ) + + genimg_z_vector = utils.forms.StringField( + u'Z vector (leave blank for random)', + ) + + genimg_class_id = utils.forms.IntegerField( + u'Class ID', + default=0, + validators=[ + validators.NumberRange(min=0, max=9) + ], + tooltip="Class of image to generate (leave blank for CelebA)." + ) + + attributes_z_vector = utils.forms.StringField( + u'Z vector (leave blank for random)', + ) + + attributes_file = utils.forms.StringField( + u'Attributes vector file', + validators=[ + validate_file_path, + ], + tooltip="Specify the path to a file that contains attributes vectors." + ) + + attributes_params = HiddenField() + + enc_file_list = utils.forms.StringField( + u'File list', + validators=[ + validate_file_path, + ], + tooltip="Specify the path to a file that contains a list of files." + ) + + enc_image_folder = utils.forms.StringField( + u'Image folder', + validators=[ + validate_folder_path, + ], + tooltip="Specify the path to a folder of images." + ) + + enc_num_images = utils.forms.IntegerField( + u'Number of images to encode', + default=100, + validators=[ + validators.NumberRange(min=0) + ], + tooltip="Max number of images to encode." + ) + + attributes_z1_vector = utils.forms.StringField( + u'Source Z vector (leave blank for random)', + ) + + attributes_z2_vector = utils.forms.StringField( + u'First Sink Z vector (leave blank for random)', + ) + + attributes_z3_vector = utils.forms.StringField( + u'Second Sink Z vector (leave blank for random)', + ) + + animation_num_transitions = utils.forms.IntegerField( + u'Number of transitions per image', + default=10, + validators=[ + validators.NumberRange(min=1, max=100) + ], + tooltip="Number of transitions between each of the specified images" + ) + + animation_z_vectors = TextAreaField( + u'z vectors (one per line)', + ) diff --git a/plugins/data/gan/digitsDataPluginGan/templates/dataset_template.html b/plugins/data/gan/digitsDataPluginGan/templates/dataset_template.html new file mode 100644 index 000000000..4b1ec2712 --- /dev/null +++ b/plugins/data/gan/digitsDataPluginGan/templates/dataset_template.html @@ -0,0 +1,29 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +
+ {{ form.file_list.label }} + {{ form.file_list.tooltip }} + {{ form.file_list(class='form-control autocomplete_path', placeholder='file') }} +
+ +
+ {{ form.image_folder.label }} + {{ form.image_folder.tooltip }} + {{ form.image_folder(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.center_crop_size.label }} + {{ form.center_crop_size.tooltip }} + {{ form.center_crop_size(class='form-control', placeholder='folder') }} +
+ +
+ {{ form.resize.label }} + {{ form.resize.tooltip }} + {{ form.resize(class='form-control', placeholder='folder') }} +
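The file list referenced above is expected in the standard CelebA attribute-list layout, which DataIngestion.itemize_entries parses by skipping two header lines and then reading a filename plus forty -1/+1 attribute flags per line. A minimal sketch of that parsing, assuming file_list and image_folder hold the two form values:

import os

with open(file_list) as f:
    lines = f.read().splitlines()
for line in lines[2:]:       # first two lines are the header (image count, attribute names)
    fields = line.split()
    filename = os.path.join(image_folder, fields[0])
    label = [int(v) for v in fields[1:]]   # forty values, each -1 or +1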
diff --git a/plugins/data/gan/digitsDataPluginGan/templates/inference_template.html b/plugins/data/gan/digitsDataPluginGan/templates/inference_template.html new file mode 100644 index 000000000..6b979b71c --- /dev/null +++ b/plugins/data/gan/digitsDataPluginGan/templates/inference_template.html @@ -0,0 +1,255 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + + + +

GAN inference Options

+ +
+ +

Choose a type of dataset

+ +
+ {{ form.dataset_type.label }} + {{ form.dataset_type.tooltip }} + {{ form.dataset_type(class='form-control') }} +
+ +

Choose a task

+ +
+ {{ form.task_id.label }} + {{ form.task_id.tooltip }} + {{ form.task_id(class='form-control') }} +
+ +
+

MNIST Class sweep parameters

+ +
Use with "GAN" visualization method (select "Grid" task).
+ +
+ {{ form.class_z_vector.label }} + {{ form.class_z_vector.tooltip }} + {{ form.class_z_vector(class='form-control') }} +
+
+ +
+

MNIST Style sweep parameters

+ +
Use with "GAN" visualization method (select "Grid" task).
+ +
+ {{ form.style_z1_vector.label }} + {{ form.style_z1_vector.tooltip }} + {{ form.style_z1_vector(class='form-control') }} +
+ +
+ {{ form.style_z2_vector.label }} + {{ form.style_z2_vector.tooltip }} + {{ form.style_z2_vector(class='form-control') }} +
+
+ +
+

Image generation parameters

+ +
Use with "Image Output" visualization method (select "HWC" data order)
+ +
+ {{ form.genimg_z_vector.label }} + {{ form.genimg_z_vector.tooltip }} + {{ form.genimg_z_vector(class='form-control') }} +
+ +
+ {{ form.genimg_class_id.label }} + {{ form.genimg_class_id.tooltip }} + {{ form.genimg_class_id(class='form-control') }} +
+
+ +
+

CelebA Additive Attributes

+ +
Use with "Image Output" visualization method (HWC data order).
+ +
+ {{ form.attributes_file.label }} + {{ form.attributes_file.tooltip }} + {{ form.attributes_file(class='form-control autocomplete_path') }} +
+ +
+ {{ form.attributes_z_vector.label }} + {{ form.attributes_z_vector.tooltip }} + {{ form.attributes_z_vector(class='form-control') }} +
+ +
Add or remove attributes by filling corresponding box with +1 or -1 + (or any other multiplier).
+ +
+ {{ form.attributes_params.label }} + {{ form.attributes_params.tooltip }} + {{ form.attributes_params(class='form-control') }} +
+ + + + {% for attr_id in form.editable_attribute_ids %} + + {% endfor %} + + + + +
{{form.attributes[attr_id]}}
+ +
+ +
+

Encode file list

+ +
Use with "GAN" visualization method (select "Encoder" task).
+ +
+ {{ form.enc_file_list.label }} + {{ form.enc_file_list.tooltip }} + {{ form.enc_file_list(class='form-control autocomplete_path', placeholder='file') }} +
+ +
+ {{ form.enc_image_folder.label }} + {{ form.enc_image_folder.tooltip }} + {{ form.enc_image_folder(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.enc_num_images.label }} + {{ form.enc_num_images.tooltip }} + {{ form.enc_num_images(class='form-control autocomplete_path', placeholder='folder') }} +
+
+ +
+

Analogy

+ +
Use with "GAN" visualization method
+ +
+ {{ form.attributes_z1_vector.label }} + {{ form.attributes_z1_vector.tooltip }} + {{ form.attributes_z1_vector(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.attributes_z2_vector.label }} + {{ form.attributes_z2_vector.tooltip }} + {{ form.attributes_z2_vector(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.attributes_z3_vector.label }} + {{ form.attributes_z3_vector.tooltip }} + {{ form.attributes_z3_vector(class='form-control autocomplete_path', placeholder='folder') }} +
+
+ +
+

Animation

+ +
Use with "GAN" visualization method
+ +
+ {{ form.animation_num_transitions.label }} + {{ form.animation_num_transitions.tooltip }} + {{ form.animation_num_transitions(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.animation_z_vectors.label }} + {{ form.animation_z_vectors.tooltip }} + {{ form.animation_z_vectors(class='form-control autocomplete_path', placeholder='z vectors') }} +
+
+ +
+ + diff --git a/plugins/data/gan/digitsDataPluginGan/templates/template.html b/plugins/data/gan/digitsDataPluginGan/templates/template.html new file mode 100644 index 000000000..2b8cf6067 --- /dev/null +++ b/plugins/data/gan/digitsDataPluginGan/templates/template.html @@ -0,0 +1,37 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +{{ form.data_stage(class='form-control') }} + +
+ {{ form.train_data_file.label }} + {{ form.train_data_file.tooltip }} + {{ form.train_data_file(class='form-control autocomplete_path', placeholder='.csv file') }} +
+ +
+ {{ form.val_data_file.label }} + {{ form.val_data_file.tooltip }} + {{ form.val_data_file(class='form-control autocomplete_path', placeholder='.csv file') }} +
+ +
+ {{ form.alphabet.label }} + {{ form.alphabet.tooltip }} + {{ form.alphabet(class='form-control') }} +
+ +
+ {{ form.class_labels_file.label }} + {{ form.class_labels_file.tooltip }} + {{ form.class_labels_file(class='form-control autocomplete_path', placeholder='.txt file') }} +
+ +
+ {{ form.max_chars_per_sample.label }} + {{ form.max_chars_per_sample.tooltip }} + {{ form.max_chars_per_sample(class='form-control') }} +
diff --git a/plugins/data/gan/setup.py b/plugins/data/gan/setup.py new file mode 100644 index 000000000..5fc97b523 --- /dev/null +++ b/plugins/data/gan/setup.py @@ -0,0 +1,27 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. + +import os +from setuptools import setup, find_packages + +from digits.extensions.data import GROUP as DIGITS_PLUGIN_GROUP + + +# Utility function to read the README file. +def read(fname): + return open(os.path.join(os.path.dirname(__file__), fname)).read() + + +setup( + name="digits_gan_data_plugin", + version="0.0.1", + author="Greg Heinrich", + description=("A data ingestion plugin for GANs"), + long_description=read('README'), + license="Apache", + packages=find_packages(), + entry_points={ + DIGITS_PLUGIN_GROUP: [ + 'class=digitsDataPluginGan:DataIngestion', + ]}, + include_package_data=True, +) diff --git a/plugins/view/gan/MANIFEST.in b/plugins/view/gan/MANIFEST.in new file mode 100644 index 000000000..36a8647ad --- /dev/null +++ b/plugins/view/gan/MANIFEST.in @@ -0,0 +1 @@ +recursive-include digitsViewPluginGan *.html diff --git a/plugins/view/gan/README b/plugins/view/gan/README new file mode 100644 index 000000000..8b0ecd5a1 --- /dev/null +++ b/plugins/view/gan/README @@ -0,0 +1 @@ +This DIGITS plug-in visualizes the output of a GAN. \ No newline at end of file diff --git a/plugins/view/gan/digitsViewPluginGan/__init__.py b/plugins/view/gan/digitsViewPluginGan/__init__.py new file mode 100644 index 000000000..af82aa2f8 --- /dev/null +++ b/plugins/view/gan/digitsViewPluginGan/__init__.py @@ -0,0 +1,6 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +from .view import Visualization + +__all__ = ['Visualization'] diff --git a/plugins/view/gan/digitsViewPluginGan/forms.py b/plugins/view/gan/digitsViewPluginGan/forms.py new file mode 100644 index 000000000..1e49a744d --- /dev/null +++ b/plugins/view/gan/digitsViewPluginGan/forms.py @@ -0,0 +1,50 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +import os + +from digits import utils +from digits.utils import subclass +from flask.ext.wtf import Form + + +@subclass +class ConfigForm(Form): + """ + A form used to configure gradient visualization + """ + + def validate_file_path(form, field): + if not field.data: + pass + else: + # make sure the filesystem path exists + if not os.path.exists(field.data) and not os.path.isdir(field.data): + raise validators.ValidationError( + 'File does not exist or is not reachable') + else: + return True + + + gan_view_task_id = utils.forms.SelectField( + 'Task', + choices=[ + ('grid', 'Grid'), + ('mnist_encoder', 'MNIST Encoder'), + ('celeba_encoder', 'CelebA Encoder'), + ('animation', 'Animation'), + ('attributes', 'CelebA get attributes'), + ], + default='grid', + tooltip="Select a task." + ) + + attributes_file = utils.forms.StringField( + u'Attributes vector file', + validators=[ + validate_file_path, + ], + tooltip="Specify the path to a file that contains attributes vectors." + ) + + pass diff --git a/plugins/view/gan/digitsViewPluginGan/templates/config_template.html b/plugins/view/gan/digitsViewPluginGan/templates/config_template.html new file mode 100644 index 000000000..ecb3dce24 --- /dev/null +++ b/plugins/view/gan/digitsViewPluginGan/templates/config_template.html @@ -0,0 +1,19 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. 
#} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +Show the output of a GAN + +
+ {{ form.gan_view_task_id.label }} + {{ form.gan_view_task_id.tooltip }} + {{ form.gan_view_task_id(class='form-control autocomplete_path', placeholder='folder') }} +
+ +
+ {{ form.attributes_file.label }} + {{ form.attributes_file.tooltip }} + {{ form.attributes_file(class='form-control autocomplete_path') }} +
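The inline validate_file_path validator in forms.py above raises validators.ValidationError, so the module needs wtforms' validators in scope; the hunk as shown does not include that import. A minimal sketch of the same check with the import made explicit (the import line and the simplified condition are assumptions, not part of the patch):

    import os

    from wtforms import validators  # assumed import; provides ValidationError


    def validate_file_path(form, field):
        # An empty value is allowed; otherwise the path must exist on the filesystem
        if field.data and not os.path.exists(field.data):
            raise validators.ValidationError('File does not exist or is not reachable')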
diff --git a/plugins/view/gan/digitsViewPluginGan/templates/header_template.html b/plugins/view/gan/digitsViewPluginGan/templates/header_template.html new file mode 100644 index 000000000..313fa8348 --- /dev/null +++ b/plugins/view/gan/digitsViewPluginGan/templates/header_template.html @@ -0,0 +1,28 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + + + + + + + {% if animated_image %} + +

Animation

+ + + {% endif %} + {% if task_id == 'grid' %} + +

Grid

+ + {% for row_id in rows %} + + {% for col_id in cols %} + + {% endfor %} + + {% endfor %} + {% endif %} +
+
+
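The header template above expects an animated_image data URI plus rows/cols ranges in its rendering context; these are supplied later by get_header_template() in view.py. A condensed sketch of how the animated GIF becomes a data URI there (Python 2 idioms kept to match the plugin; frames are assumed to be a list of uint8 arrays):

    from cStringIO import StringIO

    import imageio


    def make_animated_data_uri(frames, fmt='gif'):
        # Encode the frames as an animated GIF in memory, then embed them as a data URI
        buf = StringIO()
        imageio.mimsave(buf, frames, format=fmt)
        data = buf.getvalue().encode('base64').replace('\n', '')
        return 'data:image/%s;base64,%s' % (fmt, data)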
diff --git a/plugins/view/gan/digitsViewPluginGan/templates/view_template.html b/plugins/view/gan/digitsViewPluginGan/templates/view_template.html new file mode 100644 index 000000000..d7d234b18 --- /dev/null +++ b/plugins/view/gan/digitsViewPluginGan/templates/view_template.html @@ -0,0 +1,47 @@ +{# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. #} + +{% from "helper.html" import print_flashes %} +{% from "helper.html" import print_errors %} +{% from "helper.html" import mark_errors %} + +{% if task_id=='grid' %} + +{% endif %} +{% if task_id=='grid' or task_id=='animation' %} + {{key}} + +{% elif task_id=='encoder' %} + + + + + + +
+ + + + + {{z}} +
+{% elif task_id=='attributes' %} + + + + + + +
+ + + {% for attribute in top5 %} + {{attribute[1]}} {{ attribute[0] }} +
+ {% endfor %} +
+{% endif %} diff --git a/plugins/view/gan/digitsViewPluginGan/view.py b/plugins/view/gan/digitsViewPluginGan/view.py new file mode 100644 index 000000000..a5a63ffcd --- /dev/null +++ b/plugins/view/gan/digitsViewPluginGan/view.py @@ -0,0 +1,270 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. +from __future__ import absolute_import + +import os +import tempfile + +# Find the best implementation available +try: + from cStringIO import StringIO +except ImportError: + from StringIO import StringIO +import pickle + +import imageio +import numpy as np +import PIL.Image +import PIL.ImageDraw + +import digits +from digits.utils import subclass, override +from digits.extensions.view.interface import VisualizationInterface +from .forms import ConfigForm + + +CONFIG_TEMPLATE = "templates/config_template.html" +HEADER_TEMPLATE = "templates/header_template.html" +VIEW_TEMPLATE = "templates/view_template.html" + +CELEBA_ATTRIBUTES = """ + 5_o_Clock_Shadow Arched_Eyebrows Attractive Bags_Under_Eyes Bald Bangs + Big_Lips Big_Nose Black_Hair Blond_Hair Blurry Brown_Hair Bushy_Eyebrows + Chubby Double_Chin Eyeglasses Goatee Gray_Hair Heavy_Makeup High_Cheekbones + Male Mouth_Slightly_Open Mustache Narrow_Eyes No_Beard Oval_Face Pale_Skin + Pointy_Nose Receding_Hairline Rosy_Cheeks Sideburns Smiling Straight_Hair + Wavy_Hair Wearing_Earrings Wearing_Hat Wearing_Lipstick Wearing_Necklace + Wearing_Necktie Young + """.split() + + +@subclass +class Visualization(VisualizationInterface): + """ + A visualization extension to display the output of a GAN + """ + + def __init__(self, dataset, **kwargs): + """ + Init + """ + # memorize view template for later use + extension_dir = os.path.dirname(os.path.abspath(__file__)) + self.view_template = open( + os.path.join(extension_dir, VIEW_TEMPLATE), "r").read() + + self.normalize = True + self.grid_size = 10 + + # view options + self.task_id = kwargs['gan_view_task_id'] + self.attributes_file = kwargs['attributes_file'] + + @staticmethod + def get_config_form(): + return ConfigForm() + + @staticmethod + def get_config_template(form): + """ + parameters: + - form: form returned by get_config_form(). 
This may be populated + with values if the job was cloned + returns: + - (template, context) tuple + - template is a Jinja template to use for rendering config options + - context is a dictionary of context variables to use for rendering + the form + """ + extension_dir = os.path.dirname(os.path.abspath(__file__)) + template = open( + os.path.join(extension_dir, CONFIG_TEMPLATE), "r").read() + context = {'form': form} + return (template, context) + + @override + def get_header_template(self): + """ + Implements get_header_template() method from view extension interface + """ + + extension_dir = os.path.dirname(os.path.abspath(__file__)) + template = open( + os.path.join(extension_dir, HEADER_TEMPLATE), "r").read() + + context = {'task_id': self.task_id, + 'cols': range(self.grid_size), + 'rows': range(self.grid_size), + 'animated_image': None} + + if hasattr(self, 'animated_images'): + # create animated gif + string_buf = StringIO() + fmt = "gif" + imageio.mimsave(string_buf, self.animated_images, format=fmt) + data = string_buf.getvalue().encode('base64').replace('\n', '') + animated_image_html = 'data:image/%s;base64,%s' % (fmt, data) + context['animated_image'] = animated_image_html + + return template, context + + @staticmethod + def get_id(): + return "image-gan" + + @staticmethod + def get_title(): + return "GAN" + + def get_image_html(self, image): + # assume 8-bit + if self.normalize: + image -= image.min() + if image.max() > 0: + image /= image.max() + image *= 255 + else: + # clip + image = image.clip(0, 255) + + # convert to uint8 + image = image.astype('uint8') + + # convert to PIL image + channels = image.shape[2] + if channels == 1: + # drop channel axis + image = PIL.Image.fromarray(image[:, :, 0]) + elif channels == 3: + image = PIL.Image.fromarray(image) + else: + raise ValueError("Unhandled number of channels: %d" % channels) + + #image.save(fname) + + image_html = digits.utils.image.embed_image_html(image) + + return image_html + + @override + def get_view_template(self, data): + """ + parameters: + - data: data returned by process_data() + returns: + - (template, context) tuple + - template is a Jinja template to use for rendering config + options + - context is a dictionary of context variables to use for + rendering the form + """ + context = {'task_id': self.task_id} + context.update(data) + if self.task_id in ['celeba_encoder', 'mnist_encoder']: + context.update({'task_id': 'encoder'}) + return self.view_template, context + + @override + def process_data(self, input_id, input_data, output_data): + """ + Process one inference and return data to visualize + """ + data = output_data[output_data.keys()[0]].astype('float32') + + if self.task_id == 'grid': + col_id = int(input_id) // self.grid_size + row_id = int(input_id) % self.grid_size + image_html = self.get_image_html(data) + + img_size = data.shape[0] + if img_size == 28: + # MNIST + if not hasattr(self, 'animated_images'): + self.animated_images = [None] * (self.grid_size ** 2) + self.animated_images[row_id * self.grid_size + col_id] = data.astype('uint8') + elif img_size == 64: + # CelebA + if not hasattr(self, 'animated_images'): + self.animated_images = [None] * (4 * self.grid_size - 4) + print("animated: %s" % repr(self.animated_images)) + + if ( + col_id == 0 or + row_id == 0 or + col_id == (self.grid_size - 1) or + row_id == (self.grid_size - 1) + ): + if row_id == 0: + idx = col_id + elif col_id == (self.grid_size - 1): + idx = self.grid_size - 1 + row_id + elif row_id == (self.grid_size - 1): + idx = 3 * 
self.grid_size - 3 - col_id + else: + idx = 4 * self.grid_size - 4 - row_id + self.animated_images[idx] = data.astype('uint8') + print("set idx %d " % idx) + else: + raise ValueError("Unhandled image size: %d" % img_size) + + return {'image': image_html, + 'col_id': col_id, + 'row_id': row_id, + 'key': input_id} + elif self.task_id == 'mnist_encoder': + self.z_dim = 100 + z = data[:self.z_dim] + image = data[self.z_dim:].reshape(28, 28) + input_data = input_data.astype('float32') + input_data = input_data[:, :, np.newaxis] + image = image[:, :, np.newaxis] + image_input_html = self.get_image_html(input_data) + image_output_html = self.get_image_html(image) + return {'z': z, + 'image_input': image_input_html, + 'image_output': image_output_html, + 'key': input_id} + elif self.task_id == 'celeba_encoder': + self.z_dim = 100 + z = data[:self.z_dim] + image = data[self.z_dim:].reshape(64, 64, 3) + input_data = input_data.astype('float32') + image_input_html = self.get_image_html(input_data) + image_output_html = self.get_image_html(image) + return {'z': z, + 'image_input': image_input_html, + 'image_output': image_output_html, + 'key': input_id} + elif self.task_id == 'animation': + image_html = self.get_image_html(data) + if not hasattr(self, 'animated_images'): + self.animated_images = [] + self.animated_images.append(data.astype('uint8')) + return {'image': image_html, + 'key': input_id} + elif self.task_id == 'attributes': + self.z_dim = 100 + z = data[:self.z_dim] + input_data = input_data.astype('float32') + image_input_html = self.get_image_html(input_data) + image = data[self.z_dim:].reshape(64, 64, 3) + image_output_html = self.get_image_html(image) + with open(self.attributes_file, 'rb') as f: + attributes_z = pickle.load(f) + + #inner_products = np.inner(z, attributes_z) + inner_products = np.empty((40)) + for i in range(40): + #if i in [ 1, 2, 18, 19, 20, 21, 25, 27, 31, 33, 36]: + if True: #i in [ 0, 1, 2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 15, 16, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39]: + attr = attributes_z[i] + inner_products[i] = np.inner(z, attr) / np.linalg.norm(attr) + else: + inner_products[i] = 0 + + top_5_indices = np.argsort(inner_products)[::-1][:5] + top_5 = [(CELEBA_ATTRIBUTES[idx], "%.2f" % inner_products[idx]) for idx in top_5_indices] + return {'image_input': image_input_html, + 'image_output': image_output_html, + 'top5': top_5} + else: + raise ValueError("Unknown task: %s" % self.task_id) diff --git a/plugins/view/gan/setup.py b/plugins/view/gan/setup.py new file mode 100644 index 000000000..c6c59cb42 --- /dev/null +++ b/plugins/view/gan/setup.py @@ -0,0 +1,29 @@ +# Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. + +import os +from setuptools import setup, find_packages + +from digits.extensions.view import GROUP as DIGITS_PLUGIN_GROUP + + +# Utility function to read the README file.
+def read(fname): + return open(os.path.join(os.path.dirname(__file__), fname)).read() + + +setup( + name="digits_gan_view_plugin", + version="0.0.1", + author="Greg Heinrich", + description=("A view plugin for GANs"), + long_description=read('README'), + license="Apache", + packages=find_packages(), + entry_points={ + DIGITS_PLUGIN_GROUP: [ + 'class=digitsViewPluginGan:Visualization', + ] + }, + include_package_data=True, + install_requires=['imageio>=2.1.2'], +) diff --git a/setup.cfg b/setup.cfg index 14a0e62fc..ffb823f58 100644 --- a/setup.cfg +++ b/setup.cfg @@ -1,7 +1,8 @@ [flake8] max-line-length = 120 -exclude = venv +exclude = venv,standard-networks [pep8] max-line-length = 120 exclude = venv +
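Both plugins advertise their classes through setuptools entry points (DIGITS_PLUGIN_GROUP from digits.extensions.data and digits.extensions.view respectively), so after installing them, for example with pip install -e plugins/data/gan and pip install -e plugins/view/gan, DIGITS can discover them by group name. A quick sanity-check sketch, assuming DIGITS and both plugins are importable in the same environment:

    import pkg_resources

    from digits.extensions.data import GROUP as DATA_GROUP
    from digits.extensions.view import GROUP as VIEW_GROUP

    # List every plugin class registered under the DIGITS entry-point groups
    for group in (DATA_GROUP, VIEW_GROUP):
        for entry_point in pkg_resources.iter_entry_points(group=group):
            print('%s -> %s' % (group, entry_point))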