Extract a base Model class from the current Model class, rename the current class to CNNModel, and make it a subclass of Model.

PiperOrigin-RevId: 207753123
protoget authored and tensorflower-gardener committed Aug 7, 2018
1 parent 6eeaa75 commit 634b921
Showing 18 changed files with 76 additions and 53 deletions.
18 changes: 12 additions & 6 deletions scripts/tf_cnn_benchmarks/benchmark_cnn.py
@@ -2773,8 +2773,8 @@ def add_sync_queues_and_barrier(self, name_prefix, enqueue_after_list):
     return tf.group(*queue_ops)
 
 
-class BenchmarkSeq2Seq(BenchmarkCNN):
-  """Class for benchmarking a seq2seq network."""
+class BenchmarkNMT(BenchmarkCNN):
+  """Class for benchmarking an NMT network."""
 
   def __init__(self, params, dataset=None, model=None):
     # pylint:disable=super-init-not-called
@@ -2788,16 +2788,22 @@ def _build_graph(self):
     """
     pass
 
-  def _build_model_single_session_with_dataset_prefetching(self):
-    pass
+  def _build_model(self):
+    """Build the TensorFlow graph."""
+
+    # Not implemented since FLAGS.dataset_use_prefetch defaults to True.
+    raise NotImplementedError
 
   def _build_model_single_session(self):
-    pass
+    """Build the TensorFlow graph for multiple replicas in a single_session."""
+
+    # Not implemented since FLAGS.dataset_use_prefetch defaults to True.
+    raise NotImplementedError
 
   def _build_model_with_dataset_prefetching(self):
     pass
 
-  def _build_model(self):
+  def _build_model_single_session_with_dataset_prefetching(self):
     pass
 
 
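For orientation: the renamed BenchmarkNMT is still a stub, and only the dataset-prefetching build path is meant to work. A model driven by it would subclass the new framework-agnostic Model base class added in models/model.py further below, rather than CNNModel. A minimal sketch of such a model follows; the class name, vocabulary/embedding sizes, and the body of build_network are illustrative assumptions, not part of this commit, which only declares the hook.

```python
# Sketch only. Everything except the new Model constructor signature and the
# build_network override point is an illustrative assumption.
import tensorflow as tf

from models import model


class SketchNMTModel(model.Model):
  """Hypothetical NMT model config; needs no image_size or layer_counts."""

  def __init__(self):
    # New base-class signature: (model_name, batch_size, learning_rate,
    # fp16_loss_scale).
    super(SketchNMTModel, self).__init__(
        'sketch_nmt', batch_size=128, learning_rate=0.5, fp16_loss_scale=128)

  def build_network(self, inputs, **kwargs):
    # A real model would build its encoder/decoder graph from `inputs` here;
    # this trivial stand-in just embeds the first input tensor.
    del kwargs
    embeddings = tf.get_variable('nmt_embeddings', shape=[32000, 512])
    return tf.nn.embedding_lookup(embeddings, inputs[0])
```

Nothing in this commit wires such a model into BenchmarkNMT yet; the non-prefetching _build_model* paths above simply raise NotImplementedError.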
@@ -434,7 +434,7 @@ def _test_variable_update(self,
       actual_losses.append([x.loss for x in outputs])
 
     inputs = test_util.get_fake_var_update_inputs()
-    expected_losses = test_util.TestModel().manually_compute_losses(
+    expected_losses = test_util.TestCNNModel().manually_compute_losses(
         inputs, num_workers, params)
     if params.variable_update == 'distributed_all_reduce':
       # In distributed all reduce, each step, the controller outputs the average
@@ -91,7 +91,7 @@ def run_with_real_model(params):
 
 def run_with_test_model(params):
   """Runs tf_cnn_benchmarks with a test model."""
-  model = test_util.TestModel()
+  model = test_util.TestCNNModel()
   inputs = test_util.get_fake_var_update_inputs()
   with test_util.monkey_patch(benchmark_cnn,
                               LOSS_AND_ACCURACY_DIGITS_TO_SHOW=15):
8 changes: 4 additions & 4 deletions scripts/tf_cnn_benchmarks/benchmark_cnn_test.py
@@ -1003,7 +1003,7 @@ def setUp(self):
   def _get_benchmark_cnn_losses(self, inputs, params):
     """Returns the losses of BenchmarkCNN on the given inputs and params."""
     logs = []
-    model = test_util.TestModel()
+    model = test_util.TestCNNModel()
     with test_util.monkey_patch(benchmark_cnn,
                                 log_fn=test_util.print_and_add_to_list(logs),
                                 LOSS_AND_ACCURACY_DIGITS_TO_SHOW=15):
@@ -1022,16 +1022,16 @@ def _get_benchmark_cnn_losses(self, inputs, params):
   def _test_variable_update(self, params):
     """Tests variables are updated correctly when the given params are used.
 
-    A BenchmarkCNN is created with a TestModel, and is run with some scalar
+    A BenchmarkCNN is created with a TestCNNModel, and is run with some scalar
     images. The losses are then compared with the losses obtained with
-    TestModel().manually_compute_losses()
+    TestCNNModel().manually_compute_losses()
 
     Args:
       params: a Params tuple used to create BenchmarkCNN.
     """
     inputs = test_util.get_fake_var_update_inputs()
     actual_losses = self._get_benchmark_cnn_losses(inputs, params)
-    expected_losses, = test_util.TestModel().manually_compute_losses(
+    expected_losses, = test_util.TestCNNModel().manually_compute_losses(
         inputs, 1, params)
     rtol = 3e-2 if params.use_fp16 else 1e-5
     self.assertAllClose(actual_losses[:len(expected_losses)], expected_losses,
4 changes: 2 additions & 2 deletions scripts/tf_cnn_benchmarks/models/alexnet_model.py
@@ -25,7 +25,7 @@
 from models import model
 
 
-class AlexnetModel(model.Model):
+class AlexnetModel(model.CNNModel):
   """Alexnet cnn model."""
 
   def __init__(self):
@@ -48,7 +48,7 @@ def add_inference(self, cnn):
     cnn.dropout()
 
 
-class AlexnetCifar10Model(model.Model):
+class AlexnetCifar10Model(model.CNNModel):
   """Alexnet cnn model for cifar datasets.
 
   The model architecture follows the one defined in the tensorflow tutorial
2 changes: 1 addition & 1 deletion scripts/tf_cnn_benchmarks/models/densenet_model.py
@@ -24,7 +24,7 @@
 from models import model as model_lib
 
 
-class DensenetCifar10Model(model_lib.Model):
+class DensenetCifar10Model(model_lib.CNNModel):
   """Densenet cnn network configuration."""
 
   def __init__(self, model, layer_counts, growth_rate):
3 changes: 2 additions & 1 deletion scripts/tf_cnn_benchmarks/models/googlenet_model.py
@@ -25,7 +25,8 @@
 from models import model
 
 
-class GooglenetModel(model.Model):
+class GooglenetModel(model.CNNModel):
+  """GoogLeNet."""
 
   def __init__(self):
     super(GooglenetModel, self).__init__('googlenet', 224, 32, 0.005)
6 changes: 4 additions & 2 deletions scripts/tf_cnn_benchmarks/models/inception_model.py
@@ -41,7 +41,8 @@
 from models import model
 
 
-class Inceptionv3Model(model.Model):
+class Inceptionv3Model(model.CNNModel):
+  """InceptionV3."""
 
   def __init__(self, auxiliary=False):
     self._auxiliary = auxiliary
@@ -157,7 +158,8 @@ def inception_v4_rb(cnn):
   cnn.inception_module('incept_v4_rb', cols)
 
 
-class Inceptionv4Model(model.Model):
+class Inceptionv4Model(model.CNNModel):
+  """Inceptionv4."""
 
   def __init__(self):
     super(Inceptionv4Model, self).__init__('inception4', 299, 32, 0.005)
3 changes: 2 additions & 1 deletion scripts/tf_cnn_benchmarks/models/lenet_model.py
@@ -24,7 +24,8 @@
 from models import model
 
 
-class Lenet5Model(model.Model):
+class Lenet5Model(model.CNNModel):
+  """Lenet5."""
 
   def __init__(self):
     super(Lenet5Model, self).__init__('lenet5', 28, 32, 0.005)
3 changes: 1 addition & 2 deletions scripts/tf_cnn_benchmarks/models/mobilenet_v2.py
@@ -186,7 +186,7 @@ def training_scope(**kwargs):
   return lib.training_scope(**kwargs)
 
 
-class MobilenetModel(model.Model):
+class MobilenetModel(model.CNNModel):
   """Mobilenet model configuration."""
 
   def __init__(self):
@@ -196,4 +196,3 @@ def add_inference(self, cnn):
     with tf.contrib.slim.arg_scope(training_scope(is_training=cnn.phase_train)):
       cnn.top_layer, _ = mobilenet(cnn.top_layer, is_training=cnn.phase_train)
       cnn.top_size = cnn.top_layer.shape[-1].value
-
47 changes: 30 additions & 17 deletions scripts/tf_cnn_benchmarks/models/model.py
@@ -19,31 +19,20 @@
 
 
 class Model(object):
-  """Base model configuration for CNN benchmarks."""
+  """Base model config for DNN benchmarks."""
 
-  def __init__(self,
-               model,
-               image_size,
-               batch_size,
-               learning_rate,
-               layer_counts=None,
-               fp16_loss_scale=128):
-    self.model = model
-    self.image_size = image_size
+  def __init__(self, model_name, batch_size, learning_rate, fp16_loss_scale):
+    self.model = model_name
     self.batch_size = batch_size
     self.default_batch_size = batch_size
     self.learning_rate = learning_rate
-    self.layer_counts = layer_counts
     # TODO(reedwm) Set custom loss scales for each model instead of using the
     # default of 128.
     self.fp16_loss_scale = fp16_loss_scale
 
   def get_model(self):
     return self.model
 
-  def get_image_size(self):
-    return self.image_size
-
   def get_batch_size(self):
     return self.batch_size
 
@@ -53,9 +42,6 @@ def set_batch_size(self, batch_size):
   def get_default_batch_size(self):
     return self.default_batch_size
 
-  def get_layer_counts(self):
-    return self.layer_counts
-
   def get_fp16_loss_scale(self):
     return self.fp16_loss_scale
 
@@ -67,6 +53,33 @@ def get_learning_rate(self, global_step, batch_size):
   def add_inference(self, unused_cnn):
     raise ValueError('Must be implemented in derived classes')
 
+  def build_network(self, inputs, **kwargs):
+    del inputs
+    del kwargs
+    raise ValueError('Must be implemented in derived classes')
+
+
+class CNNModel(Model):
+  """Base model configuration for CNN benchmarks."""
+
+  def __init__(self,
+               model,
+               image_size,
+               batch_size,
+               learning_rate,
+               layer_counts=None,
+               fp16_loss_scale=128):
+    super(CNNModel, self).__init__(model, batch_size, learning_rate,
+                                   fp16_loss_scale)
+    self.image_size = image_size
+    self.layer_counts = layer_counts
+
+  def get_image_size(self):
+    return self.image_size
+
+  def get_layer_counts(self):
+    return self.layer_counts
+
   def skip_final_affine_layer(self):
     """Returns if the caller of this class should skip the final affine layer.
 
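To make the new split concrete, here is a minimal sketch of a CNN config written against the refactored hierarchy. The constructor signature matches the CNNModel shown above; the class name and the layers in add_inference are illustrative assumptions (the cnn argument is the benchmark's layer-builder object, as in the other model files in this commit).

```python
# Sketch only; 'sketch_cnn' and the layer stack are illustrative assumptions.
from models import model


class SketchCNNModel(model.CNNModel):
  """Hypothetical CNN config: image_size and layer_counts stay on CNNModel."""

  def __init__(self):
    # (model_name, image_size, batch_size, learning_rate), as in the diff above.
    super(SketchCNNModel, self).__init__('sketch_cnn', 224, 32, 0.005)

  def add_inference(self, cnn):
    # `cnn` is the benchmark's convnet builder; these calls mirror the ones
    # in the alexnet/vgg model files touched by this commit.
    cnn.conv(64, 3, 3)
    cnn.mpool(2, 2)
    cnn.affine(512)
```

The existing subclasses in this commit (AlexNet, VGG, ResNet, NASNet, and so on) only needed their base class switched from model.Model to model.CNNModel; their constructors and add_inference bodies are unchanged.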
6 changes: 3 additions & 3 deletions scripts/tf_cnn_benchmarks/models/nasnet_model.py
@@ -532,7 +532,7 @@ def add_and_check_endpoint(endpoint_name, net):
   return logits, end_points
 
 
-class NasnetModel(model.Model):
+class NasnetModel(model.CNNModel):
   """Nasnet model configuration."""
 
   def __init__(self):
@@ -547,7 +547,7 @@ def add_inference(self, cnn):
     cnn.top_size = cnn.top_layer.shape[-1].value
 
 
-class NasnetLargeModel(model.Model):
+class NasnetLargeModel(model.CNNModel):
   """Nasnet model configuration."""
 
   def __init__(self):
@@ -562,7 +562,7 @@ def add_inference(self, cnn):
     cnn.top_size = cnn.top_layer.shape[-1].value
 
 
-class NasnetCifarModel(model.Model):
+class NasnetCifarModel(model.CNNModel):
   """Nasnet cifar model configuration."""
 
   def __init__(self):
2 changes: 1 addition & 1 deletion scripts/tf_cnn_benchmarks/models/official_resnet_model.py
@@ -23,7 +23,7 @@
 from models import model as model_lib
 
 
-class ImagenetResnetModel(model_lib.Model):
+class ImagenetResnetModel(model_lib.CNNModel):
   """Official resnet models."""
 
   def __init__(self, resnet_size, version=2):
3 changes: 2 additions & 1 deletion scripts/tf_cnn_benchmarks/models/overfeat_model.py
@@ -26,7 +26,8 @@
 from models import model
 
 
-class OverfeatModel(model.Model):
+class OverfeatModel(model.CNNModel):
+  """OverfeatModel."""
 
   def __init__(self):
     super(OverfeatModel, self).__init__('overfeat', 231, 32, 0.005)
4 changes: 2 additions & 2 deletions scripts/tf_cnn_benchmarks/models/resnet_model.py
@@ -235,7 +235,7 @@ def residual_block(cnn, depth, stride, version):
   cnn.top_size = depth
 
 
-class ResnetModel(model_lib.Model):
+class ResnetModel(model_lib.CNNModel):
   """Resnet cnn network configuration."""
 
   def __init__(self, model, layer_counts):
@@ -323,7 +323,7 @@ def create_resnet152_v2_model():
   return ResnetModel('resnet152_v2', (3, 8, 36, 3))
 
 
-class ResnetCifar10Model(model_lib.Model):
+class ResnetCifar10Model(model_lib.CNNModel):
   """Resnet cnn network configuration for Cifar 10 dataset.
 
   V1 model architecture follows the one defined in the paper:
4 changes: 2 additions & 2 deletions scripts/tf_cnn_benchmarks/models/trivial_model.py
@@ -17,7 +17,7 @@
 from models import model
 
 
-class TrivialModel(model.Model):
+class TrivialModel(model.CNNModel):
   """Trivial model configuration."""
 
   def __init__(self):
@@ -29,7 +29,7 @@ def add_inference(self, cnn):
     cnn.affine(4096)
 
 
-class TrivialCifar10Model(model.Model):
+class TrivialCifar10Model(model.CNNModel):
   """Trivial cifar10 model configuration."""
 
   def __init__(self):
6 changes: 3 additions & 3 deletions scripts/tf_cnn_benchmarks/models/vgg_model.py
@@ -53,7 +53,7 @@ def _construct_vgg(cnn, num_conv_layers):
   cnn.dropout()
 
 
-class Vgg11Model(model.Model):
+class Vgg11Model(model.CNNModel):
 
   def __init__(self):
     super(Vgg11Model, self).__init__('vgg11', 224, 64, 0.005)
@@ -62,7 +62,7 @@ def add_inference(self, cnn):
     _construct_vgg(cnn, [1, 1, 2, 2, 2])
 
 
-class Vgg16Model(model.Model):
+class Vgg16Model(model.CNNModel):
 
   def __init__(self):
     super(Vgg16Model, self).__init__('vgg16', 224, 64, 0.005)
@@ -71,7 +71,7 @@ def add_inference(self, cnn):
     _construct_vgg(cnn, [2, 2, 3, 3, 3])
 
 
-class Vgg19Model(model.Model):
+class Vgg19Model(model.CNNModel):
 
   def __init__(self):
     super(Vgg19Model, self).__init__('vgg19', 224, 64, 0.005)
6 changes: 3 additions & 3 deletions scripts/tf_cnn_benchmarks/test_util.py
@@ -433,7 +433,7 @@ def manually_compute_losses(numpy_inputs, inputs_placeholder, loss, num_workers,
   return losses
 
 
-class TestModel(model.Model):
+class TestCNNModel(model.CNNModel):
   """A simple model used for testing.
 
   The input is a 1-channel 1x1 image, consisting of a single number. The model
@@ -444,8 +444,8 @@ class TestModel(model.Model):
   """
 
   def __init__(self):
-    super(TestModel, self).__init__('test_model', image_size=1, batch_size=1,
-                                    learning_rate=1)
+    super(TestCNNModel, self).__init__(
+        'test_cnn_model', image_size=1, batch_size=1, learning_rate=1)
 
   VAR_A_INITIAL_VALUE = 1.
   VAR_B_INITIAL_VALUE = 2.
