Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Activation histograms #17624

Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
67 changes: 64 additions & 3 deletions keras/callbacks.py
Original file line number Diff line number Diff line change
Expand Up @@ -2324,7 +2324,7 @@ class TensorBoard(Callback, version_utils.TensorBoardVersionSelector):

* Metrics summary plots
* Training graph visualization
* Weight histograms
* Activation and Weight histograms
* Sampled profiling

When used in `Model.evaluate`, in addition to epoch summaries, there will be
Expand All @@ -2346,10 +2346,11 @@ class TensorBoard(Callback, version_utils.TensorBoardVersionSelector):
log_dir: the path of the directory where to save the log files to be
parsed by TensorBoard. e.g. log_dir = os.path.join(working_dir,
'logs') This directory should not be reused by any other callbacks.
histogram_freq: frequency (in epochs) at which to compute
histogram_freq: frequency (in epochs) at which to compute activation and
weight histograms for the layers of the model. If set to 0, histograms
won't be computed. Validation data (or split) must be specified for
histogram visualizations.
histogram visualizations. Only weight histograms are supported for
subclassed models.
write_graph: whether to visualize the graph in TensorBoard. The log file
can become quite large when write_graph is set to True.
write_images: whether to write model weights to visualize as image in
Expand Down Expand Up @@ -2488,6 +2489,12 @@ def __init__(
# Used to restore any existing `SummaryWriter` after training ends.
self._prev_summary_state = []

# Used to track activation values for histogram.
self._activations = {}

# Used to cache the original layer call methods.
self._layer_calls = {"inner": {}, "outer": {}}

def _validate_kwargs(self, kwargs):
"""Handle arguments were supported in V1."""
if kwargs.get("write_grads", False):
Expand Down Expand Up @@ -2549,6 +2556,8 @@ def set_model(self, model):
self._should_write_train_graph = True
if self.embeddings_freq:
self._configure_embeddings()
if self.histogram_freq:
self._configure_layer_calls()

@property
def _train_writer(self):
Expand Down Expand Up @@ -2736,6 +2745,41 @@ def _init_profile_batch(self, profile_batch):
self._start_batch == 0 and self._stop_batch == 0
)

def _configure_layer_calls(self):
    """Configures the layer call functions to record activations.

    For each layer with trainable variables, creates a shapeless
    `tf.Variable` that holds the layer's most recent output and builds a
    wrapped `call` that copies the output into that variable. Both the
    original and the wrapped `call` are cached in `self._layer_calls` so
    the wrappers can be installed only for the duration of a training
    batch (see `_override_layer_calls` / `_restore_layer_calls`).

    Layers whose `output` attribute is not defined (e.g. layers of
    subclassed models that were never connected in a functional graph)
    are skipped, matching the documented behavior that only weight
    histograms are supported for subclassed models.
    """
    for layer in self.model.layers:
        # Layers without trainable variables get no weight histograms,
        # so activations are not tracked for them either.
        if not layer.trainable_variables:
            continue

        try:
            # `layer.output` raises AttributeError when the layer has
            # never been called functionally (subclassed models); skip
            # such layers instead of failing in `set_model`.
            output_dtype = layer.output.dtype
        except AttributeError:
            continue

        # Shape is left fully unspecified so outputs with any (possibly
        # varying) batch shape can be assigned between batches.
        self._activations[layer.name] = tf.Variable(
            initial_value=float("nan"),
            trainable=False,
            dtype=output_dtype,
            shape=tf.TensorShape(None),
        )
        self._layer_calls["inner"][layer.name] = layer.call

        def outer_call(
            inputs, *args, layer=layer, layer_call=layer.call, **kwargs
        ):
            # Run the original `call`, then capture its output for the
            # end-of-epoch histogram summary. `layer` and `layer_call`
            # are bound as defaults to avoid late-binding closure bugs.
            outputs = layer_call(inputs, *args, **kwargs)
            self._activations[layer.name].assign(outputs)
            return outputs

        self._layer_calls["outer"][layer.name] = outer_call

def _override_layer_calls(self):
"""Overrides the `call` method of each layer to record activations."""
for layer in self.model.layers:
if layer.name in self._layer_calls["outer"]:
layer.call = self._layer_calls["outer"][layer.name]

def _restore_layer_calls(self):
"""Restores the `call` method of each layer to its original value."""
for layer in self.model.layers:
if layer.name in self._layer_calls["inner"]:
layer.call = self._layer_calls["inner"][layer.name]

def on_train_begin(self, logs=None):
self._global_train_batch = 0
self._previous_epoch_iterations = 0
Expand Down Expand Up @@ -2779,6 +2823,9 @@ def on_train_batch_begin(self, batch, logs=None):
if self._global_train_batch == self._start_batch:
self._start_trace()

if self.histogram_freq:
self._override_layer_calls()

def on_train_batch_end(self, batch, logs=None):
if self._should_write_train_graph:
self._write_keras_model_train_graph()
Expand All @@ -2805,6 +2852,9 @@ def on_train_batch_end(self, batch, logs=None):
if self._is_tracing and self._global_train_batch >= self._stop_batch:
self._stop_trace()

if self.histogram_freq:
self._restore_layer_calls()

def on_epoch_begin(self, epoch, logs=None):
# Keeps track of epoch for profiling.
if self.write_steps_per_second:
Expand Down Expand Up @@ -2902,6 +2952,17 @@ def _log_weights(self, epoch):
self._log_weight_as_image(
weight, image_weight_name, epoch
)
if layer.name in self._activations:
activation_name = layer.name + "/activations"
# Add a suffix to prevent summary tag name collision.
histogram_activation_name = (
activation_name + "/histogram"
)
tf.summary.histogram(
histogram_activation_name,
self._activations[layer.name],
step=epoch,
)
self._train_writer.flush()

def _log_weight_as_image(self, weight, weight_name, epoch):
Expand Down
73 changes: 54 additions & 19 deletions keras/callbacks_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -1415,7 +1415,6 @@ def get_input_datasets():
return model, train_ds, callback, filepath

def _run_load_weights_on_restart_test_common_iterations(self):

(
model,
train_ds,
Expand Down Expand Up @@ -3162,15 +3161,33 @@ def test_TensorBoard_weight_histograms(self):
),
},
)
self.assertEqual(
self._strip_layer_names(summary_file.histograms, model_type),
{
_ObservedSummary(logdir=self.train_dir, tag="bias_0/histogram"),
_ObservedSummary(
logdir=self.train_dir, tag="kernel_0/histogram"
),
},
)
if "subclass" not in model_type:
self.assertEqual(
self._strip_layer_names(summary_file.histograms, model_type),
{
_ObservedSummary(
logdir=self.train_dir, tag="bias_0/histogram"
),
_ObservedSummary(
logdir=self.train_dir, tag="kernel_0/histogram"
),
_ObservedSummary(
logdir=self.train_dir, tag="activations/histogram"
),
},
)
else:
self.assertEqual(
self._strip_layer_names(summary_file.histograms, model_type),
{
_ObservedSummary(
logdir=self.train_dir, tag="bias_0/histogram"
),
_ObservedSummary(
logdir=self.train_dir, tag="kernel_0/histogram"
),
},
)

def test_TensorBoard_weight_images(self):
model = self._get_model()
Expand Down Expand Up @@ -3201,15 +3218,33 @@ def test_TensorBoard_weight_images(self):
),
},
)
self.assertEqual(
self._strip_layer_names(summary_file.histograms, model_type),
{
_ObservedSummary(logdir=self.train_dir, tag="bias_0/histogram"),
_ObservedSummary(
logdir=self.train_dir, tag="kernel_0/histogram"
),
},
)
if "subclass" not in model_type:
self.assertEqual(
self._strip_layer_names(summary_file.histograms, model_type),
{
_ObservedSummary(
logdir=self.train_dir, tag="bias_0/histogram"
),
_ObservedSummary(
logdir=self.train_dir, tag="kernel_0/histogram"
),
_ObservedSummary(
logdir=self.train_dir, tag="activations/histogram"
),
},
)
else:
self.assertEqual(
self._strip_layer_names(summary_file.histograms, model_type),
{
_ObservedSummary(
logdir=self.train_dir, tag="bias_0/histogram"
),
_ObservedSummary(
logdir=self.train_dir, tag="kernel_0/histogram"
),
},
)
if summary_file.convert_from_v2_summary_proto:
expected_image_summaries = {
_ObservedSummary(logdir=self.train_dir, tag="bias_0/image"),
Expand Down