Merge pull request #690 from mv1388/merge_callback_handlers
Merge callback handlers - merge BasicCallbacksHandler into the CallbacksHandler
mv1388 committed Jul 12, 2022
2 parents 13337d1 + 6386a0f commit 3a562e7
Showing 2 changed files with 101 additions and 267 deletions.
275 changes: 100 additions & 175 deletions aitoolbox/torchtrain/train_loop/components/callback_handler.py
@@ -4,182 +4,25 @@
from aitoolbox.utils.util import is_empty_function


class BasicCallbacksHandler:
class CallbacksHandler:
def __init__(self, train_loop_obj):
"""Callback handler used for the callback orchestration inside the TrainLoop
Common use of this handler is to call different methods inside the TrainLoop at different stages of the training
process. Thus execute desired callbacks' functionality at the desired point of the training process.
The purpose of this handler is to call the specified callback methods inside the TrainLoop at different stages of
the training process, thus executing the desired callbacks' functionality at the desired point of training.
At a given TrainLoop stage, the ``CallbacksHandler`` only executes those callback methods which implement
functionality intended for that particular stage.
Thus, `CallbacksHandler` doesn't unnecessarily execute callbacks at stages where they aren't implemented, i.e. where
their respective callback methods are left as ``pass`` and aren't overridden with the desired code logic.
Args:
train_loop_obj (aitoolbox.torchtrain.train_loop.TrainLoop): reference to the encapsulating TrainLoop
"""
self.train_loop_obj = train_loop_obj
self.callbacks_cache = []
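
For illustration only (not part of this diff; the AbstractCallback import path and the TrainLoop `epoch` attribute are assumptions), a minimal callback that overrides just on_epoch_end would be executed by this handler only at that single stage:

from aitoolbox.torchtrain.callbacks.abstract import AbstractCallback

class EpochEndReporter(AbstractCallback):
    def __init__(self):
        # callback_name is the only argument supplied here; execution_order
        # and device_idx_execution keep their defaults
        super().__init__('EpochEndReporter')

    def on_epoch_end(self):
        # self.train_loop_obj is injected via register_train_loop_object();
        # the `epoch` attribute name is an assumption used for illustration
        print(f'Epoch {self.train_loop_obj.epoch} finished')

All other stage methods stay as ``pass``, so the handler skips this callback everywhere except on_epoch_end.
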

def register_callbacks(self, callbacks, cache_callbacks=False):
"""Register TrainLoop object reference inside the listed callbacks when the TrainLoop is created
Normally, this is called from inside the train loop by the TrainLoop itself. Basically train loop "registers"
itself.
Args:
callbacks (list or None): list of callbacks
cache_callbacks (bool): should provided callbacks be cached and not yet registered. First subsequent time
this method is called without ``cache_callbacks`` enabled all the previously cached callbacks are added
and also registered with the current list of callbacks.
Returns:
None
"""
if cache_callbacks:
self.callbacks_cache += callbacks if callbacks is not None else []
else:
if len(self.callbacks_cache) > 0:
callbacks = self.callbacks_cache + (callbacks if callbacks is not None else [])

self.callbacks_cache = []

if callbacks is not None and len(callbacks) > 0:
self.enforce_callbacks_quality(callbacks)
self.train_loop_obj.callbacks += \
[cb.register_train_loop_object(self.train_loop_obj) for cb in callbacks
if self.train_loop_obj.device.index is None or
cb.device_idx_execution is None or
(cb.device_idx_execution is not None and cb.device_idx_execution == self.train_loop_obj.device.index)]

if not all(0 == cb.execution_order for cb in self.train_loop_obj.callbacks):
self.train_loop_obj.callbacks = sorted(self.train_loop_obj.callbacks, key=lambda cb: cb.execution_order)

def execute_epoch_begin(self):
for callback in self.train_loop_obj.callbacks:
callback.on_epoch_begin()

def execute_epoch_end(self):
for callback in self.train_loop_obj.callbacks:
callback.on_epoch_end()

def execute_train_begin(self):
for callback in self.train_loop_obj.callbacks:
callback.on_train_begin()

def execute_train_end(self):
for callback in self.train_loop_obj.callbacks:
callback.on_train_end()

def execute_batch_begin(self):
for callback in self.train_loop_obj.callbacks:
callback.on_batch_begin()

def execute_batch_end(self):
for callback in self.train_loop_obj.callbacks:
callback.on_batch_end()

def execute_gradient_update(self, optimizer_idx=0):
for callback in self.train_loop_obj.callbacks:
callback.on_after_gradient_update(optimizer_idx)

def execute_optimizer_step(self):
for callback in self.train_loop_obj.callbacks:
callback.on_after_optimizer_step()

def execute_multiprocess_start(self):
for callback in self.train_loop_obj.callbacks:
callback.on_multiprocess_start()

def mp_filter_callbacks(self):
self.train_loop_obj.callbacks = self._mp_filter_cb_list(self.train_loop_obj.callbacks)

def _mp_filter_cb_list(self, callbacks_list):
return [cb for cb in callbacks_list
if cb.device_idx_execution is None or
(cb.device_idx_execution is not None and cb.device_idx_execution == self.train_loop_obj.device.index)]

def enforce_callbacks_quality(self, callbacks):
for cb in callbacks:
if not isinstance(cb, AbstractCallback):
raise TypeError(f'Callback {cb} is not inherited from the AbstractCallback')

if cb.device_idx_execution is not None and self.train_loop_obj.device.index is not None:
if cb.device_idx_execution >= torch.cuda.device_count():
raise ValueError(f'Selected device_idx_execution of {cb.device_idx_execution} is too high. '
f'There are only {torch.cuda.device_count()} available GPU devices. '
f'Select index ranging from 0 to {torch.cuda.device_count() - 1}')

@staticmethod
def print_callback_info(callback_list):
return '\n'.join([f'\t{callback.callback_name}: {type(callback)}, execution_order: {callback.execution_order}'
for callback in callback_list])

def print_registered_callback_names(self):
print(self)

def __str__(self):
return 'CALLBACKS:\n' + self.print_callback_info(self.train_loop_obj.callbacks)

def __len__(self):
return len(self.train_loop_obj.callbacks)

def __add__(self, other):
"""
Args:
other (list): callbacks list
Returns:
BasicCallbacksHandler:
"""
self.register_callbacks(other)
return self

def __iadd__(self, other):
"""
Args:
other (list): callbacks list
Returns:
BasicCallbacksHandler:
"""
self.register_callbacks(other)
return self

def __contains__(self, item):
"""
Args:
item:
Returns:
bool:
"""
if type(item) == str:
for cb in self.train_loop_obj.callbacks:
if cb.callback_name == item:
return True
else:
for cb in self.train_loop_obj.callbacks:
if type(cb) == item:
return True
return False


class CallbacksHandler(BasicCallbacksHandler):
def __init__(self, train_loop_obj):
"""Callback handler used for the callback orchestration inside the TrainLoop
Compared to `BasicCallbacksHandler`, this handler will at certain TrainLoop stage only execute those
callbacks which have implemented the functionality intended to be executed at this particular stage.
Thus, `CallbacksHandler` doesn't unnecessarily execute callbacks at stages they are not implemented at.
Common use of this handler is to call different methods inside the TrainLoop at different stages of the training
process. Thus execute desired callbacks' functionality at the desired point of the training process.
Args:
train_loop_obj (aitoolbox.torchtrain.train_loop.TrainLoop): reference to the encapsulating TrainLoop
"""
super().__init__(train_loop_obj)

self.cbs_on_epoch_begin = []
self.cbs_on_epoch_end = []
self.cbs_on_train_begin = []
@@ -201,8 +44,8 @@ def __init__(self, train_loop_obj):
def register_callbacks(self, callbacks, cache_callbacks=False):
"""Register TrainLoop object reference inside the listed callbacks when the TrainLoop is created
Normally, this is called from inside of the train loop by the TrainLoop itself. Basically train loop "registers"
itself.
Normally, this is called from inside the train loop by the TrainLoop itself. Basically train loop "registers"
itself with each of the provided callbacks.
Args:
callbacks (list or None): list of callbacks
@@ -215,14 +58,26 @@ def register_callbacks(self, callbacks, cache_callbacks=False):
"""
if cache_callbacks:
# Just filling the self.callbacks_cache list with callbacks
super().register_callbacks(callbacks, cache_callbacks=cache_callbacks)
self.callbacks_cache += callbacks if callbacks is not None else []
else:
# hack since self.callbacks_cache is emptied by the super().register_callbacks()
callbacks_cache = self.callbacks_cache
super().register_callbacks(callbacks, cache_callbacks=cache_callbacks)
# Retrieve cached callbacks from self.callbacks_cache and combine with current callbacks
callbacks = callbacks_cache + (callbacks if callbacks is not None else [])
# Combine any previously cached callbacks with new callbacks
# If there aren't any callbacks cached then the callback cache is just an empty list
callbacks = self.callbacks_cache + (callbacks if callbacks is not None else [])
# Empty the callbacks cache
self.callbacks_cache = []

if callbacks is not None and len(callbacks) > 0:
self.enforce_callbacks_quality(callbacks)
self.train_loop_obj.callbacks += [
cb.register_train_loop_object(self.train_loop_obj) for cb in callbacks
if self.train_loop_obj.device.index is None or
cb.device_idx_execution is None or
(cb.device_idx_execution is not None and cb.device_idx_execution == self.train_loop_obj.device.index)
]

if not all(0 == cb.execution_order for cb in self.train_loop_obj.callbacks):
self.train_loop_obj.callbacks = sorted(self.train_loop_obj.callbacks, key=lambda cb: cb.execution_order)

self.split_on_execution_position(callbacks, register_train_loop=False)
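
A hedged usage sketch of the caching flow implemented above (`train_loop` and the callback objects are placeholders, not part of this diff):

handler = CallbacksHandler(train_loop)
handler.register_callbacks([early_stopping_cb], cache_callbacks=True)   # only cached, not yet registered
handler.register_callbacks([model_checkpoint_cb])   # cache is flushed: both callbacks get registered together
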

def execute_epoch_begin(self):
@@ -304,7 +159,7 @@ def split_on_execution_position(self, callbacks, register_train_loop=False):
cbs_at_position.sort(key=lambda cb: cb.execution_order)

def mp_filter_callbacks(self):
super().mp_filter_callbacks()
self.train_loop_obj.callbacks = self._mp_filter_cb_list(self.train_loop_obj.callbacks)
self.cbs_on_epoch_begin = self._mp_filter_cb_list(self.cbs_on_epoch_begin)
self.cbs_on_epoch_end = self._mp_filter_cb_list(self.cbs_on_epoch_end)
self.cbs_on_train_begin = self._mp_filter_cb_list(self.cbs_on_train_begin)
@@ -323,6 +178,22 @@ def mp_filter_callbacks(self):
self.cbs_on_multiprocess_start
]

def _mp_filter_cb_list(self, callbacks_list):
return [cb for cb in callbacks_list
if cb.device_idx_execution is None or
(cb.device_idx_execution is not None and cb.device_idx_execution == self.train_loop_obj.device.index)]

def enforce_callbacks_quality(self, callbacks):
for cb in callbacks:
if not isinstance(cb, AbstractCallback):
raise TypeError(f'Callback {cb} is not inherited from the AbstractCallback')

if cb.device_idx_execution is not None and self.train_loop_obj.device.index is not None:
if cb.device_idx_execution >= torch.cuda.device_count():
raise ValueError(f'Selected device_idx_execution of {cb.device_idx_execution} is too high. '
f'There are only {torch.cuda.device_count()} available GPU devices. '
f'Select index ranging from 0 to {torch.cuda.device_count() - 1}')
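
To illustrate the device_idx_execution checks above, a sketch of a callback pinned to a single GPU process (passing device_idx_execution through the AbstractCallback constructor is an assumption; not part of this diff):

class MainGPUOnlyReport(AbstractCallback):
    def __init__(self):
        # Pin the callback to the process driving GPU index 0; on other ranks
        # register_callbacks() and mp_filter_callbacks() drop it
        super().__init__('MainGPUOnlyReport', device_idx_execution=0)

    def on_train_end(self):
        print('Training finished (reported only from the device index 0 process)')
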

def __str__(self):
return 'CALLBACKS\n' \
f'At on_epoch_begin:\n{self.print_callback_info(self.cbs_on_epoch_begin)}\n' \
@@ -334,3 +205,57 @@ def __str__(self):
f'At on_after_gradient_update:\n{self.print_callback_info(self.cbs_on_after_gradient_update)}\n' \
f'At on_after_optimizer_step:\n{self.print_callback_info(self.cbs_on_after_optimizer_step)}\n' \
f'At on_multiprocess_start:\n{self.print_callback_info(self.cbs_on_multiprocess_start)}'

@staticmethod
def print_callback_info(callback_list):
return '\n'.join([f'\t{callback.callback_name}: {type(callback)}, execution_order: {callback.execution_order}'
for callback in callback_list])

def print_registered_callback_names(self):
print(self)

def __len__(self):
return len(self.train_loop_obj.callbacks)

def __add__(self, other):
"""
Args:
other (list): callbacks list
Returns:
CallbacksHandler:
"""
self.register_callbacks(other)
return self

def __iadd__(self, other):
"""
Args:
other (list): callbacks list
Returns:
CallbacksHandler:
"""
self.register_callbacks(other)
return self
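
Illustrative use of the operator overloads above (the callbacks reuse the placeholder classes from the earlier sketches):

handler += [EpochEndReporter(), MainGPUOnlyReport()]   # equivalent to handler.register_callbacks([...])
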

def __contains__(self, item):
"""
Args:
item:
Returns:
bool:
"""
if type(item) == str:
for cb in self.train_loop_obj.callbacks:
if cb.callback_name == item:
return True
else:
for cb in self.train_loop_obj.callbacks:
if type(cb) == item:
return True
return False
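
And a membership-check sketch matching the __contains__ logic above (again using the earlier illustrative callbacks):

if 'EpochEndReporter' in handler:      # lookup by callback_name string
    print('reporter registered')
if MainGPUOnlyReport in handler:       # lookup by callback class
    print('main-GPU report registered')
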
