Robustify configurable, more options for testrun and contrib changes #138

Merged · 7 commits · Jul 22, 2022
2 changes: 1 addition & 1 deletion .github/workflows/tests.yml
@@ -12,7 +12,7 @@ jobs:
     runs-on: ubuntu-latest
     strategy:
       matrix:
-        python-version: [3.6, 3.7, 3.8]
+        python-version: [3.7, 3.8]

     steps:
       - uses: actions/checkout@v2
3 changes: 0 additions & 3 deletions azure-pipelines.yml
@@ -12,9 +12,6 @@ trigger:

 strategy:
   matrix:
-    Python36:
-      IMAGE_NAME: 'ubuntu-18.04'
-      python.version: '3.6'
     Python37:
       IMAGE_NAME: 'ubuntu-18.04'
       python.version: '3.7'
49 changes: 44 additions & 5 deletions padertorch/configurable.py
@@ -434,10 +434,21 @@ def from_config(
         """Produce a Configurable instance from a valid config."""
         # TODO: assert do not use defaults

+        if isinstance(config, _DogmaticConfig):
+            config = config.to_dict()  # if called in finalize_dogmatic dict
         assert 'factory' in config, (cls, config)
         if cls is not Configurable:
+
+            if cls.__module__ == '__main__':
+                # When a class is defined in the main script, it will be
+                # __main__.<ModelName>, but it should be <script>.<ModelName>.
+                # This fix is active when the script is called with
+                # "python -m <script> ..."
+                # but not when it is called with "python <script>.py ...".
+                # pylint: disable=self-cls-assignment
+                cls = import_class(class_to_str(cls))
+
             assert issubclass(import_class(config['factory']), cls), \
                 (config['factory'], cls)
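The `__main__` fix above is the core robustification: `class_to_str` followed by `import_class` re-resolves a class defined in the launched script under its importable module name. A minimal stdlib-only sketch of the same idea (the helper name `resolve_main_class` is hypothetical, not part of this diff):

    import importlib
    import sys

    def resolve_main_class(cls):
        # Under "python -m <script>", __main__.__spec__ names the real
        # module; under "python <script>.py" it is None, so the fix
        # cannot apply there (matching the comment in the diff).
        if cls.__module__ == '__main__':
            spec = sys.modules['__main__'].__spec__
            if spec is not None:
                module = importlib.import_module(spec.name)
                cls = getattr(module, cls.__qualname__)
        return cls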
@@ -1321,6 +1332,10 @@ def config_to_instance(config, strict=False):
     >>> config_to_instance(config)
     <class 'torch.nn.modules.linear.Linear'>
     """
+
+    if isinstance(config, _DogmaticConfig):
+        config = config.to_dict()  # if called in finalize_dogmatic dict
+
     if isinstance(config, dict):
         special_key = _get_special_key(config)
         if special_key:
@@ -1534,7 +1549,7 @@ def _sacred_dogmatic_to_dict(config):
     return config


-def _get_signature(cls, drop_positional_only=False):
+def _get_signature(cls, drop_positional_only=False, drop_type_annotations=False):
     """

     >>> _get_signature(dict)
@@ -1555,6 +1570,12 @@ def _get_signature(cls, drop_positional_only=False):
     ...
     ValueError: no signature found for builtin type <class 'set'>

+
+    >>> _get_signature(Configurable.from_file)
+    <Signature (config_path: pathlib.Path, in_config_path: str = '', consider_mpi=False)>
+    >>> _get_signature(Configurable.from_file, drop_type_annotations=True)
+    <Signature (config_path, in_config_path='', consider_mpi=False)>
+
     """
     if cls in [
         set,  # py38: set missing signature
@@ -1567,7 +1588,7 @@ def _get_signature(cls, drop_positional_only=False):
                 default=(),
             )]
         )
-    elif cls in [dict]:
+    elif cls.__init__ in [dict.__init__]:
         # Dict has no correct signature, hence return the signature, that is
         # needed here.
         sig = inspect.Signature(
@@ -1586,6 +1607,15 @@ def _get_signature(cls, drop_positional_only=False):
             if p.kind != inspect.Parameter.POSITIONAL_ONLY
         ]
     )
+    if drop_type_annotations:
+        sig = sig.replace(
+            parameters=[
+                p.replace(annotation=p.empty)
+                for p in sig.parameters.values()
+            ],
+            return_annotation=sig.empty
+        )
+
     return sig

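The annotation stripping above needs only the stdlib `inspect` API. A self-contained sketch of the same technique (`from_file` here is a toy function mirroring the doctest):

    import inspect
    from pathlib import Path

    def from_file(config_path: Path, in_config_path: str = '', consider_mpi=False):
        pass

    sig = inspect.signature(from_file)
    bare = sig.replace(
        parameters=[
            p.replace(annotation=p.empty)  # drop each parameter annotation
            for p in sig.parameters.values()
        ],
        return_annotation=sig.empty,       # drop the return annotation
    )
    print(bare)  # (config_path, in_config_path='', consider_mpi=False)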
@@ -1609,7 +1639,16 @@ def get_signature(factory):
     """
     if factory in [tuple, list, set, dict]:
         return {}
-    sig = inspect.signature(factory)
+    try:
+        sig = inspect.signature(factory)
+    except ValueError:
+        if factory.__init__ in [tuple.__init__, list.__init__, set.__init__, dict.__init__]:
+            # Builtin type is in the MRO and __init__ is not overwritten, e.g.
+            # ValueError: no signature found for builtin type <class 'paderbox.utils.mapping.Dispatcher'>
+            return {}
+        else:
+            raise
+
     defaults = {}
     param: inspect.Parameter
     for name, param in sig.parameters.items():
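To illustrate the failure mode the new try/except guards against: on the targeted Python versions (3.7/3.8), a class that inherits `__init__` from a builtin has no introspectable signature. A minimal sketch with a local stand-in for `paderbox.utils.mapping.Dispatcher`:

    import inspect

    class Dispatcher(dict):
        """Stand-in: a dict subclass that does not override __init__."""

    try:
        inspect.signature(Dispatcher)
    except ValueError as e:
        print(e)  # no signature found for builtin type <class '...Dispatcher'>

    # The new branch detects this case and returns no defaults:
    assert Dispatcher.__init__ is dict.__init__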
@@ -1800,7 +1839,7 @@ def _check_redundant_keys(self, msg):
             f'{msg}\n'
             f'Too many keywords for the factory {imported}.\n'
             f'Redundant keys: {redundant_keys}\n'
-            f'Signature: {_get_signature(imported)}\n'
+            f'Signature: {_get_signature(imported, drop_type_annotations=True)}\n'
             f'Current config with fallbacks:\n{pretty(self.data)}'
         )

@@ -1946,7 +1985,7 @@ def to_dict(self):
         except KeyError as ex:
             from IPython.lib.pretty import pretty
             if self.special_key == 'factory' \
-                    and self.special_key in self._key_candidates() and \
+                    and self.special_key in self._key_candidates() and \
                     k != self.special_key:
                 # KeyError has a bad __repr__, use Exception
                 missing_keys = set(self._key_candidates()) - set(self.data.keys())
42 changes: 38 additions & 4 deletions padertorch/contrib/cb/tensorboard_symlink_tree.py
@@ -1,7 +1,7 @@
 """
 Create a symlink tree for all specified files in the current folder.

-python -m padertorch.contrib.cb.tensorboard_symlink_tree ../*/*tfevents*
+python -m padertorch.contrib.cb.tensorboard_symlink_tree ../*/*tfevents* --max_age=1days

 Usecase:
@@ -28,8 +28,13 @@
 Because of this I created a Makefile in that folder:

     .../tensorboard$ cat Makefile
+    symlink_tree1day:
+        find . -xtype l -delete  # Remove broken symlinks: https://unix.stackexchange.com/a/314975/283777
+        python -m padertorch.contrib.cb.tensorboard_symlink_tree --prefix=.. ../*/*tfevents* --max_age=1days
+
     symlink_tree:
-        python -m padertorch.contrib.cb.tensorboard_symlink_tree ../*/*tfevents*
+        find . -xtype l -delete  # Remove broken symlinks: https://unix.stackexchange.com/a/314975/283777
+        python -m padertorch.contrib.cb.tensorboard_symlink_tree --prefix=.. ../*/*tfevents*

     tensorboard:
         date && $(cd .../tensorboard && ulimit -v 10000000 && tensorboard --bind_all -v 1 --logdir=. --port=...) && date || date
@@ -38,22 +43,51 @@

 import os
 from pathlib import Path
+import datetime

 import paderbox as pb


-def main(*files, prefix=None):
+def main(*files, prefix=None, max_age=None):
     if prefix is None:
         prefix = os.path.commonpath(files)
     print('Common Prefix', prefix)
     print('Create')

+    files = [Path(f) for f in files]
+
+    if max_age is not None:
+        # The pandas import is slow, but pd.Timedelta
+        # accepts many styles for time
+        # (e.g. '1day')
+        import pandas as pd
+        max_age = pd.Timedelta(max_age)
+        now = pd.Timestamp('now')
+
+    files = sorted(files, key=lambda file: file.stat().st_mtime)
+
     for file in files:
-        file = Path(file)
         link_name = file.relative_to(prefix)
+        if max_age is not None:
+            last_modified = file.stat().st_mtime
+            last_modified = datetime.datetime.fromtimestamp(last_modified)
+
+            if max_age > now - last_modified:
+                # Create the symlink if it doesn't exist.
+                pass
+            else:
+                if not link_name.is_symlink():
+                    print(f'Skip {file}, it is {now - last_modified} > {max_age} old.')
+                    continue
+
         link_name.parent.mkdir(exist_ok=True)
         source = os.path.relpath(file, link_name.parent)
         if not link_name.exists():
             print(f'\t{link_name} -> {source}')
+
+        # Create the symlink if it does not exist,
+        # or check that the symlink points to the
+        # same file.
         pb.io.symlink(source, link_name)
     print('Finish')
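The new `--max_age` option leans on pandas for its flexible duration parsing, which is why the import happens lazily. A short sketch of the age check, assuming an mtime taken from `file.stat().st_mtime` (the literal timestamp is an arbitrary example):

    import datetime
    import pandas as pd

    max_age = pd.Timedelta('1days')  # also accepts '1day', '24h', ...
    now = pd.Timestamp('now')
    last_modified = datetime.datetime.fromtimestamp(1_650_000_000)

    if max_age > now - last_modified:
        print('fresh enough: (re)create the symlink')
    else:
        print(f'Skip, it is {now - last_modified} > {max_age} old.')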
6 changes: 3 additions & 3 deletions padertorch/contrib/cb/track.py
@@ -391,7 +391,7 @@ def get_shape(self, obj):
         try:
             return list(obj.shape)
         except AttributeError:
-            return 'unknown'
+            return '?'

     def pre(self, module, input):
         self.input_shape = self.get_shape(input)
@@ -655,7 +655,7 @@ def post(self, module, input, output):
         self.maybe_add(t, 'tensors_learnable', 'tensors_fixed')

     def _to_str(self, value):
-        return f'{value:6}'
+        return f'{value:6_}'

     @property
     def data(self):
@@ -706,7 +706,7 @@ def get_size(self, tensor):
         return tensor.nelement() * tensor.element_size()

     def _to_str(self, value):
-        return f'{value:6} B'
+        return f'{value:6_} B'

     @property
     def data(self):
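The only change to `_to_str` is the format spec: the `_` option (available since Python 3.6) groups integer digits with underscores, so large parameter counts and byte sizes stay readable:

    print(f'{1234567:6}')     # 1234567
    print(f'{1234567:6_}')    # 1_234_567
    print(f'{1234567:6_} B')  # 1_234_567 B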
14 changes: 12 additions & 2 deletions padertorch/train/runtime_tests.py
@@ -81,6 +81,9 @@ def test_run(
         *,
         deterministic_atol=1e-5,
         deterministic_rtol=1e-5,
+        loss_atol=1e-6,
+        loss_rtol=1e-6,
+        virtual_minibatch_size=None,
 ):
     """

@@ -139,6 +142,13 @@ def backup_state_dict(trainer: pt.Trainer):
         'epoch',
         new=-1,
     ))
+    if virtual_minibatch_size is not None:
+        assert virtual_minibatch_size > 0, virtual_minibatch_size
+        exit_stack.enter_context(mock.patch.object(
+            trainer,
+            'virtual_minibatch_size',
+            new=virtual_minibatch_size,
+        ))

     class SpyMagicMock(mock.MagicMock):
         def __init__(self, *args, **kw):
@@ -316,8 +326,8 @@ def trainer_step_mock_to_inputs_output_review(review_mock):
     # nested_test_assert_allclose(dt4['review'], dt8['review'])

     # Expect that the initial loss is equal for two runs
-    nested_test_assert_allclose(dt1['loss'], dt5['loss'], rtol=1e-6, atol=1e-6)
-    nested_test_assert_allclose(dt2['loss'], dt6['loss'], rtol=1e-6, atol=1e-6)
+    nested_test_assert_allclose(dt1['loss'], dt5['loss'], rtol=loss_rtol, atol=loss_atol)
+    nested_test_assert_allclose(dt2['loss'], dt6['loss'], rtol=loss_rtol, atol=loss_atol)
     try:
         with np.testing.assert_raises(AssertionError):
             # Expect that the loss changes after training.
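The `virtual_minibatch_size` override follows the same pattern as the existing `epoch` patch: `mock.patch.object` entered on the shared `ExitStack` swaps the attribute for the duration of the test and restores it on exit. A self-contained sketch with a dummy object standing in for the trainer:

    import contextlib
    from unittest import mock

    class DummyTrainer:
        virtual_minibatch_size = 8

    trainer = DummyTrainer()
    with contextlib.ExitStack() as exit_stack:
        exit_stack.enter_context(mock.patch.object(
            trainer,
            'virtual_minibatch_size',
            new=2,
        ))
        assert trainer.virtual_minibatch_size == 2
    assert trainer.virtual_minibatch_size == 8  # restored when the stack closes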
6 changes: 6 additions & 0 deletions padertorch/train/trainer.py
@@ -156,6 +156,9 @@ def test_run(
             temporary_directory=None,
             deterministic_atol=1e-5,
             deterministic_rtol=1e-5,
+            loss_atol=1e-6,
+            loss_rtol=1e-6,
+            virtual_minibatch_size=None,
     ):
         """
         Run a test on the trainer instance (i.e. model test).
Expand Down Expand Up @@ -193,6 +196,9 @@ def test_run(
temporary_directory=temporary_directory,
deterministic_atol=deterministic_atol,
deterministic_rtol=deterministic_rtol,
loss_atol=loss_atol,
loss_rtol=loss_rtol,
virtual_minibatch_size=virtual_minibatch_size,
)

def train(
Expand Down