Skip to content

Commit

Permalink
fix load_state_dict error when loading class weights for multi-stage loss
Browse files Browse the repository at this point in the history
  • Loading branch information
drprojects committed Jul 21, 2023
1 parent b46a9d2 commit 6b9ac9a
Show file tree
Hide file tree
Showing 2 changed files with 27 additions and 8 deletions.
4 changes: 4 additions & 0 deletions configs/eval.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,10 @@ defaults:
- extras: default.yaml
- hydra: default.yaml

# experiment configs allow for version control of specific hyperparameters
# e.g. best hyperparameters for given model and datamodule
- experiment: null

# optional local config for machine/user specific settings
# it's optional since it doesn't need to exist and is excluded from version control
- optional local: default.yaml
Expand Down
31 changes: 23 additions & 8 deletions src/models/segmentation.py
Original file line number Diff line number Diff line change
Expand Up @@ -538,14 +538,29 @@ def configure_optimizers(self):
"reduce_on_plateau": reduce_on_plateau}}

def load_state_dict(self, state_dict, strict=True):
    """Basic `load_state_dict` from `torch.nn.Module` with a little
    bit of acrobatics due to `criterion.weight`.

    This attribute, when present in the `state_dict`, causes
    `load_state_dict` to crash. More precisely, `criterion.weight`
    holds the per-class weights for classification losses. For
    multi-stage losses the weights may instead appear under
    `criterion.<stage>.weight` keys, so all such keys must be
    stripped before loading and restored afterwards.

    Parameters
    ----------
    state_dict : dict
        State dictionary to load. May contain criterion class-weight
        entries, which are removed in place before loading.
    strict : bool
        Forwarded to the parent `load_state_dict`.
    """
    # Collect every 'criterion.weight' or 'criterion.*.weight' key.
    # NOTE: 'criterion.weight' itself matches, since it both starts
    # with 'criterion.' and ends with '.weight'.
    weight_keys = [
        k for k in state_dict
        if k.startswith('criterion.') and k.endswith('.weight')]

    # Recover the class weights from the first matching key (the
    # stages presumably share the same per-class weights — TODO
    # confirm) and remove all matching keys from the state_dict
    class_weight = state_dict.pop(weight_keys[0]) if weight_keys else None
    for k in weight_keys[1:]:
        state_dict.pop(k)

    # Load the state_dict without the offending criterion entries
    super().load_state_dict(state_dict, strict=strict)

    # If need be, assign the class weights back to the criterion
    if class_weight is not None and hasattr(self.criterion, 'weight'):
        self.criterion.weight = class_weight

@staticmethod
Expand Down

0 comments on commit 6b9ac9a

Please sign in to comment.