huggingface · younesbelkada · Mar 15, 2023 · Mar 10, 2023 · Mar 10, 2023
diff --git a/src/accelerate/accelerator.py b/src/accelerate/accelerator.py
@@ -1137,6 +1137,14 @@ def prepare_model(self, model: torch.nn.Module, device_placement=None):
             device_placement = self.device_placement and self.distributed_type != DistributedType.FSDP
         self._models.append(model)
         # We check only for models loaded with `accelerate`
+
+        # Check whether the model or any of its submodules has the attribute `hf_device_map`.
+        has_hf_device_map = False
+        for m in model.modules():
+            if hasattr(m, "hf_device_map"):
+                has_hf_device_map = True
+                break
+
         if getattr(model, "is_loaded_in_8bit", False) and getattr(model, "hf_device_map", False):
             model_devices = set(model.hf_device_map.values())
             if len(model_devices) > 1:
@@ -1157,7 +1165,7 @@ def prepare_model(self, model: torch.nn.Module, device_placement=None):
                 raise ValueError(
                     "You can't train a model that has been loaded in 8-bit precision with CPU or disk offload."
                 )
-        elif device_placement:
+        elif device_placement and not has_hf_device_map:
             model = model.to(self.device)
 
         if self.distributed_type == DistributedType.MULTI_GPU: