diff --git a/horovod/runner/elastic/driver.py b/horovod/runner/elastic/driver.py index 20a2dd7b97..18a697ab3f 100644 --- a/horovod/runner/elastic/driver.py +++ b/horovod/runner/elastic/driver.py @@ -187,7 +187,7 @@ def _discover_hosts(self): if update_res != HostUpdateResult.no_update: self._notify_workers_host_changes(self._host_manager.current_hosts, update_res) self._wait_hosts_cond.notify_all() - except RuntimeError as e: + except BaseException as e: if first_update: # Misconfiguration, fail the job immediately self._shutdown.set()