From ce901ba24746e569e0935f513677d34c7f053d38 Mon Sep 17 00:00:00 2001
From: Ralph Castain
Date: Mon, 5 Feb 2018 19:31:43 -0800
Subject: [PATCH] Ensure we fail if remote nodes cannot find executable

Signed-off-by: Ralph Castain
---
 orte/mca/errmgr/default_orted/errmgr_default_orted.c | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/orte/mca/errmgr/default_orted/errmgr_default_orted.c b/orte/mca/errmgr/default_orted/errmgr_default_orted.c
index bce51638666..92cfc27e98a 100644
--- a/orte/mca/errmgr/default_orted/errmgr_default_orted.c
+++ b/orte/mca/errmgr/default_orted/errmgr_default_orted.c
@@ -594,6 +594,14 @@ static void proc_errors(int fd, short args, void *cbdata)
          * so that we send a consolidated error report
          * back to the HNP
          */
+        if (jdata->num_local_procs == jdata->num_terminated) {
+            /* let the state machine know */
+            if (ORTE_PROC_STATE_FAILED_TO_START == state) {
+                ORTE_ACTIVATE_JOB_STATE(jdata, ORTE_JOB_STATE_FAILED_TO_START);
+            } else {
+                ORTE_ACTIVATE_JOB_STATE(jdata, ORTE_JOB_STATE_FAILED_TO_LAUNCH);
+            }
+        }
         goto cleanup;
     }
 