Ensure we don't incorrectly return a non-zero exit code when a Slurm job terminates normally.
Slurm, of course, must always be different... This commit was SVN r23371.
Этот коммит содержится в:
родитель
5d2233c950
Коммит
da61b69b15
@ -399,7 +399,11 @@ static int update_state(orte_jobid_t job,
|
|||||||
/* if we have ordered orteds to terminate, see if this one failed to tell
|
/* if we have ordered orteds to terminate, see if this one failed to tell
|
||||||
* us it had terminated
|
* us it had terminated
|
||||||
*/
|
*/
|
||||||
if (orte_orteds_term_ordered) {
|
if (orte_orteds_openend_term_ordered) {
|
||||||
|
record_dead_daemon(jdata, proc->vpid, state, 0);
|
||||||
|
check_job_complete(jdata);
|
||||||
|
break;
|
||||||
|
} else if (orte_orteds_term_ordered) {
|
||||||
record_dead_daemon(jdata, proc->vpid, state, exit_code);
|
record_dead_daemon(jdata, proc->vpid, state, exit_code);
|
||||||
check_job_complete(jdata);
|
check_job_complete(jdata);
|
||||||
break;
|
break;
|
||||||
|
@ -505,6 +505,7 @@ static int plm_slurm_terminate_orteds(void)
|
|||||||
/* tell them to die without sending a reply - we will rely on the
|
/* tell them to die without sending a reply - we will rely on the
|
||||||
* waitpid to tell us when they have exited!
|
* waitpid to tell us when they have exited!
|
||||||
*/
|
*/
|
||||||
|
orte_orteds_openend_term_ordered = true;
|
||||||
if (ORTE_SUCCESS != (rc = orte_plm_base_orted_exit(ORTE_DAEMON_EXIT_CMD))) {
|
if (ORTE_SUCCESS != (rc = orte_plm_base_orted_exit(ORTE_DAEMON_EXIT_CMD))) {
|
||||||
ORTE_ERROR_LOG(rc);
|
ORTE_ERROR_LOG(rc);
|
||||||
}
|
}
|
||||||
|
@ -96,6 +96,7 @@ bool orte_abnormal_term_ordered = false;
|
|||||||
bool orte_routing_is_enabled = false;
|
bool orte_routing_is_enabled = false;
|
||||||
bool orte_job_term_ordered = false;
|
bool orte_job_term_ordered = false;
|
||||||
bool orte_orteds_term_ordered = false;
|
bool orte_orteds_term_ordered = false;
|
||||||
|
bool orte_orteds_openend_term_ordered = false;
|
||||||
|
|
||||||
int orte_startup_timeout;
|
int orte_startup_timeout;
|
||||||
|
|
||||||
|
@ -604,6 +604,7 @@ ORTE_DECLSPEC extern bool orte_abnormal_term_ordered;
|
|||||||
ORTE_DECLSPEC extern bool orte_routing_is_enabled;
|
ORTE_DECLSPEC extern bool orte_routing_is_enabled;
|
||||||
ORTE_DECLSPEC extern bool orte_job_term_ordered;
|
ORTE_DECLSPEC extern bool orte_job_term_ordered;
|
||||||
ORTE_DECLSPEC extern bool orte_orteds_term_ordered;
|
ORTE_DECLSPEC extern bool orte_orteds_term_ordered;
|
||||||
|
ORTE_DECLSPEC extern bool orte_orteds_openend_term_ordered;
|
||||||
|
|
||||||
ORTE_DECLSPEC extern int orte_startup_timeout;
|
ORTE_DECLSPEC extern int orte_startup_timeout;
|
||||||
|
|
||||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user