1
1

There seems to be a subtle race condition when we fail to spawn a

child. Marking the child as failed solve the issue.

This commit was SVN r15087.
Этот коммит содержится в:
George Bosilca 2007-06-14 22:36:47 +00:00
родитель a4d99ddef6
Коммит 35e824377e

Просмотреть файл

@ -241,7 +241,7 @@ static int orte_odls_process_kill_local_procs(orte_jobid_t job, bool set_state)
{ {
orte_odls_child_t *child; orte_odls_child_t *child;
opal_list_item_t *item, *next; opal_list_item_t *item, *next;
int rc, exit_status; int rc, exit_status = -1;
opal_list_t procs_killed; opal_list_t procs_killed;
orte_namelist_t *proc; orte_namelist_t *proc;
@ -1137,6 +1137,7 @@ DOFORK:
* across the entire cluster. Instead, we let orterun * across the entire cluster. Instead, we let orterun
* output a consolidated error message for us * output a consolidated error message for us
*/ */
child->state = ORTE_PROC_STATE_FAILED_TO_START;
quit_flag = true; quit_flag = true;
} }
/* reaquire lock so we don't double unlock... */ /* reaquire lock so we don't double unlock... */