Correct some logic for tracking launch progress
This commit was SVN r23122.
Этот коммит содержится в:
родитель
7ce34223f1
Коммит
b9f0615727
@@ -211,6 +211,16 @@ static int update_state(orte_jobid_t job,
|
|||||||
case ORTE_JOB_STATE_RUNNING:
|
case ORTE_JOB_STATE_RUNNING:
|
||||||
/* update all procs in job */
|
/* update all procs in job */
|
||||||
update_local_procs_in_job(jdata, jobstate, ORTE_PROC_STATE_RUNNING, 0);
|
update_local_procs_in_job(jdata, jobstate, ORTE_PROC_STATE_RUNNING, 0);
|
||||||
|
/* record that we reported */
|
||||||
|
jdata->num_daemons_reported++;
|
||||||
|
/* report if requested */
|
||||||
|
if (orte_report_launch_progress) {
|
||||||
|
if (0 == jdata->num_daemons_reported % 100 || jdata->num_daemons_reported == orte_process_info.num_procs) {
|
||||||
|
opal_output(orte_clean_output, "Reported: %d (out of %d) daemons - %d (out of %d) procs",
|
||||||
|
(int)jdata->num_daemons_reported, (int)orte_process_info.num_procs,
|
||||||
|
(int)jdata->num_launched, (int)jdata->num_procs);
|
||||||
|
}
|
||||||
|
}
|
||||||
break;
|
break;
|
||||||
case ORTE_JOB_STATE_NEVER_LAUNCHED:
|
case ORTE_JOB_STATE_NEVER_LAUNCHED:
|
||||||
orte_never_launched = true;
|
orte_never_launched = true;
|
||||||
|
@@ -336,7 +336,7 @@ static void process_msg(int fd, short event, void *data)
|
|||||||
ORTE_JOBID_PRINT(job)));
|
ORTE_JOBID_PRINT(job)));
|
||||||
|
|
||||||
name.jobid = job;
|
name.jobid = job;
|
||||||
running = true;
|
running = false;
|
||||||
/* get the job object */
|
/* get the job object */
|
||||||
if (NULL == (jdata = orte_get_job_data_object(job))) {
|
if (NULL == (jdata = orte_get_job_data_object(job))) {
|
||||||
ORTE_ERROR_LOG(ORTE_ERR_NOT_FOUND);
|
ORTE_ERROR_LOG(ORTE_ERR_NOT_FOUND);
|
||||||
@@ -421,8 +421,8 @@ static void process_msg(int fd, short event, void *data)
|
|||||||
ORTE_ERROR_LOG(rc);
|
ORTE_ERROR_LOG(rc);
|
||||||
goto CLEANUP;
|
goto CLEANUP;
|
||||||
}
|
}
|
||||||
if (ORTE_PROC_STATE_RUNNING != state) {
|
if (ORTE_PROC_STATE_RUNNING == state) {
|
||||||
running = false;
|
running = true;
|
||||||
}
|
}
|
||||||
/* unpack the exit code */
|
/* unpack the exit code */
|
||||||
count = 1;
|
count = 1;
|
||||||
@@ -447,8 +447,8 @@ static void process_msg(int fd, short event, void *data)
|
|||||||
} else {
|
} else {
|
||||||
rc = ORTE_SUCCESS;
|
rc = ORTE_SUCCESS;
|
||||||
}
|
}
|
||||||
|
jdata->num_daemons_reported++;
|
||||||
if (orte_report_launch_progress && running) {
|
if (orte_report_launch_progress && running) {
|
||||||
jdata->num_daemons_reported++;
|
|
||||||
if (0 == jdata->num_daemons_reported % 100 || jdata->num_daemons_reported == orte_process_info.num_procs) {
|
if (0 == jdata->num_daemons_reported % 100 || jdata->num_daemons_reported == orte_process_info.num_procs) {
|
||||||
opal_output(orte_clean_output, "Reported: %d (out of %d) daemons - %d (out of %d) procs",
|
opal_output(orte_clean_output, "Reported: %d (out of %d) daemons - %d (out of %d) procs",
|
||||||
(int)jdata->num_daemons_reported, (int)orte_process_info.num_procs,
|
(int)jdata->num_daemons_reported, (int)orte_process_info.num_procs,
|
||||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user