Add OPAL_TRACE calls to the orted daemon and orterun so we can tell when their callbacks are being exercised.
This commit was SVN r7432.
This commit is contained in:
parent
d81726833e
commit
86a43b1d29
@ -31,40 +31,41 @@
|
||||
#include <errno.h>
|
||||
#include <signal.h>
|
||||
|
||||
#include "include/orte_constants.h"
|
||||
#include "orte/include/orte_constants.h"
|
||||
|
||||
#include "opal/event/event.h"
|
||||
#include "opal/mca/base/base.h"
|
||||
#include "opal/threads/mutex.h"
|
||||
#include "opal/threads/condition.h"
|
||||
|
||||
#include "dps/dps.h"
|
||||
#include "opal/util/opal_environ.h"
|
||||
#include "opal/util/output.h"
|
||||
#include "opal/util/show_help.h"
|
||||
#include "util/sys_info.h"
|
||||
#include "opal/event/event.h"
|
||||
#include "opal/util/os_path.h"
|
||||
#include "opal/util/cmd_line.h"
|
||||
#include "util/proc_info.h"
|
||||
#include "util/univ_info.h"
|
||||
#include "util/session_dir.h"
|
||||
#include "opal/util/printf.h"
|
||||
#include "opal/util/daemon_init.h"
|
||||
#include "util/universe_setup_file_io.h"
|
||||
#include "opal/util/opal_environ.h"
|
||||
#include "opal/util/os_path.h"
|
||||
#include "opal/util/output.h"
|
||||
#include "opal/util/printf.h"
|
||||
#include "opal/util/show_help.h"
|
||||
#include "opal/util/trace.h"
|
||||
|
||||
#include "mca/base/base.h"
|
||||
#include "mca/errmgr/errmgr.h"
|
||||
#include "mca/ns/ns.h"
|
||||
#include "mca/ns/base/base.h"
|
||||
#include "mca/gpr/gpr.h"
|
||||
#include "mca/rml/rml.h"
|
||||
#include "mca/soh/soh.h"
|
||||
#include "mca/rmgr/rmgr.h"
|
||||
#include "mca/rmgr/base/base.h"
|
||||
#include "mca/soh/base/base.h"
|
||||
#include "orte/dps/dps.h"
|
||||
#include "orte/util/sys_info.h"
|
||||
#include "orte/util/proc_info.h"
|
||||
#include "orte/util/univ_info.h"
|
||||
#include "orte/util/session_dir.h"
|
||||
#include "orte/util/universe_setup_file_io.h"
|
||||
|
||||
#include "runtime/runtime.h"
|
||||
#include "orte/mca/errmgr/errmgr.h"
|
||||
#include "orte/mca/ns/ns.h"
|
||||
#include "orte/mca/ns/base/base.h"
|
||||
#include "orte/mca/gpr/gpr.h"
|
||||
#include "orte/mca/rml/rml.h"
|
||||
#include "orte/mca/soh/soh.h"
|
||||
#include "orte/mca/rmgr/rmgr.h"
|
||||
#include "orte/mca/rmgr/base/base.h"
|
||||
#include "orte/mca/soh/base/base.h"
|
||||
|
||||
#include "tools/orted/orted.h"
|
||||
#include "orte/runtime/runtime.h"
|
||||
|
||||
#include "orte/tools/orted/orted.h"
|
||||
|
||||
extern char **environ;
|
||||
|
||||
@ -434,6 +435,8 @@ int main(int argc, char *argv[])
|
||||
|
||||
static void signal_callback(int fd, short flags, void *arg)
|
||||
{
|
||||
OPAL_TRACE(1);
|
||||
|
||||
orted_globals.exit_condition = true;
|
||||
opal_condition_signal(&orted_globals.condition);
|
||||
}
|
||||
@ -448,6 +451,8 @@ static void orte_daemon_recv(int status, orte_process_name_t* sender,
|
||||
size_t n;
|
||||
char *contact_info;
|
||||
|
||||
OPAL_TRACE(1);
|
||||
|
||||
OPAL_THREAD_LOCK(&orted_globals.mutex);
|
||||
|
||||
if (orted_globals.debug_daemons) {
|
||||
@ -535,6 +540,8 @@ void job_state_callback(orte_gpr_notify_data_t *data, void *cbdata)
|
||||
size_t i, j, k;
|
||||
int rc;
|
||||
|
||||
OPAL_TRACE(1);
|
||||
|
||||
/* we made sure in the subscriptions that at least one
|
||||
* value is always returned
|
||||
* get the jobid from the segment name in the first value
|
||||
|
@ -30,31 +30,33 @@
|
||||
#include <sys/types.h>
|
||||
#include <sys/wait.h>
|
||||
|
||||
#include "include/orte_constants.h"
|
||||
|
||||
#include "opal/event/event.h"
|
||||
#include "class/orte_pointer_array.h"
|
||||
#include "util/proc_info.h"
|
||||
#include "opal/util/argv.h"
|
||||
#include "opal/util/opal_environ.h"
|
||||
#include "opal/util/path.h"
|
||||
#include "opal/util/cmd_line.h"
|
||||
#include "util/sys_info.h"
|
||||
#include "opal/util/output.h"
|
||||
#include "util/universe_setup_file_io.h"
|
||||
#include "opal/util/show_help.h"
|
||||
#include "opal/util/basename.h"
|
||||
#include "opal/mca/base/base.h"
|
||||
#include "opal/threads/condition.h"
|
||||
#include "opal/util/argv.h"
|
||||
#include "opal/util/basename.h"
|
||||
#include "opal/util/cmd_line.h"
|
||||
#include "opal/util/opal_environ.h"
|
||||
#include "opal/util/output.h"
|
||||
#include "opal/util/path.h"
|
||||
#include "opal/util/show_help.h"
|
||||
#include "opal/util/trace.h"
|
||||
|
||||
#include "mca/base/base.h"
|
||||
#include "mca/ns/ns.h"
|
||||
#include "mca/gpr/gpr.h"
|
||||
#include "mca/rmgr/rmgr.h"
|
||||
#include "mca/schema/schema.h"
|
||||
#include "mca/errmgr/errmgr.h"
|
||||
#include "orte/include/orte_constants.h"
|
||||
|
||||
#include "runtime/runtime.h"
|
||||
#include "runtime/orte_wait.h"
|
||||
#include "orte/class/orte_pointer_array.h"
|
||||
#include "orte/util/proc_info.h"
|
||||
#include "orte/util/sys_info.h"
|
||||
#include "orte/util/universe_setup_file_io.h"
|
||||
|
||||
#include "orte/mca/ns/ns.h"
|
||||
#include "orte/mca/gpr/gpr.h"
|
||||
#include "orte/mca/rmgr/rmgr.h"
|
||||
#include "orte/mca/schema/schema.h"
|
||||
#include "orte/mca/errmgr/errmgr.h"
|
||||
|
||||
#include "orte/runtime/runtime.h"
|
||||
#include "orte/runtime/orte_wait.h"
|
||||
|
||||
#include "orterun.h"
|
||||
#include "totalview.h"
|
||||
@ -432,6 +434,8 @@ static void dump_aborted_procs(orte_jobid_t jobid)
|
||||
NULL
|
||||
};
|
||||
|
||||
OPAL_TRACE(1);
|
||||
|
||||
/* query the job segment on the registry */
|
||||
if(ORTE_SUCCESS != (rc = orte_schema.get_job_segment_name(&segment, jobid))) {
|
||||
ORTE_ERROR_LOG(rc);
|
||||
@ -532,6 +536,8 @@ static void dump_aborted_procs(orte_jobid_t jobid)
|
||||
|
||||
static void job_state_callback(orte_jobid_t jobid, orte_proc_state_t state)
|
||||
{
|
||||
OPAL_TRACE(1);
|
||||
|
||||
OPAL_THREAD_LOCK(&orterun_globals.lock);
|
||||
|
||||
/* Note that there's only two states that we're interested in
|
||||
@ -579,6 +585,8 @@ static void job_state_callback(orte_jobid_t jobid, orte_proc_state_t state)
|
||||
|
||||
static void exit_callback(int fd, short event, void *arg)
|
||||
{
|
||||
OPAL_TRACE(1);
|
||||
|
||||
opal_show_help("help-orterun.txt", "orterun:abnormal-exit",
|
||||
true, orterun_basename, orterun_basename);
|
||||
|
||||
@ -606,6 +614,9 @@ static void signal_callback(int fd, short flags, void *arg)
|
||||
opal_event_t* event;
|
||||
|
||||
static int signalled = 0;
|
||||
|
||||
OPAL_TRACE(1);
|
||||
|
||||
if (0 != signalled++) {
|
||||
return;
|
||||
}
|
||||
|
Loading…
Reference in new issue
Block a user