fd6a044b7f
Properly set up the opal_process_info structure early in the initialization procedure. Define the local hostname right at the beginning of opal_init so all parts of opal can use it. Overlay that during orte_init, as the user may choose to remove the fqdn and strip prefixes during that time. Set up the job_session_dir and other such info as soon as it becomes available during orte_init.
155 строки
4.3 KiB
C
155 строки
4.3 KiB
C
/*
 * Copyright (c) 2013 The University of Tennessee and The University
 *                    of Tennessee Research Foundation. All rights
 *                    reserved.
 * Copyright (c) 2013 Inria. All rights reserved.
 * Copyright (c) 2014 Intel, Inc. All rights reserved.
 * $COPYRIGHT$
 *
 * Additional copyrights may follow
 *
 * $HEADER$
 */
|
|
|
|
#include "proc.h"
|
|
#include "opal/util/proc.h"
|
|
#include "opal/util/arch.h"
|
|
#include "opal/mca/dstore/dstore.h"
|
|
#include "opal/mca/pmix/pmix.h"
|
|
|
|
opal_process_info_t opal_process_info = {
|
|
.nodename = NULL,
|
|
.job_session_dir = NULL,
|
|
.proc_session_dir = NULL,
|
|
.num_local_peers = 0, /* there is nobody else but me */
|
|
.my_local_rank = 0, /* I'm the only process around here */
|
|
#if OPAL_HAVE_HWLOC
|
|
.cpuset = NULL,
|
|
#endif
|
|
};
|
|
|
|
static opal_proc_t opal_local_proc = {
|
|
{ .opal_list_next = NULL,
|
|
.opal_list_prev = NULL},
|
|
OPAL_NAME_INVALID,
|
|
0,
|
|
0,
|
|
NULL,
|
|
NULL
|
|
};
|
|
static opal_proc_t* opal_proc_my_name = &opal_local_proc;
|
|
|
|
/*
 * Constructor for opal_proc_t.
 *
 * Gives every field of a freshly created proc a defined value: the
 * architecture defaults to that of the local process and everything
 * else is cleared.
 *
 * @param proc  the object being constructed
 */
static void opal_proc_construct(opal_proc_t* proc)
{
    proc->proc_arch = opal_local_arch;
    proc->proc_convertor = NULL;
    proc->proc_flags = 0;
    proc->proc_name = 0;
    /* opal_get_proc_hostname() treats a non-NULL proc_hostname as an
     * already cached string and returns it as-is, so the field must
     * start out NULL rather than holding whatever the allocator left
     * behind (NOTE(review): assumes the object allocator does not zero
     * memory - confirm against the class system) */
    proc->proc_hostname = NULL;
}
|
|
|
|
/*
 * Destructor for opal_proc_t: puts the fields back to neutral values.
 * The hostname and convertor pointers are only cleared here, they are
 * not released by this function.
 *
 * @param proc  the object being destroyed
 */
static void opal_proc_destruct(opal_proc_t* proc)
{
    /* pointer members: forgotten, not freed */
    proc->proc_convertor = NULL;
    proc->proc_hostname = NULL;

    /* scalar members */
    proc->proc_name = 0;
    proc->proc_flags = 0;
}
|
|
|
|
/* Class instance for opal_proc_t: parent class opal_list_item_t, with
 * the constructor and destructor defined in this file. */
OBJ_CLASS_INSTANCE(opal_proc_t,
                   opal_list_item_t,
                   opal_proc_construct,
                   opal_proc_destruct);
|
|
|
|
static int
|
|
opal_compare_opal_procs(const opal_process_name_t proc1,
|
|
const opal_process_name_t proc2)
|
|
{
|
|
if( proc1 == proc2 ) return 0;
|
|
if( proc1 < proc2 ) return -1;
|
|
return 1;
|
|
}
|
|
|
|
opal_compare_proc_fct_t opal_compare_proc = opal_compare_opal_procs;
|
|
|
|
opal_proc_t* opal_proc_local_get(void)
|
|
{
|
|
return opal_proc_my_name;
|
|
}
|
|
|
|
/*
 * Install a proc as the local process.
 *
 * @param proc  the proc to register, or NULL to fall back to the
 *              static opal_local_proc
 * @return OPAL_SUCCESS in all cases
 */
int opal_proc_local_set(opal_proc_t* proc)
{
    /* nothing to do when the requested proc is already the current one */
    if (opal_proc_my_name == proc) {
        return OPAL_SUCCESS;
    }

    /* take a reference on the newcomer before letting go of the old proc */
    if (NULL != proc) {
        OBJ_RETAIN(proc);
    }

    /* the static fallback was never retained here, so it is never released */
    if (opal_proc_my_name != &opal_local_proc) {
        OBJ_RELEASE(opal_proc_my_name);
    }

    opal_proc_my_name = (NULL != proc) ? proc : &opal_local_proc;

    return OPAL_SUCCESS;
}
|
|
|
|
/* this function is used to temporarily set the local
|
|
* name while OPAL and upper layers are initializing,
|
|
* thus allowing debug messages to be more easily
|
|
* understood */
|
|
void opal_proc_set_name(opal_process_name_t *name)
|
|
{
|
|
opal_local_proc.proc_name = *name;
|
|
}
|
|
|
|
/**
 * The following functions are surrogates for the RTE functionality, and are not supposed
 * to be called. Instead, the corresponding function pointers should be set by the upper layer
 * before the call to opal_init, to make them point to the correct accessors based on the
 * underlying RTE.
 */
|
|
static char*
|
|
opal_process_name_print_should_never_be_called(const opal_process_name_t procname)
|
|
{
|
|
return "My Name is Nobody";
|
|
}
|
|
|
|
static uint32_t
|
|
opal_process_name_vpid_should_never_be_called(const opal_process_name_t unused)
|
|
{
|
|
return UINT_MAX;
|
|
}
|
|
|
|
char* (*opal_process_name_print)(const opal_process_name_t) = opal_process_name_print_should_never_be_called;
|
|
uint32_t (*opal_process_name_vpid)(const opal_process_name_t) = opal_process_name_vpid_should_never_be_called;
|
|
uint32_t (*opal_process_name_jobid)(const opal_process_name_t) = opal_process_name_vpid_should_never_be_called;
|
|
|
|
char* opal_get_proc_hostname(const opal_proc_t *proc)
|
|
{
|
|
int ret;
|
|
|
|
/* if the proc is NULL, then we can't know */
|
|
if (NULL == proc) {
|
|
return "unknown";
|
|
}
|
|
|
|
/* if it is my own hostname we are after, then just hand back
|
|
* the value in opal_process_info */
|
|
if (proc == opal_proc_my_name) {
|
|
return opal_process_info.nodename;
|
|
}
|
|
|
|
/* see if we already have the data - if so, pass it back */
|
|
if (NULL != proc->proc_hostname) {
|
|
return proc->proc_hostname;
|
|
}
|
|
|
|
/* if we don't already have it, then try to get it */
|
|
OPAL_MODEX_RECV_VALUE(ret, OPAL_DSTORE_HOSTNAME, proc,
|
|
(char**)&(proc->proc_hostname), OPAL_STRING);
|
|
if (OPAL_SUCCESS != ret) {
|
|
OPAL_ERROR_LOG(ret);
|
|
return "unknown"; // return something so the caller doesn't segfault
|
|
}
|
|
|
|
/* user is not allowed to release the data */
|
|
return proc->proc_hostname;
|
|
}
|