a89dc623b0
anything for non-MPI apps. Oops! (But before you freak out, gentle reader, note that mpi_paffinity_alone for MPI apps still worked fine) When we made the switchover somewhere in the 1.3 series to have the orted's do processor binding, then stuff like: mpirun --mca mpi_paffinity_alone 1 hostname should have bound hostname to processor 0. But it didn't because of a subtle startup ordering issue: the MCA param registration for opal_paffinity_alone was in the paffinity base (vs. being in opal/runtime/opal_params.c), but it didn't actually get registered until after the global variable opal_paffinity_alone was checked to see if we wanted old-style affinity bindings. Oops. However, for MPI apps, even though the orted didn't do the binding, ompi_mpi_init() would notice that opal_paffinity_alone was set, yet the process didn't seem to be bound. So the MPI process would bind itself (this was done to support the running-without-orteds scenarios). Hence, MPI apps still obeyed mpi_paffinity_alone semantics. But note that the error described above caused the new mpirun switch --report-bindings to not work with mpi_paffinity_alone=1, meaning that the orted would not report the bindings when mpi_paffinity_alone was set to 1 (it ''did'' correctly report bindings if you used --bind-to-core or one of the other binding options). This commit separates out the paffinity base MCA param registration into a small function that can be called at the Right place during the startup sequence. This commit was SVN r22602.
118 строки
4.1 KiB
C
118 строки
4.1 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2006 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* Copyright (c) 2008-2010 Cisco Systems, Inc. All rights reserved.
|
|
* Copyright (c) 2009 Oak Ridge National Labs. All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "opal_config.h"

#include <stdio.h>
#include <time.h>
#ifdef HAVE_SIGNAL_H
#include <signal.h>
#endif

#include "opal/constants.h"
#include "opal/runtime/opal.h"
#include "opal/datatype/opal_datatype.h"
#include "opal/mca/base/mca_base_param.h"
#include "opal/threads/mutex.h"
#include "opal/mca/paffinity/base/base.h"
|
|
|
|
int opal_register_params(void)
|
|
{
|
|
int ret;
|
|
|
|
/*
|
|
* This string is going to be used in opal/util/stacktrace.c
|
|
*/
|
|
{
|
|
char *string = NULL;
|
|
int j;
|
|
int signals[] = {
|
|
#ifdef SIGABRT
|
|
SIGABRT,
|
|
#endif
|
|
#ifdef SIGBUS
|
|
SIGBUS,
|
|
#endif
|
|
#ifdef SIGFPE
|
|
SIGFPE,
|
|
#endif
|
|
#ifdef SIGSEGV
|
|
SIGSEGV,
|
|
#endif
|
|
-1
|
|
};
|
|
for (j = 0 ; signals[j] != -1 ; ++j) {
|
|
if (j == 0) {
|
|
asprintf(&string, "%d", signals[j]);
|
|
} else {
|
|
char *tmp;
|
|
asprintf(&tmp, "%s,%d", string, signals[j]);
|
|
free(string);
|
|
string = tmp;
|
|
}
|
|
}
|
|
|
|
mca_base_param_reg_string_name("opal", "signal",
|
|
"Comma-delimited list of integer signal numbers to Open MPI to attempt to intercept. Upon receipt of the intercepted signal, Open MPI will display a stack trace and abort. Open MPI will *not* replace signals if handlers are already installed by the time MPI_INIT is invoked. Optionally append \":complain\" to any signal number in the comma-delimited list to make Open MPI complain if it detects another signal handler (and therefore does not insert its own).",
|
|
false, false, string, NULL);
|
|
free(string);
|
|
}
|
|
|
|
{
|
|
int j;
|
|
|
|
mca_base_param_reg_int_name("opal", "profile",
|
|
"Set to non-zero to profile component selections",
|
|
false, false, (int)false, &j);
|
|
opal_profile = OPAL_INT_TO_BOOL(j);
|
|
|
|
mca_base_param_reg_string_name("opal", "profile_file",
|
|
"Name of the file containing the cluster configuration information",
|
|
false, false, NULL, &opal_profile_file);
|
|
}
|
|
|
|
#if OPAL_ENABLE_DEBUG
|
|
|
|
|
|
mca_base_param_reg_int_name("opal", "progress_debug",
|
|
"Set to non-zero to debug progress engine features",
|
|
false, false, 0, NULL);
|
|
|
|
{
|
|
int value;
|
|
mca_base_param_reg_int_name("opal", "debug_locks",
|
|
"Debug mutex usage within Open MPI. On a "
|
|
"non-threaded build, this enables integer counters and "
|
|
"warning messages when double-locks are detected.",
|
|
false, false, 0, &value);
|
|
if (value) opal_mutex_check_locks = true;
|
|
}
|
|
#endif
|
|
/* The ddt engine has a few parameters */
|
|
ret = opal_datatype_register_params();
|
|
if (OPAL_SUCCESS != ret) {
|
|
return ret;
|
|
}
|
|
|
|
/* Paffinity base also has some parameters */
|
|
return opal_paffinity_base_register_params();
|
|
}
|