1
1
openmpi/orte/mca/ras/base/ras_base_frame.c
Howard Pritchard d08be74573 SLURM: launch all processes via slurmd
It turns out that the approach of having the HNP do the
fork/exec of MPI ranks on the head node in a SLURM environment
introduces problems when users/sysadmins want to use the SLURM
scancel tool or sbatch --signal option to signal a job.

This commit disables use of the HNP fork/exec procedure when
a job is launched into a SLURM controlled allocation.

update NEWS with a blurb about new ras framework mca parameter.

related to #3998

Signed-off-by: Howard Pritchard <hppritcha@gmail.com>
2017-08-02 14:56:55 -06:00

118 строки
4.2 KiB
C

/*
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
* University Research and Technology
* Corporation. All rights reserved.
* Copyright (c) 2004-2005 The University of Tennessee and The University
* of Tennessee Research Foundation. All rights
* reserved.
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2005 The Regents of the University of California.
* All rights reserved.
* Copyright (c) 2011-2013 Los Alamos National Security, LLC. All rights
* reserved.
* Copyright (c) 2015 Research Organization for Information Science
* and Technology (RIST). All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "orte_config.h"
#include "orte/constants.h"
#include "orte/mca/mca.h"
#include "opal/mca/base/base.h"
#include "opal/mca/event/event.h"
#include "orte/mca/ras/base/ras_private.h"
#include "orte/mca/ras/base/base.h"
/* NOTE: the RAS does not require a proxy as only the
* HNP can open the framework in orte_init - non-HNP
* procs are not allowed to allocate resources
*/
/*
* The following file was created by configure. It contains extern
* statements and the definition of an array of pointers to each
* component's public mca_base_component_t struct.
*/
#include "orte/mca/ras/base/static-components.h"
/*
* Global variables
*
* orte_ras_base holds the framework-wide RAS state. It starts out
* zero-initialized; ras_register() fills in the multiplier and
* launch_orted_on_hn defaults, and orte_ras_base_open() resets
* active_module, allocation_read and total_slots_alloc.
*/
orte_ras_base_t orte_ras_base = {0};
/*
 * Register the RAS base framework variables.
 *
 * Two variables are set to their defaults and then registered:
 *   - multiplier:         defaults to 1
 *   - launch_orted_on_hn: defaults to true when built with
 *                         SLURM_CRAY_ENV, false otherwise
 *
 * The flags argument is not used. Always returns ORTE_SUCCESS; the
 * results of the individual registrations are not inspected.
 */
static int ras_register(mca_base_register_flag_t flags)
{
    /*
     * If we are in a Cray-SLURM environment, then we cannot launch
     * procs local to the HNP. The MPI processes launched on the head
     * node (where ORTE_PROC_IS_HNP evaluates to true) would be started
     * by a daemon (mpirun) which is not a child of a slurmd daemon, so
     * any RDMA credentials obtained via the odls/alps local launcher
     * would be incorrect. In that environment we therefore default to
     * launching a daemon on the same node as mpirun, so that it is used
     * to fork local procs instead of mpirun and they get the proper
     * credential.
     */
#if SLURM_CRAY_ENV
    const bool orted_on_hn_default = true;
#else
    const bool orted_on_hn_default = false;
#endif

    (void) flags;

    /* Establish the defaults before the variables are registered. */
    orte_ras_base.multiplier = 1;
    orte_ras_base.launch_orted_on_hn = orted_on_hn_default;

    (void) mca_base_var_register("orte", "ras", "base", "multiplier",
                                 "Simulate a larger cluster by launching N daemons/node",
                                 MCA_BASE_VAR_TYPE_INT,
                                 NULL, 0, 0,
                                 OPAL_INFO_LVL_9,
                                 MCA_BASE_VAR_SCOPE_READONLY,
                                 &orte_ras_base.multiplier);

    (void) mca_base_var_register("orte", "ras", "base", "launch_orted_on_hn",
                                 "Launch an orte daemon on the head node",
                                 MCA_BASE_VAR_TYPE_BOOL,
                                 NULL, 0, 0,
                                 OPAL_INFO_LVL_9,
                                 MCA_BASE_VAR_SCOPE_READONLY,
                                 &orte_ras_base.launch_orted_on_hn);

    return ORTE_SUCCESS;
}
/*
 * Close the RAS framework.
 *
 * If a module is currently active, its finalize() hook is invoked
 * first; the framework's components are then closed. Returns whatever
 * mca_base_framework_components_close() reports.
 */
static int orte_ras_base_close(void)
{
    int status;

    /* Give the selected module, if there is one, a chance to clean up */
    if (orte_ras_base.active_module != NULL) {
        orte_ras_base.active_module->finalize();
    }

    status = mca_base_framework_components_close(&orte_ras_base_framework, NULL);
    return status;
}
/**
 * Open the RAS framework: reset the framework state to its defaults
 * and then find and open either all MCA components, or the one that
 * was specifically requested via an MCA parameter.
 *
 * @param flags  open flags, passed through unchanged to
 *               mca_base_framework_components_open()
 * @return       the result of mca_base_framework_components_open()
 */
static int orte_ras_base_open(mca_base_open_flag_t flags)
{
    int status;

    /* Start from a clean slate: no module selected, no allocation read */
    orte_ras_base.total_slots_alloc = 0;
    orte_ras_base.allocation_read = false;
    orte_ras_base.active_module = NULL;

    /* Open up all available components */
    status = mca_base_framework_components_open(&orte_ras_base_framework, flags);
    return status;
}
/*
 * Declare the "ras" framework of the "orte" project, passing in this
 * file's register/open/close functions and the configure-generated
 * list of static components.
 * NOTE(review): the trailing 0 is presumably the framework flags
 * argument -- confirm against the MCA_BASE_FRAMEWORK_DECLARE definition.
 */
MCA_BASE_FRAMEWORK_DECLARE(orte, ras, "ORTE Resource Allocation Subsystem",
ras_register, orte_ras_base_open, orte_ras_base_close,
mca_ras_base_static_components, 0);