264 строки
7.5 KiB
C
264 строки
7.5 KiB
C
|
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
||
|
/*
|
||
|
* Copyright (c) 2011 Mellanox Technologies. All rights reserved.
|
||
|
* Copyright (c) 2015 Los Alamos National Security, LLC. All rights
|
||
|
* reserved.
|
||
|
* $COPYRIGHT$
|
||
|
*
|
||
|
* Additional copyrights may follow
|
||
|
*
|
||
|
* $HEADER$
|
||
|
*/
|
||
|
#include "ompi_config.h"
|
||
|
#include <stdio.h>
|
||
|
|
||
|
#include <dlfcn.h>
|
||
|
#include <libgen.h>
|
||
|
|
||
|
#include "coll_hcoll.h"
|
||
|
#include "opal/mca/installdirs/installdirs.h"
|
||
|
#include "coll_hcoll_dtypes.h"
|
||
|
|
||
|
/*
|
||
|
* Public string showing the coll ompi_hcol component version number
|
||
|
*/
|
||
|
const char *mca_coll_hcoll_component_version_string =
|
||
|
"Open MPI HCOL collective MCA component version " OMPI_VERSION;
|
||
|
|
||
|
|
||
|
/* Component hooks defined later in this file and referenced by the
 * component descriptor below. */
static int hcoll_register(void);
static int hcoll_open(void);
static int hcoll_close(void);

/* Output stream id of the component; -1 until hcoll_open() assigns the
 * value returned by opal_output_open(). */
int mca_coll_hcoll_output = -1;
|
||
|
mca_coll_hcoll_component_t mca_coll_hcoll_component = {
|
||
|
|
||
|
/* First, the mca_component_t struct containing meta information
|
||
|
about the component itfca */
|
||
|
{
|
||
|
.collm_version = {
|
||
|
MCA_COLL_BASE_VERSION_2_0_0,
|
||
|
|
||
|
/* Component name and version */
|
||
|
.mca_component_name = "hcoll",
|
||
|
MCA_BASE_MAKE_VERSION(component, OMPI_MAJOR_VERSION, OMPI_MINOR_VERSION,
|
||
|
OMPI_RELEASE_VERSION),
|
||
|
|
||
|
/* Component open and close functions */
|
||
|
.mca_open_component = hcoll_open,
|
||
|
.mca_close_component = hcoll_close,
|
||
|
.mca_register_component_params = hcoll_register,
|
||
|
},
|
||
|
.collm_data = {
|
||
|
/* The component is not checkpoint ready */
|
||
|
MCA_BASE_METADATA_PARAM_NONE
|
||
|
},
|
||
|
|
||
|
/* Initialization / querying functions */
|
||
|
|
||
|
.collm_init_query = mca_coll_hcoll_init_query,
|
||
|
.collm_comm_query = mca_coll_hcoll_comm_query,
|
||
|
},
|
||
|
90, /* priority */
|
||
|
0, /* verbose level */
|
||
|
0, /* hcoll_enable */
|
||
|
NULL /*hcoll version */
|
||
|
};
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
int mca_coll_hcoll_get_lib(void)
|
||
|
{
|
||
|
|
||
|
memset(&mca_coll_hcoll_component.hcoll_ops,
|
||
|
0, sizeof(mca_coll_hcoll_component.hcoll_ops));
|
||
|
|
||
|
return OMPI_SUCCESS;
|
||
|
}
|
||
|
|
||
|
/*
 * Local flags: value constraints that reg_int() can enforce on an integer
 * parameter.  The first four are single bits and may be OR-ed together.
 */
enum {
    REGINT_NEG_ONE_OK = 1 << 0,   /* -1 is accepted without further checks */
    REGINT_GE_ZERO    = 1 << 1,   /* value must be >= 0 */
    REGINT_GE_ONE     = 1 << 2,   /* value must be >= 1 */
    REGINT_NONZERO    = 1 << 3,   /* value must not be 0 */

    REGINT_MAX        = 0x88
};
|
||
|
|
||
|
/*
 * Flags for string parameters.  Nothing in this file refers to them.
 */
enum {
    REGSTR_EMPTY_OK = 1 << 0,

    REGSTR_MAX      = 0x88
};
|
||
|
|
||
|
|
||
|
/*
|
||
|
* Utility routine for integer parameter registration
|
||
|
*/
|
||
|
static int reg_int(const char* param_name,
|
||
|
const char* deprecated_param_name,
|
||
|
const char* param_desc,
|
||
|
int default_value, int *storage, int flags)
|
||
|
{
|
||
|
int index;
|
||
|
|
||
|
*storage = default_value;
|
||
|
index = mca_base_component_var_register(
|
||
|
&mca_coll_hcoll_component.super.collm_version,
|
||
|
param_name, param_desc, MCA_BASE_VAR_TYPE_INT,
|
||
|
NULL, 0, 0,OPAL_INFO_LVL_9,
|
||
|
MCA_BASE_VAR_SCOPE_READONLY, storage);
|
||
|
if (NULL != deprecated_param_name) {
|
||
|
(void) mca_base_var_register_synonym(index,
|
||
|
"ompi", "coll", "hcoll", deprecated_param_name,
|
||
|
MCA_BASE_VAR_SYN_FLAG_DEPRECATED);
|
||
|
}
|
||
|
|
||
|
if (0 != (flags & REGINT_NEG_ONE_OK) && -1 == *storage) {
|
||
|
return OMPI_SUCCESS;
|
||
|
}
|
||
|
|
||
|
if ((0 != (flags & REGINT_GE_ZERO) && *storage < 0) ||
|
||
|
(0 != (flags & REGINT_GE_ONE) && *storage < 1) ||
|
||
|
(0 != (flags & REGINT_NONZERO) && 0 == *storage)) {
|
||
|
opal_output(0, "Bad parameter value for parameter \"%s\"",
|
||
|
param_name);
|
||
|
return OMPI_ERR_BAD_PARAM;
|
||
|
}
|
||
|
|
||
|
return OMPI_SUCCESS;
|
||
|
}
|
||
|
|
||
|
|
||
|
static int hcoll_register(void)
|
||
|
{
|
||
|
|
||
|
int ret, tmp;
|
||
|
|
||
|
ret = OMPI_SUCCESS;
|
||
|
|
||
|
#define CHECK(expr) do { \
|
||
|
tmp = (expr); \
|
||
|
if (OMPI_SUCCESS != tmp) ret = tmp; \
|
||
|
} while (0)
|
||
|
|
||
|
|
||
|
CHECK(reg_int("priority",NULL,
|
||
|
"Priority of the hcol coll component",
|
||
|
90,
|
||
|
&mca_coll_hcoll_component.hcoll_priority,
|
||
|
0));
|
||
|
|
||
|
CHECK(reg_int("verbose", NULL,
|
||
|
"Verbose level of the hcol coll component",
|
||
|
0,
|
||
|
&mca_coll_hcoll_component.hcoll_verbose,
|
||
|
0));
|
||
|
|
||
|
CHECK(reg_int("enable",NULL,
|
||
|
"[1|0|] Enable/Disable HCOL",
|
||
|
1,
|
||
|
&mca_coll_hcoll_component.hcoll_enable,
|
||
|
0));
|
||
|
|
||
|
CHECK(reg_int("np",NULL,
|
||
|
"Minimal number of processes in the communicator"
|
||
|
" for the corresponding hcoll context to be created (default: 32)",
|
||
|
2,
|
||
|
&mca_coll_hcoll_component.hcoll_np,
|
||
|
0));
|
||
|
|
||
|
CHECK(reg_int("datatype_fallback",NULL,
|
||
|
"[1|0|] Enable/Disable user defined dattypes fallback",
|
||
|
1,
|
||
|
&mca_coll_hcoll_component.hcoll_datatype_fallback,
|
||
|
0));
|
||
|
#if HCOLL_API >= HCOLL_VERSION(3,6)
|
||
|
CHECK(reg_int("dts",NULL,
|
||
|
"[1|0|] Enable/Disable derived types support",
|
||
|
1,
|
||
|
&mca_coll_hcoll_component.derived_types_support_enabled,
|
||
|
0));
|
||
|
#else
|
||
|
mca_coll_hcoll_component.derived_types_support_enabled = 0;
|
||
|
#endif
|
||
|
mca_coll_hcoll_component.compiletime_version = HCOLL_VERNO_STRING;
|
||
|
mca_base_component_var_register(&mca_coll_hcoll_component.super.collm_version,
|
||
|
MCA_COMPILETIME_VER,
|
||
|
"Version of the libhcoll library with which Open MPI was compiled",
|
||
|
MCA_BASE_VAR_TYPE_VERSION_STRING,
|
||
|
NULL, 0, 0,
|
||
|
OPAL_INFO_LVL_3,
|
||
|
MCA_BASE_VAR_SCOPE_READONLY,
|
||
|
&mca_coll_hcoll_component.compiletime_version);
|
||
|
mca_coll_hcoll_component.runtime_version = hcoll_get_version();
|
||
|
mca_base_component_var_register(&mca_coll_hcoll_component.super.collm_version,
|
||
|
MCA_RUNTIME_VER,
|
||
|
"Version of the libhcoll library with which Open MPI is running",
|
||
|
MCA_BASE_VAR_TYPE_VERSION_STRING,
|
||
|
NULL, 0, 0,
|
||
|
OPAL_INFO_LVL_3,
|
||
|
MCA_BASE_VAR_SCOPE_READONLY,
|
||
|
&mca_coll_hcoll_component.runtime_version);
|
||
|
|
||
|
return ret;
|
||
|
}
|
||
|
|
||
|
static int hcoll_open(void)
|
||
|
{
|
||
|
mca_coll_hcoll_component_t *cm;
|
||
|
cm = &mca_coll_hcoll_component;
|
||
|
|
||
|
mca_coll_hcoll_output = opal_output_open(NULL);
|
||
|
opal_output_set_verbosity(mca_coll_hcoll_output, cm->hcoll_verbose);
|
||
|
|
||
|
hcoll_rte_fns_setup();
|
||
|
|
||
|
cm->libhcoll_initialized = false;
|
||
|
|
||
|
/* Register memory hooks */
|
||
|
if ((OPAL_MEMORY_FREE_SUPPORT | OPAL_MEMORY_MUNMAP_SUPPORT) ==
|
||
|
((OPAL_MEMORY_FREE_SUPPORT | OPAL_MEMORY_MUNMAP_SUPPORT) &
|
||
|
opal_mem_hooks_support_level()))
|
||
|
{
|
||
|
setenv("MXM_HCOLL_MEM_ON_DEMAND_MAP", "y", 0);
|
||
|
HCOL_VERBOSE(1, "Enabling on-demand memory mapping");
|
||
|
cm->using_mem_hooks = 1;
|
||
|
} else {
|
||
|
HCOL_VERBOSE(1, "Disabling on-demand memory mapping");
|
||
|
cm->using_mem_hooks = 0;
|
||
|
}
|
||
|
|
||
|
return OMPI_SUCCESS;
|
||
|
}
|
||
|
|
||
|
static int hcoll_close(void)
|
||
|
{
|
||
|
int rc;
|
||
|
mca_coll_hcoll_component_t *cm;
|
||
|
cm = &mca_coll_hcoll_component;
|
||
|
|
||
|
if (false == cm->libhcoll_initialized) {
|
||
|
return OMPI_SUCCESS;
|
||
|
}
|
||
|
|
||
|
if (cm->using_mem_hooks) {
|
||
|
opal_mem_hooks_unregister_release(mca_coll_hcoll_mem_release_cb);
|
||
|
}
|
||
|
|
||
|
#if HCOLL_API >= HCOLL_VERSION(3,2)
|
||
|
hcoll_free_init_opts(cm->init_opts);
|
||
|
#endif
|
||
|
|
||
|
HCOL_VERBOSE(5,"HCOLL FINALIZE");
|
||
|
rc = hcoll_finalize();
|
||
|
OBJ_DESTRUCT(&cm->dtypes);
|
||
|
opal_progress_unregister(mca_coll_hcoll_progress);
|
||
|
if (HCOLL_SUCCESS != rc){
|
||
|
HCOL_VERBOSE(1,"Hcol library finalize failed");
|
||
|
return OMPI_ERROR;
|
||
|
}
|
||
|
return OMPI_SUCCESS;
|
||
|
}
|