OSHMEM: fix error message when aborting on OOM
Fixed by Roman, reviewed by Miked.
cmr=v1.8.2:reviewer=ompi-rm1.8
This commit was SVN r31752.
Этот коммит содержится в:
родитель
644aa6f737
Коммит
95e637f5ba
@ -7,7 +7,7 @@
|
|||||||
# $HEADER$
|
# $HEADER$
|
||||||
#
|
#
|
||||||
|
|
||||||
dist_oshmemdata_DATA += base/help-shmem-mca.txt
|
dist_oshmemdata_DATA += base/help-oshmem-memheap.txt
|
||||||
|
|
||||||
headers += \
|
headers += \
|
||||||
base/base.h
|
base/base.h
|
||||||
|
@ -150,7 +150,7 @@ int mca_memheap_base_select()
|
|||||||
|
|
||||||
/* Verify that some module was initialized */
|
/* Verify that some module was initialized */
|
||||||
if (NULL == mca_memheap_base_module_initialized) {
|
if (NULL == mca_memheap_base_module_initialized) {
|
||||||
opal_show_help("help-shmem-mca.txt",
|
opal_show_help("help-oshmem-memheap.txt",
|
||||||
"find-available:none-found",
|
"find-available:none-found",
|
||||||
true,
|
true,
|
||||||
"memheap");
|
"memheap");
|
||||||
|
@ -10,7 +10,7 @@
|
|||||||
#
|
#
|
||||||
|
|
||||||
dist_oshmemdata_DATA = \
|
dist_oshmemdata_DATA = \
|
||||||
help-shmem-spml-ikrit.txt
|
help-oshmem-spml-ikrit.txt
|
||||||
|
|
||||||
AM_CPPFLAGS = $(spml_ikrit_CPPFLAGS)
|
AM_CPPFLAGS = $(spml_ikrit_CPPFLAGS)
|
||||||
|
|
||||||
|
@ -413,7 +413,7 @@ int mca_spml_ikrit_add_procs(oshmem_proc_t** procs, size_t nprocs)
|
|||||||
#else
|
#else
|
||||||
err = mxm_ep_get_address(mca_spml_ikrit.mxm_ep, &my_ep_info.addr.ep_addr, &mxm_addr_len);
|
err = mxm_ep_get_address(mca_spml_ikrit.mxm_ep, &my_ep_info.addr.ep_addr, &mxm_addr_len);
|
||||||
if (MXM_OK != err) {
|
if (MXM_OK != err) {
|
||||||
orte_show_help("help-shmem-spml-ikrit.txt", "unable to get endpoint address", true,
|
orte_show_help("help-oshmem-spml-ikrit.txt", "unable to get endpoint address", true,
|
||||||
mxm_error_string(err));
|
mxm_error_string(err));
|
||||||
return OSHMEM_ERROR;
|
return OSHMEM_ERROR;
|
||||||
}
|
}
|
||||||
|
@ -74,7 +74,7 @@ static int check_mxm_tls(char *var)
|
|||||||
"%s=%s",
|
"%s=%s",
|
||||||
var, getenv(var)
|
var, getenv(var)
|
||||||
)) {
|
)) {
|
||||||
orte_show_help("help-shmem-spml-ikrit.txt", "mxm tls", true,
|
orte_show_help("help-oshmem-spml-ikrit.txt", "mxm tls", true,
|
||||||
str);
|
str);
|
||||||
free(str);
|
free(str);
|
||||||
}
|
}
|
||||||
@ -190,7 +190,7 @@ int spml_ikrit_progress(void)
|
|||||||
|
|
||||||
err = mxm_progress(mca_spml_ikrit.mxm_context);
|
err = mxm_progress(mca_spml_ikrit.mxm_context);
|
||||||
if ((MXM_OK != err) && (MXM_ERR_NO_PROGRESS != err)) {
|
if ((MXM_OK != err) && (MXM_ERR_NO_PROGRESS != err)) {
|
||||||
orte_show_help("help-shmem-spml-ikrit.txt",
|
orte_show_help("help-oshmem-spml-ikrit.txt",
|
||||||
"errors during mxm_progress",
|
"errors during mxm_progress",
|
||||||
true,
|
true,
|
||||||
mxm_error_string(err));
|
mxm_error_string(err));
|
||||||
@ -240,7 +240,7 @@ static int mca_spml_ikrit_component_open(void)
|
|||||||
SPML_VERBOSE(1,
|
SPML_VERBOSE(1,
|
||||||
"No supported device found, disqualifying spml/ikrit");
|
"No supported device found, disqualifying spml/ikrit");
|
||||||
} else {
|
} else {
|
||||||
orte_show_help("help-shmem-spml-ikrit.txt",
|
orte_show_help("help-oshmem-spml-ikrit.txt",
|
||||||
"mxm init",
|
"mxm init",
|
||||||
true,
|
true,
|
||||||
mxm_error_string(err));
|
mxm_error_string(err));
|
||||||
@ -252,7 +252,7 @@ static int mca_spml_ikrit_component_open(void)
|
|||||||
MXM_SHMEM_MQ_ID,
|
MXM_SHMEM_MQ_ID,
|
||||||
&mca_spml_ikrit.mxm_mq);
|
&mca_spml_ikrit.mxm_mq);
|
||||||
if (MXM_OK != err) {
|
if (MXM_OK != err) {
|
||||||
orte_show_help("help-shmem-spml-ikrit.txt",
|
orte_show_help("help-oshmem-spml-ikrit.txt",
|
||||||
"mxm mq create",
|
"mxm mq create",
|
||||||
true,
|
true,
|
||||||
mxm_error_string(err));
|
mxm_error_string(err));
|
||||||
@ -295,7 +295,7 @@ static int spml_ikrit_mxm_init(void)
|
|||||||
mca_spml_ikrit.mxm_ep_opts,
|
mca_spml_ikrit.mxm_ep_opts,
|
||||||
&mca_spml_ikrit.mxm_ep);
|
&mca_spml_ikrit.mxm_ep);
|
||||||
if (MXM_OK != err) {
|
if (MXM_OK != err) {
|
||||||
orte_show_help("help-shmem-spml-ikrit.txt",
|
orte_show_help("help-oshmem-spml-ikrit.txt",
|
||||||
"unable to create endpoint",
|
"unable to create endpoint",
|
||||||
true,
|
true,
|
||||||
mxm_error_string(err));
|
mxm_error_string(err));
|
||||||
|
@ -10,7 +10,7 @@
|
|||||||
#
|
#
|
||||||
|
|
||||||
dist_oshmemdata_DATA = \
|
dist_oshmemdata_DATA = \
|
||||||
help-shmem-spml-yoda.txt
|
help-oshmem-spml-yoda.txt
|
||||||
|
|
||||||
EXTRA_DIST = post_configure.sh
|
EXTRA_DIST = post_configure.sh
|
||||||
|
|
||||||
|
@ -19,3 +19,11 @@ name and its corresponding minimum value is shown below.
|
|||||||
BTL eager limit value: %d (set via btl_%s_eager_limit)
|
BTL eager limit value: %d (set via btl_%s_eager_limit)
|
||||||
BTL eager limit minimum: %d
|
BTL eager limit minimum: %d
|
||||||
MCA parameter name: btl_%s_eager_limit
|
MCA parameter name: btl_%s_eager_limit
|
||||||
|
|
||||||
|
[internal_oom_error]
|
||||||
|
'%s' operation failed. Unable to allocate buffer, need %d bytes.
|
||||||
|
Try increasing 'spml_yoda_bml_alloc_threshold' value or setting it to '0' to
|
||||||
|
force waiting for all puts completion.
|
||||||
|
|
||||||
|
spml_yoda_bml_alloc_threshold: %d
|
||||||
|
|
@ -10,6 +10,7 @@
|
|||||||
|
|
||||||
#include "oshmem_config.h"
|
#include "oshmem_config.h"
|
||||||
|
|
||||||
|
#include "opal/util/show_help.h"
|
||||||
#include "orte/include/orte/types.h"
|
#include "orte/include/orte/types.h"
|
||||||
#include "orte/runtime/orte_globals.h"
|
#include "orte/runtime/orte_globals.h"
|
||||||
|
|
||||||
@ -823,9 +824,13 @@ static inline int mca_spml_yoda_put_internal(void *dst_addr,
|
|||||||
put_via_send);
|
put_via_send);
|
||||||
|
|
||||||
if (OPAL_UNLIKELY(!des || !des->des_src )) {
|
if (OPAL_UNLIKELY(!des || !des->des_src )) {
|
||||||
SPML_ERROR("shmem OOM error need %d bytes", ncopied);
|
|
||||||
SPML_ERROR("src=%p nfrags = %d frag_size=%d",
|
SPML_ERROR("src=%p nfrags = %d frag_size=%d",
|
||||||
src_addr, nfrags, frag_size);
|
src_addr, nfrags, frag_size);
|
||||||
|
SPML_ERROR("shmem OOM error need %d bytes", ncopied);
|
||||||
|
opal_show_help("help-oshmem-spml-yoda.txt",
|
||||||
|
"internal_oom_error",
|
||||||
|
true,
|
||||||
|
"Put", ncopied, mca_spml_yoda.bml_alloc_threshold);
|
||||||
oshmem_shmem_abort(-1);
|
oshmem_shmem_abort(-1);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user