2015-04-09 20:51:36 +03:00
|
|
|
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
2005-08-22 07:05:39 +04:00
|
|
|
/*
|
2005-11-05 22:57:48 +03:00
|
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
|
|
* University Research and Technology
|
|
|
|
* Corporation. All rights reserved.
|
|
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
|
|
* of Tennessee Research Foundation. All rights
|
|
|
|
* reserved.
|
2015-06-24 06:59:57 +03:00
|
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
2005-08-22 07:05:39 +04:00
|
|
|
* University of Stuttgart. All rights reserved.
|
|
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
|
|
* All rights reserved.
|
2015-04-09 20:51:36 +03:00
|
|
|
* Copyright (c) 2007-2015 Los Alamos National Security, LLC. All rights
|
|
|
|
* reserved.
|
2015-04-15 09:14:57 +03:00
|
|
|
* Copyright (c) 2015 Research Organization for Information Science
|
|
|
|
* and Technology (RIST). All rights reserved.
|
2017-06-07 11:16:45 +03:00
|
|
|
* Copyright (c) 2017 FUJITSU LIMITED. All rights reserved.
|
2017-06-28 22:58:57 +03:00
|
|
|
* Copyright (c) 2017 IBM Corporation. All rights reserved.
|
2018-10-07 02:58:16 +03:00
|
|
|
* Copyright (c) 2018 Amazon.com, Inc. or its affiliates. All Rights reserved.
|
2005-08-22 07:05:39 +04:00
|
|
|
* $COPYRIGHT$
|
2015-06-24 06:59:57 +03:00
|
|
|
*
|
2005-08-22 07:05:39 +04:00
|
|
|
* Additional copyrights may follow
|
2015-06-24 06:59:57 +03:00
|
|
|
*
|
2005-08-22 07:05:39 +04:00
|
|
|
* $HEADER$
|
|
|
|
*/
|
|
|
|
|
2006-02-12 04:33:29 +03:00
|
|
|
#include "opal_config.h"
|
2005-08-22 07:05:39 +04:00
|
|
|
|
|
|
|
#include <string.h>
|
|
|
|
#include <errno.h>
|
|
|
|
#include <stdio.h>
|
2005-08-30 14:41:25 +04:00
|
|
|
#include <stdlib.h>
|
2017-06-07 11:16:45 +03:00
|
|
|
#include <unistd.h>
|
2005-08-22 07:05:39 +04:00
|
|
|
|
|
|
|
#include "opal/util/error.h"
|
2018-09-27 20:31:12 +03:00
|
|
|
#include "opal/util/string_copy.h"
|
2006-02-12 04:33:29 +03:00
|
|
|
#include "opal/constants.h"
|
2017-06-07 11:16:45 +03:00
|
|
|
#include "opal/util/proc.h"
|
2018-10-07 02:58:16 +03:00
|
|
|
#include "opal/util/printf.h"
|
2017-06-07 11:16:45 +03:00
|
|
|
#include "opal/runtime/opal_params.h"
|
2005-08-22 07:05:39 +04:00
|
|
|
|
|
|
|
#define MAX_CONVERTERS 5
|
2005-08-30 03:36:53 +04:00
|
|
|
#define MAX_CONVERTER_PROJECT_LEN 10
|
|
|
|
|
|
|
|
struct converter_info_t {
|
|
|
|
int init;
|
|
|
|
char project[MAX_CONVERTER_PROJECT_LEN];
|
|
|
|
int err_base;
|
|
|
|
int err_max;
|
|
|
|
opal_err2str_fn_t converter;
|
|
|
|
};
|
|
|
|
typedef struct converter_info_t converter_info_t;
|
|
|
|
|
2005-08-22 07:05:39 +04:00
|
|
|
/* all default to NULL */
|
2017-06-28 22:58:57 +03:00
|
|
|
static converter_info_t converters[MAX_CONVERTERS] = {{0}};
|
2005-08-22 07:05:39 +04:00
|
|
|
|
2011-02-13 19:09:17 +03:00
|
|
|
static int
|
|
|
|
opal_strerror_int(int errnum, const char **str)
|
2005-08-22 07:05:39 +04:00
|
|
|
{
|
2011-02-24 06:02:48 +03:00
|
|
|
int i, ret = OPAL_SUCCESS;
|
2011-02-13 19:09:17 +03:00
|
|
|
*str = NULL;
|
2005-08-22 07:05:39 +04:00
|
|
|
|
|
|
|
for (i = 0 ; i < MAX_CONVERTERS ; ++i) {
|
2011-08-08 08:10:40 +04:00
|
|
|
if (0 != converters[i].init &&
|
|
|
|
errnum < converters[i].err_base &&
|
|
|
|
converters[i].err_max < errnum) {
|
2011-02-13 19:09:17 +03:00
|
|
|
ret = converters[i].converter(errnum, str);
|
2011-08-08 08:10:40 +04:00
|
|
|
break;
|
2005-08-22 07:05:39 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2005-08-30 03:36:53 +04:00
|
|
|
/* caller must free string */
|
2011-02-13 19:09:17 +03:00
|
|
|
static int
|
2011-02-14 22:29:09 +03:00
|
|
|
opal_strerror_unknown(int errnum, char **str)
|
2005-08-30 03:36:53 +04:00
|
|
|
{
|
|
|
|
int i;
|
2011-02-13 19:09:17 +03:00
|
|
|
*str = NULL;
|
2005-08-30 03:36:53 +04:00
|
|
|
|
|
|
|
for (i = 0 ; i < MAX_CONVERTERS ; ++i) {
|
|
|
|
if (0 != converters[i].init) {
|
2015-06-24 06:59:57 +03:00
|
|
|
if (errnum < converters[i].err_base &&
|
2005-08-30 03:36:53 +04:00
|
|
|
errnum > converters[i].err_max) {
|
2018-10-07 02:58:16 +03:00
|
|
|
opal_asprintf(str, "Unknown error: %d (%s error %d)",
|
2015-06-24 06:59:57 +03:00
|
|
|
errnum, converters[i].project,
|
2005-08-30 03:36:53 +04:00
|
|
|
errnum - converters[i].err_base);
|
2011-02-13 19:09:17 +03:00
|
|
|
return OPAL_SUCCESS;
|
2005-08-30 03:36:53 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-10-07 02:58:16 +03:00
|
|
|
opal_asprintf(str, "Unknown error: %d", errnum);
|
2005-08-30 03:36:53 +04:00
|
|
|
|
2011-02-13 19:09:17 +03:00
|
|
|
return OPAL_SUCCESS;
|
2005-08-30 03:36:53 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2005-08-22 07:05:39 +04:00
|
|
|
void
|
|
|
|
opal_perror(int errnum, const char *msg)
|
|
|
|
{
|
2011-02-13 19:09:17 +03:00
|
|
|
int ret;
|
|
|
|
const char* errmsg;
|
|
|
|
ret = opal_strerror_int(errnum, &errmsg);
|
2005-08-22 07:05:39 +04:00
|
|
|
|
2012-04-06 18:23:13 +04:00
|
|
|
if (NULL != msg && errnum != OPAL_ERR_IN_ERRNO) {
|
2005-08-22 07:05:39 +04:00
|
|
|
fprintf(stderr, "%s: ", msg);
|
|
|
|
}
|
|
|
|
|
2011-02-13 19:09:17 +03:00
|
|
|
if (OPAL_SUCCESS != ret) {
|
2012-04-06 18:23:13 +04:00
|
|
|
if (errnum == OPAL_ERR_IN_ERRNO) {
|
2005-08-22 07:05:39 +04:00
|
|
|
perror(msg);
|
|
|
|
} else {
|
2011-02-14 22:29:09 +03:00
|
|
|
char *ue_msg;
|
2011-02-13 19:09:17 +03:00
|
|
|
ret = opal_strerror_unknown(errnum, &ue_msg);
|
2005-08-30 03:36:53 +04:00
|
|
|
fprintf(stderr, "%s\n", ue_msg);
|
|
|
|
free(ue_msg);
|
2005-08-22 07:05:39 +04:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
fprintf(stderr, "%s\n", errmsg);
|
|
|
|
}
|
|
|
|
|
|
|
|
fflush(stderr);
|
|
|
|
}
|
|
|
|
|
2005-08-30 03:36:53 +04:00
|
|
|
/* big enough to hold long version */
|
|
|
|
#define UNKNOWN_RETBUF_LEN 50
|
|
|
|
static char unknown_retbuf[UNKNOWN_RETBUF_LEN];
|
2005-08-22 07:05:39 +04:00
|
|
|
|
|
|
|
const char *
|
|
|
|
opal_strerror(int errnum)
|
|
|
|
{
|
2011-02-13 19:09:17 +03:00
|
|
|
int ret;
|
2007-04-25 05:55:40 +04:00
|
|
|
const char* errmsg;
|
|
|
|
|
2012-04-06 18:23:13 +04:00
|
|
|
if (errnum == OPAL_ERR_IN_ERRNO) {
|
2007-04-25 05:55:40 +04:00
|
|
|
return strerror(errno);
|
|
|
|
}
|
|
|
|
|
2011-02-13 19:09:17 +03:00
|
|
|
ret = opal_strerror_int(errnum, &errmsg);
|
2005-08-22 07:05:39 +04:00
|
|
|
|
2011-02-13 19:09:17 +03:00
|
|
|
if (OPAL_SUCCESS != ret) {
|
2011-02-14 22:29:09 +03:00
|
|
|
char *ue_msg;
|
2011-02-13 19:09:17 +03:00
|
|
|
ret = opal_strerror_unknown(errnum, &ue_msg);
|
2007-04-25 05:55:40 +04:00
|
|
|
snprintf(unknown_retbuf, UNKNOWN_RETBUF_LEN, "%s", ue_msg);
|
|
|
|
free(ue_msg);
|
|
|
|
errno = EINVAL;
|
|
|
|
return (const char*) unknown_retbuf;
|
2005-08-22 07:05:39 +04:00
|
|
|
} else {
|
|
|
|
return errmsg;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
|
|
|
opal_strerror_r(int errnum, char *strerrbuf, size_t buflen)
|
|
|
|
{
|
2011-02-13 19:09:17 +03:00
|
|
|
const char* errmsg;
|
|
|
|
int ret, len;
|
2005-08-22 07:05:39 +04:00
|
|
|
|
2011-02-13 19:09:17 +03:00
|
|
|
ret = opal_strerror_int(errnum, &errmsg);
|
|
|
|
if (OPAL_SUCCESS != ret) {
|
2012-04-06 18:23:13 +04:00
|
|
|
if (errnum == OPAL_ERR_IN_ERRNO) {
|
2005-08-24 17:44:57 +04:00
|
|
|
char *tmp = strerror(errno);
|
2018-09-27 20:31:12 +03:00
|
|
|
opal_string_copy(strerrbuf, tmp, buflen);
|
2005-08-24 17:44:57 +04:00
|
|
|
return OPAL_SUCCESS;
|
2005-08-22 07:05:39 +04:00
|
|
|
} else {
|
2011-02-14 22:29:09 +03:00
|
|
|
char *ue_msg;
|
2011-02-13 19:09:17 +03:00
|
|
|
ret = opal_strerror_unknown(errnum, &ue_msg);
|
|
|
|
len = snprintf(strerrbuf, buflen, "%s", ue_msg);
|
2005-08-30 03:36:53 +04:00
|
|
|
free(ue_msg);
|
2011-02-13 19:09:17 +03:00
|
|
|
if (len > (int) buflen) {
|
2005-08-22 07:05:39 +04:00
|
|
|
errno = ERANGE;
|
|
|
|
return OPAL_ERR_OUT_OF_RESOURCE;
|
|
|
|
} else {
|
2005-08-30 03:36:53 +04:00
|
|
|
errno = EINVAL;
|
2005-08-22 07:05:39 +04:00
|
|
|
return OPAL_SUCCESS;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
2011-02-13 19:09:17 +03:00
|
|
|
len = snprintf(strerrbuf, buflen, "%s", errmsg);
|
|
|
|
if (len > (int) buflen) {
|
2005-08-22 07:05:39 +04:00
|
|
|
errno = ERANGE;
|
|
|
|
return OPAL_ERR_OUT_OF_RESOURCE;
|
|
|
|
} else {
|
|
|
|
return OPAL_SUCCESS;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2005-08-30 03:36:53 +04:00
|
|
|
opal_error_register(const char *project, int err_base, int err_max,
|
|
|
|
opal_err2str_fn_t converter)
|
2005-08-22 07:05:39 +04:00
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0 ; i < MAX_CONVERTERS ; ++i) {
|
2005-08-30 03:36:53 +04:00
|
|
|
if (0 == converters[i].init) {
|
|
|
|
converters[i].init = 1;
|
2018-09-27 20:31:12 +03:00
|
|
|
opal_string_copy(converters[i].project, project, MAX_CONVERTER_PROJECT_LEN);
|
2008-08-06 18:53:43 +04:00
|
|
|
converters[i].project[MAX_CONVERTER_PROJECT_LEN-1] = '\0';
|
2005-08-30 03:36:53 +04:00
|
|
|
converters[i].err_base = err_base;
|
|
|
|
converters[i].err_max = err_max;
|
|
|
|
converters[i].converter = converter;
|
2005-08-22 07:05:39 +04:00
|
|
|
return OPAL_SUCCESS;
|
2015-04-09 20:51:36 +03:00
|
|
|
} else if (converters[i].err_base == err_base &&
|
|
|
|
converters[i].err_max == err_max &&
|
|
|
|
!strcmp (project, converters[i].project)) {
|
|
|
|
converters[i].converter = converter;
|
|
|
|
return OPAL_SUCCESS;
|
2005-08-22 07:05:39 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return OPAL_ERR_OUT_OF_RESOURCE;
|
|
|
|
}
|
2017-06-07 11:16:45 +03:00
|
|
|
|
|
|
|
|
|
|
|
void
|
|
|
|
opal_delay_abort(void)
|
|
|
|
{
|
|
|
|
// Though snprintf and strlen are not guaranteed to be async-signal-safe
|
|
|
|
// in POSIX, it is async-signal-safe on many implementations probably.
|
|
|
|
|
|
|
|
if (0 != opal_abort_delay) {
|
|
|
|
int delay = opal_abort_delay;
|
|
|
|
pid_t pid = getpid();
|
|
|
|
char msg[100 + OPAL_MAXHOSTNAMELEN];
|
|
|
|
|
|
|
|
if (delay < 0) {
|
|
|
|
snprintf(msg, sizeof(msg),
|
|
|
|
"[%s:%05d] Looping forever "
|
|
|
|
"(MCA parameter opal_abort_delay is < 0)\n",
|
|
|
|
opal_process_info.nodename, (int) pid);
|
2017-06-19 14:08:34 +03:00
|
|
|
write(STDERR_FILENO, msg, strlen(msg));
|
2017-06-07 11:16:45 +03:00
|
|
|
while (1) {
|
|
|
|
sleep(5);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
snprintf(msg, sizeof(msg),
|
|
|
|
"[%s:%05d] Delaying for %d seconds before aborting\n",
|
|
|
|
opal_process_info.nodename, (int) pid, delay);
|
2017-06-19 14:08:34 +03:00
|
|
|
write(STDERR_FILENO, msg, strlen(msg));
|
2017-06-07 11:16:45 +03:00
|
|
|
do {
|
|
|
|
sleep(1);
|
|
|
|
} while (--delay > 0);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|