/* * Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana * University Research and Technology * Corporation. All rights reserved. * Copyright (c) 2004-2011 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ * */ #include "orte_config.h" #include "orte/constants.h" #include #include #ifdef HAVE_FCNTL_H #include #endif #ifdef HAVE_UNISTD_H #include #endif #include "opal/util/opal_sos.h" #include "orte/util/show_help.h" #include "orte/mca/plm/base/base.h" #include "orte/mca/plm/plm.h" #include "orte/mca/errmgr/errmgr.h" #include "orte/util/proc_info.h" #include "orte/runtime/orte_cr.h" #include "orte/mca/ess/ess.h" #include "orte/mca/ess/base/base.h" #include "orte/mca/ess/tool/ess_tool.h" static int rte_init(void); static void rte_abort(int status, bool report) __opal_attribute_noreturn__; static orte_vpid_t proc_get_daemon(orte_process_name_t *proc); static int query_sys_info(char *node, char **keys, opal_list_t *values); orte_ess_base_module_t orte_ess_tool_module = { rte_init, orte_ess_base_tool_finalize, rte_abort, NULL, /* don't need a local procs fn */ proc_get_daemon, NULL, /* don't need a proc_get_hostname fn */ NULL, /* don't need a proc_get_local_rank fn */ NULL, /* don't need a proc_get_node_rank fn */ orte_ess_base_proc_get_epoch, /* proc_get_epoch */ NULL, /* don't need to update_pidmap */ NULL, /* don't need to update_nidmap */ query_sys_info, NULL /* ft_event */ }; static int rte_init(void) { int ret; char *error = NULL; /* run the prolog */ if (ORTE_SUCCESS != (ret = orte_ess_base_std_prolog())) { error = "orte_ess_base_std_prolog"; goto error; } /* If we are a tool with no name, then responsibility for * defining the name falls to the PLM component for our * respective environment - hence, we have to open the PLM * first and select that component. Note that ONLY the * HNP ever uses a PLM component, so we ONLY use the PLM * here to set our name and then close it * * NOTE: Tools with names - i.e., tools consisting of a * distributed set of processes - will select and use * the appropriate enviro-specific module and -not- this one! */ if (ORTE_SUCCESS != (ret = orte_plm_base_open())) { ORTE_ERROR_LOG(ret); error = "orte_plm_base_open"; goto error; } if (ORTE_SUCCESS != (ret = orte_plm_base_select())) { ORTE_ERROR_LOG(ret); error = "orte_plm_base_select"; goto error; } if (ORTE_SUCCESS != (ret = orte_plm.set_hnp_name())) { ORTE_ERROR_LOG(ret); error = "orte_plm_set_hnp_name"; goto error; } /* close the plm since we opened it to set our * name, but have no further use for it */ orte_plm_base_close(); /* do the rest of the standard tool init */ if (ORTE_SUCCESS != (ret = orte_ess_base_tool_setup())) { ORTE_ERROR_LOG(ret); error = "orte_ess_base_tool_setup"; goto error; } return ORTE_SUCCESS; error: orte_show_help("help-ess-tool.txt", "tool:rte_init:startup:internal-failure", true, error, ORTE_ERROR_NAME(ret), ret); return ret; } /* * If we are a tool-without-name, then we look just like the HNP. * In that scenario, it could be beneficial to get a core file, so * we call abort. */ static void rte_abort(int status, bool report) { /* do NOT do a normal finalize as this will very likely * hang the process. We are aborting due to an abnormal condition * that precludes normal cleanup * * We do need to do the following bits to make sure we leave a * clean environment. Taken from orte_finalize(): * - Assume errmgr cleans up child processes before we exit. */ /* CRS cleanup since it may have a named pipe and thread active */ orte_cr_finalize(); /* - Clean out the global structures * (not really necessary, but good practice) */ orte_proc_info_finalize(); /* Now just exit */ exit(0); } static orte_vpid_t proc_get_daemon(orte_process_name_t *proc) { return ORTE_VPID_INVALID; } static int query_sys_info(char *node, char **keys, opal_list_t *values) { return ORTE_SUCCESS; }