2005-10-07 22:24:52 +00:00
|
|
|
/*
|
2005-11-05 19:57:48 +00:00
|
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
|
|
* University Research and Technology
|
|
|
|
* Corporation. All rights reserved.
|
|
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
|
|
* of Tennessee Research Foundation. All rights
|
|
|
|
* reserved.
|
2005-10-07 22:24:52 +00:00
|
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
|
|
* University of Stuttgart. All rights reserved.
|
|
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
|
|
* All rights reserved.
|
|
|
|
* $COPYRIGHT$
|
|
|
|
*
|
|
|
|
* Additional copyrights may follow
|
|
|
|
*
|
|
|
|
* $HEADER$
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "orte_config.h"
|
2008-02-28 01:57:57 +00:00
|
|
|
#include "orte/constants.h"
|
|
|
|
#include "orte/types.h"
|
2005-10-07 22:24:52 +00:00
|
|
|
|
|
|
|
#include "opal/mca/mca.h"
|
|
|
|
#include "opal/mca/base/base.h"
|
2006-10-17 16:06:17 +00:00
|
|
|
#include "opal/class/opal_list.h"
|
2009-02-14 02:26:12 +00:00
|
|
|
#include "opal/util/output.h"
|
2006-10-17 16:06:17 +00:00
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
#include "orte/util/show_help.h"
|
2008-02-28 01:57:57 +00:00
|
|
|
#include "opal/dss/dss.h"
|
2005-10-07 22:24:52 +00:00
|
|
|
#include "orte/mca/errmgr/errmgr.h"
|
2008-02-28 01:57:57 +00:00
|
|
|
#include "orte/util/name_fns.h"
|
|
|
|
#include "orte/runtime/orte_globals.h"
|
2008-08-05 15:09:29 +00:00
|
|
|
#include "orte/runtime/orte_wait.h"
|
2008-02-28 01:57:57 +00:00
|
|
|
#include "orte/util/hostfile/hostfile.h"
|
|
|
|
#include "orte/util/dash_host/dash_host.h"
|
2008-03-23 23:10:15 +00:00
|
|
|
#include "orte/util/proc_info.h"
|
2005-10-07 22:24:52 +00:00
|
|
|
|
2006-09-14 21:29:51 +00:00
|
|
|
#include "orte/mca/ras/base/ras_private.h"
|
2005-10-07 22:24:52 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Function for selecting one component from all those that are
|
|
|
|
* available.
|
|
|
|
*/
|
2008-02-28 01:57:57 +00:00
|
|
|
int orte_ras_base_allocate(orte_job_t *jdata)
|
2005-10-07 22:24:52 +00:00
|
|
|
{
|
2008-02-28 01:57:57 +00:00
|
|
|
int rc;
|
2006-10-19 23:33:51 +00:00
|
|
|
opal_list_t nodes;
|
2008-04-20 02:25:45 +00:00
|
|
|
orte_node_t *node, **alloc;
|
2008-02-28 01:57:57 +00:00
|
|
|
orte_std_cntr_t i;
|
|
|
|
bool override_oversubscribed;
|
|
|
|
orte_app_context_t **apps;
|
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-02-28 01:57:57 +00:00
|
|
|
"%s ras:base:allocate",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME)));
|
|
|
|
|
|
|
|
/* if we already did this, don't do it again - the pool of
|
|
|
|
* global resources is set.
|
|
|
|
*/
|
|
|
|
if (orte_ras_base.allocation_read) {
|
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-02-28 01:57:57 +00:00
|
|
|
"%s ras:base:allocate allocation already read",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME)));
|
|
|
|
|
2008-07-25 13:35:12 +00:00
|
|
|
/* loop through the global node pool and set the
|
|
|
|
* number of allocated slots to the difference
|
|
|
|
* between slots and slots_in_use. Note that
|
|
|
|
* oversubscription will still allow procs to
|
|
|
|
* be mapped up to slots_max
|
|
|
|
*/
|
2008-02-28 01:57:57 +00:00
|
|
|
return ORTE_SUCCESS;
|
2006-10-19 23:33:51 +00:00
|
|
|
}
|
2008-02-28 01:57:57 +00:00
|
|
|
|
|
|
|
/* Otherwise, we have to create
|
|
|
|
* the initial set of resources that will delineate all
|
|
|
|
* further operations serviced by this HNP. This list will
|
|
|
|
* contain ALL nodes that can be used by any subsequent job.
|
|
|
|
*
|
|
|
|
* In other words, if a node isn't found in this step, then
|
|
|
|
* no job launched by this HNP will be able to utilize it.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* note that the allocation has been read so we don't
|
|
|
|
* come in here again!
|
|
|
|
*/
|
|
|
|
orte_ras_base.allocation_read = true;
|
2006-10-19 23:33:51 +00:00
|
|
|
|
2008-02-28 01:57:57 +00:00
|
|
|
/* construct a list to hold the results */
|
|
|
|
OBJ_CONSTRUCT(&nodes, opal_list_t);
|
|
|
|
|
|
|
|
/* if a component was selected, then we know we are in a managed
|
|
|
|
* environment. - the active module will return a list of what it found
|
|
|
|
*/
|
|
|
|
if (NULL != orte_ras_base.active_module) {
|
|
|
|
/* read the allocation */
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ras_base.active_module->allocate(&nodes))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return rc;
|
2006-10-19 23:33:51 +00:00
|
|
|
}
|
2008-02-28 01:57:57 +00:00
|
|
|
}
|
|
|
|
/* If something came back, save it and we are done */
|
|
|
|
if (!opal_list_is_empty(&nodes)) {
|
|
|
|
/* store the results in the global resource pool - this removes the
|
|
|
|
* list items
|
|
|
|
*/
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ras_base_node_insert(&nodes, jdata))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return rc;
|
2006-10-19 23:33:51 +00:00
|
|
|
}
|
2008-02-28 01:57:57 +00:00
|
|
|
OBJ_DESTRUCT(&nodes);
|
2008-04-21 20:28:59 +00:00
|
|
|
goto DISPLAY;
|
2008-08-04 14:25:19 +00:00
|
|
|
} else if (orte_allocation_required) {
|
|
|
|
/* if nothing was found, and an allocation is
|
|
|
|
* required, then error out
|
|
|
|
*/
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
orte_show_help("help-ras-base.txt", "ras-base:no-allocation", true);
|
|
|
|
ORTE_UPDATE_EXIT_STATUS(ORTE_ERROR_DEFAULT_EXIT_CODE);
|
2008-08-05 15:09:29 +00:00
|
|
|
orte_trigger_event(&orte_exit);
|
2008-08-04 14:25:19 +00:00
|
|
|
return ORTE_ERROR;
|
2006-10-19 23:33:51 +00:00
|
|
|
}
|
2006-10-31 22:16:51 +00:00
|
|
|
|
2008-02-28 01:57:57 +00:00
|
|
|
|
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-02-28 01:57:57 +00:00
|
|
|
"%s ras:base:allocate nothing found in module - proceeding to hostfile",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME)));
|
|
|
|
|
|
|
|
/* nothing was found, or no active module was alive. Our next
|
|
|
|
* option is to look for a hostfile and assign our global
|
2008-03-05 04:54:57 +00:00
|
|
|
* pool from there. First, we check for a default hostfile
|
2008-08-19 15:17:40 +00:00
|
|
|
* as set by an mca param.
|
|
|
|
*
|
|
|
|
* Note that any relative node syntax found in the hostfile will
|
|
|
|
* generate an error in this scenario, so only non-relative syntax
|
|
|
|
* can be present
|
2008-03-05 04:54:57 +00:00
|
|
|
*/
|
|
|
|
if (NULL != orte_default_hostfile) {
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-03-05 04:54:57 +00:00
|
|
|
"%s ras:base:allocate parsing default hostfile %s",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME),
|
|
|
|
orte_default_hostfile));
|
|
|
|
|
|
|
|
/* a default hostfile was provided - parse it */
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_util_add_hostfile_nodes(&nodes,
|
|
|
|
&override_oversubscribed,
|
|
|
|
orte_default_hostfile))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/* if something was found in the default hostfile, we use that as our global
|
|
|
|
* pool - set it and we are done
|
|
|
|
*/
|
|
|
|
if (!opal_list_is_empty(&nodes)) {
|
|
|
|
/* store the results in the global resource pool - this removes the
|
|
|
|
* list items
|
|
|
|
*/
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ras_base_node_insert(&nodes, jdata))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
}
|
|
|
|
/* update the jdata object with override_oversubscribed flag */
|
|
|
|
jdata->oversubscribe_override = override_oversubscribed;
|
|
|
|
/* cleanup */
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
2008-04-21 20:28:59 +00:00
|
|
|
goto DISPLAY;
|
2008-03-05 04:54:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Individual hostfile names, if given, are included
|
2008-02-28 01:57:57 +00:00
|
|
|
* in the app_contexts for this job. We therefore need to
|
|
|
|
* retrieve the app_contexts for the job, and then cycle
|
|
|
|
* through them to see if anything is there. The parser will
|
|
|
|
* add the nodes found in each hostfile to our list - i.e.,
|
|
|
|
* the resulting list contains the UNION of all nodes specified
|
|
|
|
* in hostfiles from across all app_contexts
|
2008-08-19 15:17:40 +00:00
|
|
|
*
|
|
|
|
* Note that any relative node syntax found in the hostfiles will
|
|
|
|
* generate an error in this scenario, so only non-relative syntax
|
|
|
|
* can be present
|
2008-02-28 01:57:57 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
/* convenience def */
|
|
|
|
apps = (orte_app_context_t**)jdata->apps->addr;
|
|
|
|
|
|
|
|
for (i=0; i < jdata->num_apps; i++) {
|
|
|
|
if (NULL != apps[i]->hostfile) {
|
2006-10-31 22:16:51 +00:00
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-02-28 01:57:57 +00:00
|
|
|
"%s ras:base:allocate checking hostfile %s",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME),
|
|
|
|
apps[i]->hostfile));
|
|
|
|
|
|
|
|
/* hostfile was specified - parse it and add it to the list */
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_util_add_hostfile_nodes(&nodes,
|
|
|
|
&override_oversubscribed,
|
|
|
|
apps[i]->hostfile))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return rc;
|
2005-10-07 22:24:52 +00:00
|
|
|
}
|
|
|
|
}
|
2006-11-22 13:30:21 +00:00
|
|
|
}
|
2008-02-28 01:57:57 +00:00
|
|
|
|
|
|
|
/* if something was found in the hostfile(s), we use that as our global
|
|
|
|
* pool - set it and we are done
|
|
|
|
*/
|
2006-11-22 13:30:21 +00:00
|
|
|
if (!opal_list_is_empty(&nodes)) {
|
2008-02-28 01:57:57 +00:00
|
|
|
/* store the results in the global resource pool - this removes the
|
|
|
|
* list items
|
|
|
|
*/
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ras_base_node_insert(&nodes, jdata))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
}
|
|
|
|
/* update the jdata object with override_oversubscribed flag */
|
|
|
|
jdata->oversubscribe_override = override_oversubscribed;
|
|
|
|
/* cleanup */
|
2006-11-22 13:30:21 +00:00
|
|
|
OBJ_DESTRUCT(&nodes);
|
2008-04-21 20:28:59 +00:00
|
|
|
goto DISPLAY;
|
2006-10-31 22:16:51 +00:00
|
|
|
}
|
2008-02-28 01:57:57 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-02-28 01:57:57 +00:00
|
|
|
"%s ras:base:allocate nothing found in hostfiles - checking dash-host options",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME)));
|
|
|
|
|
|
|
|
/* Our next option is to look for hosts provided via the -host
|
|
|
|
* command line option. If they are present, we declare this
|
|
|
|
* to represent not just a mapping, but to define the global
|
|
|
|
* resource pool in the absence of any other info.
|
|
|
|
*
|
|
|
|
* -host lists are provided as part of the app_contexts for
|
|
|
|
* this job. We therefore need to retrieve the app_contexts
|
|
|
|
* for the job, and then cycle through them to see if anything
|
|
|
|
* is there. The parser will add the -host nodes to our list - i.e.,
|
|
|
|
* the resulting list contains the UNION of all nodes specified
|
|
|
|
* by -host across all app_contexts
|
2008-08-19 15:17:40 +00:00
|
|
|
*
|
|
|
|
* Note that any relative node syntax found in the -host lists will
|
|
|
|
* generate an error in this scenario, so only non-relative syntax
|
|
|
|
* can be present
|
2008-02-28 01:57:57 +00:00
|
|
|
*/
|
|
|
|
for (i=0; i < jdata->num_apps; i++) {
|
2008-03-06 12:46:36 +00:00
|
|
|
if (NULL != apps[i]->dash_host) {
|
2008-02-28 01:57:57 +00:00
|
|
|
if (ORTE_SUCCESS != (rc = orte_util_add_dash_host_nodes(&nodes,
|
|
|
|
&override_oversubscribed,
|
2008-03-05 22:12:27 +00:00
|
|
|
apps[i]->dash_host))) {
|
2008-02-28 01:57:57 +00:00
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return rc;
|
2006-10-31 22:16:51 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2005-10-07 22:24:52 +00:00
|
|
|
|
2008-02-28 01:57:57 +00:00
|
|
|
/* if something was found in -host, we use that as our global
|
|
|
|
* pool - set it and we are done
|
|
|
|
*/
|
|
|
|
if (!opal_list_is_empty(&nodes)) {
|
|
|
|
/* store the results in the global resource pool - this removes the
|
|
|
|
* list items
|
|
|
|
*/
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ras_base_node_insert(&nodes, jdata))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
}
|
|
|
|
/* update the jdata object with override_oversubscribed flag */
|
|
|
|
jdata->oversubscribe_override = override_oversubscribed;
|
|
|
|
/* cleanup */
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
2008-04-21 20:28:59 +00:00
|
|
|
goto DISPLAY;
|
2006-10-19 23:33:51 +00:00
|
|
|
}
|
2006-10-17 16:06:17 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
2008-06-09 14:53:58 +00:00
|
|
|
OPAL_OUTPUT_VERBOSE((5, orte_ras_base.ras_output,
|
2008-02-28 01:57:57 +00:00
|
|
|
"%s ras:base:allocate nothing found in dash-host - inserting current node",
|
|
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME)));
|
2006-10-17 16:06:17 +00:00
|
|
|
|
2008-02-28 01:57:57 +00:00
|
|
|
/* if nothing was found by any of the above methods, then we have no
|
|
|
|
* earthly idea what to do - so just add the local host
|
|
|
|
*/
|
|
|
|
node = OBJ_NEW(orte_node_t);
|
|
|
|
if (NULL == node) {
|
|
|
|
ORTE_ERROR_LOG(ORTE_ERR_OUT_OF_RESOURCE);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return ORTE_ERR_OUT_OF_RESOURCE;
|
2006-10-17 16:06:17 +00:00
|
|
|
}
|
2008-03-23 23:10:15 +00:00
|
|
|
/* use the same name we got in orte_process_info so we avoid confusion in
|
2008-02-28 01:57:57 +00:00
|
|
|
* the session directories
|
|
|
|
*/
|
2008-03-23 23:10:15 +00:00
|
|
|
node->name = strdup(orte_process_info.nodename);
|
2008-02-28 01:57:57 +00:00
|
|
|
node->state = ORTE_NODE_STATE_UP;
|
|
|
|
node->slots_inuse = 0;
|
|
|
|
node->slots_max = 0;
|
|
|
|
node->slots = 1;
|
|
|
|
/* indicate that we don't know anything about over_subscribing */
|
|
|
|
jdata->oversubscribe_override = true;
|
|
|
|
opal_list_append(&nodes, &node->super);
|
2006-10-17 16:06:17 +00:00
|
|
|
|
2008-02-28 01:57:57 +00:00
|
|
|
/* store the results in the global resource pool - this removes the
|
|
|
|
* list items
|
|
|
|
*/
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ras_base_node_insert(&nodes, jdata))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
OBJ_DESTRUCT(&nodes);
|
2008-04-21 20:28:59 +00:00
|
|
|
|
|
|
|
DISPLAY:
|
2008-04-20 02:25:45 +00:00
|
|
|
/* shall we display the results? */
|
|
|
|
if (orte_ras_base.display_alloc) {
|
2008-06-04 20:53:12 +00:00
|
|
|
char *tmp=NULL, *tmp2, *tmp3, *pfx=NULL;
|
|
|
|
if (orte_xml_output) {
|
|
|
|
asprintf(&tmp, "<allocation>\n");
|
|
|
|
pfx = "\t";
|
2008-09-28 16:44:09 +00:00
|
|
|
} else {
|
|
|
|
asprintf(&tmp, "\n====================== ALLOCATED NODES ======================\n");
|
2008-06-04 20:53:12 +00:00
|
|
|
}
|
2008-04-20 02:25:45 +00:00
|
|
|
alloc = (orte_node_t**)orte_node_pool->addr;
|
|
|
|
for (i=0; i < orte_node_pool->size; i++) {
|
|
|
|
if (NULL == alloc[i]) {
|
|
|
|
break;
|
|
|
|
}
|
2008-06-04 20:53:12 +00:00
|
|
|
opal_dss.print(&tmp2, pfx, alloc[i], ORTE_NODE);
|
|
|
|
if (NULL == tmp) {
|
|
|
|
tmp = tmp2;
|
|
|
|
} else {
|
|
|
|
asprintf(&tmp3, "%s%s", tmp, tmp2);
|
|
|
|
free(tmp);
|
|
|
|
free(tmp2);
|
|
|
|
tmp = tmp3;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (orte_xml_output) {
|
2008-12-08 19:37:22 +00:00
|
|
|
opal_output(orte_clean_output, "%s</allocation>\n", tmp);
|
2008-06-04 20:53:12 +00:00
|
|
|
} else {
|
2008-12-08 19:37:22 +00:00
|
|
|
opal_output(orte_clean_output, "%s\n\n=================================================================\n", tmp);
|
2008-04-20 02:25:45 +00:00
|
|
|
}
|
2008-09-28 16:44:09 +00:00
|
|
|
free(tmp);
|
2008-04-20 02:25:45 +00:00
|
|
|
}
|
|
|
|
|
2008-04-21 20:28:59 +00:00
|
|
|
return rc;
|
2006-10-17 16:06:17 +00:00
|
|
|
}
|