9613b3176c
After much work by Jeff and myself, and quite a lot of discussion, it has become clear that we simply cannot resolve the infinite loops caused by RML-involved subsystems calling orte_output. The original rationale for the change to orte_output has also been reduced by shifting the output of XML-formatted vs human readable messages to an alternative approach. I have globally replaced the orte_output/ORTE_OUTPUT calls in the code base, as well as the corresponding .h file name. I have test compiled and run this on the various environments within my reach, so hopefully this will prove minimally disruptive. This commit was SVN r18619.
458 строки
14 KiB
C
458 строки
14 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "ompi_config.h"
|
|
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <stdlib.h>
|
|
|
|
#include "mpi.h"
|
|
#include "ompi/file/file.h"
|
|
#include "opal/util/argv.h"
|
|
#include "orte/util/show_help.h"
|
|
#include "opal/class/opal_list.h"
|
|
#include "opal/class/opal_object.h"
|
|
#include "opal/mca/mca.h"
|
|
#include "opal/mca/base/base.h"
|
|
#include "ompi/mca/io/io.h"
|
|
#include "ompi/mca/io/base/base.h"
|
|
#include "ompi/mca/io/base/io_base_request.h"
|
|
|
|
|
|
/*
|
|
* Local types
|
|
*/
|
|
struct avail_io_t {
|
|
opal_list_item_t super;
|
|
|
|
mca_io_base_version_t ai_version;
|
|
|
|
int ai_priority;
|
|
mca_io_base_components_t ai_component;
|
|
mca_io_base_modules_t ai_module;
|
|
struct mca_io_base_file_t *ai_module_data;
|
|
};
|
|
typedef struct avail_io_t avail_io_t;
|
|
|
|
/*
|
|
* Local functions
|
|
*/
|
|
static opal_list_t *check_components(opal_list_t *components,
|
|
ompi_file_t *file,
|
|
char **names, int num_names);
|
|
static avail_io_t *check_one_component(ompi_file_t *file,
|
|
const mca_base_component_t *component);
|
|
|
|
static avail_io_t *query(const mca_base_component_t *component,
|
|
ompi_file_t *file);
|
|
static avail_io_t *query_1_0_0(const mca_io_base_component_1_0_0_t *io_component,
|
|
ompi_file_t *file);
|
|
|
|
static void unquery(avail_io_t *avail, ompi_file_t *file);
|
|
|
|
static int module_init(ompi_file_t *file);
|
|
|
|
|
|
/*
|
|
* Stuff for the OBJ interface
|
|
*/
|
|
static OBJ_CLASS_INSTANCE(avail_io_t, opal_list_item_t, NULL, NULL);
|
|
|
|
|
|
/*
|
|
* This function is called at the initialization time of every
|
|
* file. It is used to select which io component will be
|
|
* active for a given file.
|
|
*/
|
|
int mca_io_base_file_select(ompi_file_t *file,
|
|
mca_base_component_t *preferred)
|
|
{
|
|
int err, num_names;
|
|
char *names, **name_array;
|
|
char *str;
|
|
opal_list_t *selectable;
|
|
opal_list_item_t *item;
|
|
avail_io_t *avail, selected;
|
|
|
|
/* Announce */
|
|
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: new file: %s",
|
|
file->f_filename);
|
|
|
|
/* Initialize all the relevant pointers, since they're used as
|
|
sentinel values */
|
|
|
|
file->f_io_version = MCA_IO_BASE_V_NONE;
|
|
file->f_io_selected_data = NULL;
|
|
|
|
/* See if a set of component was requested by the MCA parameter.
|
|
Don't check for error. */
|
|
|
|
names = NULL;
|
|
mca_base_param_lookup_string(mca_io_base_param, &names);
|
|
|
|
/* Compute the intersection of all of my available components with
|
|
the components from all the other processes in this file */
|
|
|
|
/* JMS CONTINUE HERE */
|
|
|
|
/* See if a preferred component was provided. If so, try to
|
|
select it. If we don't succeed, fall through and do a normal
|
|
selection. */
|
|
|
|
err = OMPI_ERROR;
|
|
if (NULL != preferred) {
|
|
str = &(preferred->mca_component_name[0]);
|
|
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: Checking preferred module: %s",
|
|
str);
|
|
selectable = check_components(&mca_io_base_components_available,
|
|
file, &str, 1);
|
|
|
|
/* If we didn't get a preferred module, then call again
|
|
without a preferred module. This makes the logic below
|
|
dramatically simpler. */
|
|
|
|
if (NULL == selectable) {
|
|
return mca_io_base_file_select(file, NULL);
|
|
}
|
|
|
|
/* We only fall through here if we were able to select one of
|
|
the preferred modules */
|
|
}
|
|
|
|
/* If there was no preferred module, then see if there were any
|
|
listed in the MCA parameter; parse them and check them all */
|
|
|
|
else if (NULL != names && 0 < strlen(names)) {
|
|
name_array = opal_argv_split(names, ',');
|
|
num_names = opal_argv_count(name_array);
|
|
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: Checking specific modules: %s",
|
|
names);
|
|
selectable = check_components(&mca_io_base_components_available,
|
|
file, name_array, num_names);
|
|
opal_argv_free(name_array);
|
|
}
|
|
|
|
/* Nope -- a specific [set of] component[s] was not requested. Go
|
|
check them all. */
|
|
|
|
else {
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: Checking all available modules");
|
|
selectable = check_components(&mca_io_base_components_available,
|
|
file, NULL, 0);
|
|
}
|
|
|
|
/* Upon return from the above, the modules list will contain the
|
|
list of modules that returned (priority >= 0). If we have no
|
|
io modules available, it's an error */
|
|
|
|
if (NULL == selectable) {
|
|
/* There's no modules available. Doh! */
|
|
/* show_help */
|
|
return OMPI_ERROR;
|
|
}
|
|
|
|
/* Do some kind of collective operation to find a module that
|
|
everyone has available */
|
|
|
|
#if 1
|
|
/* For the moment, just take the top module off the list */
|
|
|
|
item = opal_list_remove_first(selectable);
|
|
avail = (avail_io_t *) item;
|
|
selected = *avail;
|
|
OBJ_RELEASE(avail);
|
|
#else
|
|
/* JMS CONTINUE HERE */
|
|
#endif
|
|
|
|
/* Everything left in the selectable list is therefore unwanted,
|
|
and we call their unquery() method (because they all had
|
|
query() invoked, but will never have init() invoked in this
|
|
scope). */
|
|
|
|
for (item = opal_list_remove_first(selectable); item != NULL;
|
|
item = opal_list_remove_first(selectable)) {
|
|
avail = (avail_io_t *) item;
|
|
unquery(avail, file);
|
|
OBJ_RELEASE(item);
|
|
}
|
|
OBJ_RELEASE(selectable);
|
|
|
|
/* Save the pointers of the selected module on the ompi_file_t */
|
|
|
|
file->f_io_version = selected.ai_version;
|
|
file->f_io_selected_component = selected.ai_component;
|
|
file->f_io_selected_module = selected.ai_module;
|
|
file->f_io_selected_data = selected.ai_module_data;
|
|
|
|
/* Finally -- intialize the selected module. */
|
|
|
|
if (OMPI_SUCCESS != (err = module_init(file))) {
|
|
return err;
|
|
}
|
|
|
|
/* Add the component to the list of components that the io
|
|
framework is maintaining */
|
|
|
|
mca_io_base_component_add(&selected.ai_component);
|
|
|
|
/* Announce the winner */
|
|
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: Selected io module %s",
|
|
selected.ai_component.v1_0_0.io_version.mca_component_name);
|
|
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
|
|
/*
|
|
* For each component in the list, if it is in the list of names (or
|
|
* the list of names is NULL), then check and see if it wants to run,
|
|
* and do the resulting priority comparison. Make a list of
|
|
* (component, module) tuples (of type avail_io_t) to be only those
|
|
* who returned that they want to run, and put them in priority order.
|
|
*/
|
|
static opal_list_t *check_components(opal_list_t *components,
|
|
ompi_file_t *file,
|
|
char **names, int num_names)
|
|
{
|
|
int i;
|
|
const mca_base_component_t *component;
|
|
opal_list_item_t *item, *item2;
|
|
bool want_to_check;
|
|
opal_list_t *selectable;
|
|
avail_io_t *avail, *avail2;
|
|
|
|
/* Make a list of the components that query successfully */
|
|
|
|
selectable = OBJ_NEW(opal_list_t);
|
|
|
|
/* Scan through the list of components. This nested loop is
|
|
O(N^2), but we should never have too many components and/or
|
|
names, so this *hopefully* shouldn't matter... */
|
|
|
|
for (item = opal_list_get_first(components);
|
|
item != opal_list_get_end(components);
|
|
item = opal_list_get_next(item)) {
|
|
component = ((mca_base_component_priority_list_item_t *)
|
|
item)->super.cli_component;
|
|
|
|
/* If we have a list of names, scan through it */
|
|
|
|
if (0 == num_names) {
|
|
want_to_check = true;
|
|
} else {
|
|
want_to_check = false;
|
|
for (i = 0; i < num_names; ++i) {
|
|
if (0 == strcmp(names[i], component->mca_component_name)) {
|
|
want_to_check = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* If we determined that we want to check this component, then
|
|
do so */
|
|
|
|
if (want_to_check) {
|
|
avail = check_one_component(file, component);
|
|
if (NULL != avail) {
|
|
|
|
/* Put this item on the list in priority order
|
|
(highest priority first). Should it go first? */
|
|
|
|
item2 = opal_list_get_first(selectable);
|
|
avail2 = (avail_io_t *) item2;
|
|
if (opal_list_get_end(selectable) == item2 ||
|
|
avail->ai_priority > avail2->ai_priority) {
|
|
opal_list_prepend(selectable, (opal_list_item_t*) avail);
|
|
} else {
|
|
for (i = 1; item2 != opal_list_get_end(selectable);
|
|
item2 = opal_list_get_next(selectable), ++i) {
|
|
avail2 = (avail_io_t *) item2;
|
|
if (avail->ai_priority > avail2->ai_priority) {
|
|
opal_list_insert(selectable,
|
|
(opal_list_item_t *) avail, i);
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* If we didn't find a place to put it in the
|
|
list, then append it (because it has the lowest
|
|
priority found so far) */
|
|
|
|
if (opal_list_get_end(selectable) == item2) {
|
|
opal_list_append(selectable,
|
|
(opal_list_item_t *) avail);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* If we didn't find any available components, return an error */
|
|
|
|
if (0 == opal_list_get_size(selectable)) {
|
|
OBJ_RELEASE(selectable);
|
|
return NULL;
|
|
}
|
|
|
|
/* All done */
|
|
|
|
return selectable;
|
|
}
|
|
|
|
|
|
/*
|
|
* Check a single component
|
|
*/
|
|
static avail_io_t *check_one_component(ompi_file_t *file,
|
|
const mca_base_component_t *component)
|
|
{
|
|
avail_io_t *avail;
|
|
|
|
avail = query(component, file);
|
|
if (NULL != avail) {
|
|
avail->ai_priority = (avail->ai_priority < 100) ?
|
|
avail->ai_priority : 100;
|
|
avail->ai_priority = (avail->ai_priority < 0) ?
|
|
0 : avail->ai_priority;
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: component available: %s, priority: %d",
|
|
component->mca_component_name,
|
|
avail->ai_priority);
|
|
} else {
|
|
opal_output_verbose(10, mca_io_base_output,
|
|
"io:base:file_select: component not available: %s",
|
|
component->mca_component_name);
|
|
}
|
|
|
|
return avail;
|
|
}
|
|
|
|
|
|
/**************************************************************************
|
|
* Query functions
|
|
**************************************************************************/
|
|
|
|
/*
|
|
* Take any version of a io module, query it, and return the right
|
|
* module struct
|
|
*/
|
|
static avail_io_t *query(const mca_base_component_t *component,
|
|
ompi_file_t *file)
|
|
{
|
|
const mca_io_base_component_1_0_0_t *ioc_100;
|
|
|
|
/* io v1.0.0 */
|
|
|
|
if (1 == component->mca_major_version &&
|
|
0 == component->mca_minor_version &&
|
|
0 == component->mca_release_version) {
|
|
ioc_100 = (mca_io_base_component_1_0_0_t *) component;
|
|
|
|
return query_1_0_0(ioc_100, file);
|
|
}
|
|
|
|
/* Unknown io API version -- return error */
|
|
|
|
return NULL;
|
|
}
|
|
|
|
|
|
static avail_io_t *query_1_0_0(const mca_io_base_component_1_0_0_t *component,
|
|
ompi_file_t *file)
|
|
{
|
|
int priority;
|
|
avail_io_t *avail;
|
|
const mca_io_base_module_1_0_0_t *module;
|
|
struct mca_io_base_file_t *module_data;
|
|
|
|
/* Query v1.0.0 */
|
|
|
|
avail = NULL;
|
|
module_data = NULL;
|
|
module = component->io_file_query(file, &module_data, &priority);
|
|
if (NULL != module) {
|
|
avail = OBJ_NEW(avail_io_t);
|
|
avail->ai_version = MCA_IO_BASE_V_1_0_0;
|
|
avail->ai_priority = priority;
|
|
avail->ai_component.v1_0_0 = *component;
|
|
avail->ai_module.v1_0_0 = *module;
|
|
avail->ai_module_data = module_data;
|
|
}
|
|
|
|
return avail;
|
|
}
|
|
|
|
|
|
/**************************************************************************
|
|
* Unquery functions
|
|
**************************************************************************/
|
|
|
|
static void unquery(avail_io_t *avail, ompi_file_t *file)
|
|
{
|
|
const mca_io_base_component_1_0_0_t *ioc_100;
|
|
|
|
switch(avail->ai_version) {
|
|
case MCA_IO_BASE_V_1_0_0:
|
|
ioc_100 = &(avail->ai_component.v1_0_0);
|
|
ioc_100->io_file_unquery(file, avail->ai_module_data);
|
|
break;
|
|
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
|
|
/**************************************************************************
|
|
* Module_Init functions
|
|
**************************************************************************/
|
|
|
|
/*
|
|
* Initialize a module
|
|
*/
|
|
static int module_init(ompi_file_t *file)
|
|
{
|
|
const mca_io_base_module_1_0_0_t *iom_100;
|
|
|
|
switch(file->f_io_version) {
|
|
case MCA_IO_BASE_V_1_0_0:
|
|
iom_100 = &(file->f_io_selected_module.v1_0_0);
|
|
return iom_100->io_module_file_open(file->f_comm, file->f_filename,
|
|
file->f_amode, file->f_info,
|
|
file);
|
|
break;
|
|
|
|
default:
|
|
return OMPI_ERROR;
|
|
break;
|
|
}
|
|
|
|
/* No way to reach here */
|
|
}
|