dadca7da88
This merge adds Checkpoint/Restart support to Open MPI. The initial frameworks and components support a LAM/MPI-like implementation. This commit follows the risk assessment presented to the Open MPI core development group on Feb. 22, 2007. This commit closes trac:158. More details to follow. This commit was SVN r14051. The following SVN revisions from the original message are invalid or inconsistent and therefore were not cross-referenced: r13912. The following Trac tickets were found above: Ticket 158 --> https://svn.open-mpi.org/trac/ompi/ticket/158
172 строки
5.6 KiB
C
172 строки
5.6 KiB
C
/*
 * Copyright (c) 2004-2007 The Trustees of Indiana University.
 *                         All rights reserved.
 * Copyright (c) 2004-2005 The Trustees of the University of Tennessee.
 *                         All rights reserved.
 * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
 *                         University of Stuttgart.  All rights reserved.
 * Copyright (c) 2004-2005 The Regents of the University of California.
 *                         All rights reserved.
 * $COPYRIGHT$
 *
 * Additional copyrights may follow
 *
 * $HEADER$
 */
|
|
|
|
#include "opal_config.h"
|
|
|
|
#include "opal/constants.h"
|
|
#include "opal/mca/crs/crs.h"
|
|
#include "opal/mca/crs/base/base.h"
|
|
#include "crs_self.h"
|
|
|
|
/*
|
|
* Public string for version number
|
|
*/
|
|
const char *opal_crs_self_component_version_string =
|
|
"OPAL CRS self MCA component version " OMPI_VERSION;
|
|
|
|
/*
 * File-local component hooks.  Both are referenced from the component
 * structure defined below and implemented at the end of this file.
 */
static int crs_self_open(void);
static int crs_self_close(void);
|
|
|
|
/*
|
|
* Instantiate the public struct with all of our public information
|
|
* and pointer to our public functions in it
|
|
*/
|
|
opal_crs_self_component_t mca_crs_self_component = {
|
|
/* First do the base component stuff */
|
|
{
|
|
/* Handle the general mca_component_t struct containing
|
|
* meta information about the component itself
|
|
*/
|
|
{
|
|
OPAL_CRS_BASE_VERSION_1_0_0,
|
|
/* Component name and version */
|
|
"self",
|
|
OMPI_MAJOR_VERSION,
|
|
OMPI_MINOR_VERSION,
|
|
OMPI_RELEASE_VERSION,
|
|
|
|
/* Component open and close functions */
|
|
crs_self_open,
|
|
crs_self_close
|
|
},
|
|
|
|
/* Next the MCA v1.0.0 component meta data */
|
|
{
|
|
/* The component is checkpoint ready */
|
|
MCA_BASE_METADATA_PARAM_CHECKPOINT
|
|
},
|
|
|
|
/* Query Function */
|
|
opal_crs_self_component_query,
|
|
/* Verbosity level */
|
|
0,
|
|
/* opal_output handler */
|
|
-1,
|
|
/* Default priority */
|
|
20
|
|
},
|
|
/* Default prefix */
|
|
PREFIX_DEFAULT,
|
|
/* If we are restarting right out of the gate */
|
|
false,
|
|
/* Checkpointing enabled */
|
|
true,
|
|
/* Callbacks */
|
|
NULL,
|
|
NULL,
|
|
NULL
|
|
};
|
|
|
|
static int crs_self_open(void)
|
|
{
|
|
int value;
|
|
|
|
/*
|
|
* This should be the last componet to ever get used since
|
|
* it doesn't do anything.
|
|
*/
|
|
mca_base_param_reg_int(&mca_crs_self_component.super.crs_version,
|
|
"priority",
|
|
"Priority of the CRS self component",
|
|
false, false,
|
|
mca_crs_self_component.super.priority,
|
|
&mca_crs_self_component.super.priority);
|
|
|
|
mca_base_param_reg_int(&mca_crs_self_component.super.crs_version,
|
|
"verbose",
|
|
"Verbose level for the CRS self component",
|
|
false, false,
|
|
mca_crs_self_component.super.verbose,
|
|
&mca_crs_self_component.super.verbose);
|
|
/* If there is a custom verbose level for this component than use it
|
|
* otherwise take our parents level and output channel
|
|
*/
|
|
if ( 0 != mca_crs_self_component.super.verbose) {
|
|
mca_crs_self_component.super.output_handle = opal_output_open(NULL);
|
|
opal_output_set_verbosity(mca_crs_self_component.super.output_handle,
|
|
mca_crs_self_component.super.verbose);
|
|
} else {
|
|
mca_crs_self_component.super.output_handle = opal_crs_base_output;
|
|
}
|
|
|
|
/*
|
|
* Handler names
|
|
*/
|
|
mca_base_param_reg_string(&mca_crs_self_component.super.crs_version,
|
|
"prefix",
|
|
"Prefix for user defined callback functions",
|
|
false, false,
|
|
mca_crs_self_component.prefix,
|
|
&mca_crs_self_component.prefix);
|
|
|
|
mca_base_param_reg_int(&mca_crs_self_component.super.crs_version,
|
|
"do_restart",
|
|
"Start execution by calling restart callback",
|
|
false, false,
|
|
mca_crs_self_component.do_restart,
|
|
&value);
|
|
if(value == 0)
|
|
mca_crs_self_component.do_restart = false;
|
|
else
|
|
mca_crs_self_component.do_restart = true;
|
|
|
|
/*
|
|
* Debug Output
|
|
*/
|
|
opal_output_verbose(10, mca_crs_self_component.super.output_handle,
|
|
"crs:self: open()");
|
|
opal_output_verbose(20, mca_crs_self_component.super.output_handle,
|
|
"crs:self: open: priority = %d",
|
|
mca_crs_self_component.super.priority);
|
|
opal_output_verbose(20, mca_crs_self_component.super.output_handle,
|
|
"crs:self: open: verbosity = %d",
|
|
mca_crs_self_component.super.verbose);
|
|
opal_output_verbose(20, mca_crs_self_component.super.output_handle,
|
|
"crs:self: open: prefix = %s",
|
|
mca_crs_self_component.prefix);
|
|
opal_output_verbose(20, mca_crs_self_component.super.output_handle,
|
|
"crs:self: open: do_restart = %d",
|
|
mca_crs_self_component.do_restart);
|
|
|
|
return OPAL_SUCCESS;
|
|
}
|
|
|
|
static int crs_self_close(void)
|
|
{
|
|
opal_output_verbose(10, mca_crs_self_component.super.output_handle,
|
|
"crs:self: close()");
|
|
|
|
if(NULL != mca_crs_self_component.prefix ) {
|
|
free(mca_crs_self_component.prefix);
|
|
mca_crs_self_component.prefix = NULL;
|
|
}
|
|
|
|
return OPAL_SUCCESS;
|
|
}
|