8b8bee04d6
This patch contains the following items: * Fix the flag passed to open() for the read side of the named pipe between the local and app coordinator. There is a race condition when using O_RDWR on a named pipe (not sure how that bug got in there in the first place). * Adjust control in the C/R thread timing * Clarify return code in BLCR component * Allow the user to adjust the max wait time for the named pipes in the FileM local coordinator by using the MCA parameter "snapc_full_max_wait_time" (Default: 20 seconds) * If the application terminates while there are active FileM operations, force mpirun to wait on these operations to complete. * Allow the user to set the local copy command (Default: cp) via MCA parameter "filem_rsh_cp" * Implement the ability to throttle the number of outgoing connections in FileM. At larger scales this type of explicit throttling helps prevent overwhelming the HNP machine. Default: 10, set via MCA parameter: {{{filem_rsh_max_outgoing}}} This commit was SVN r21167. The following SVN revision numbers were found above: r21131 --> open-mpi/ompi@0deb009225
87 строки
2.4 KiB
C
87 строки
2.4 KiB
C
/*
|
|
* Copyright (c) 2004-2009 The Trustees of Indiana University.
|
|
* All rights reserved.
|
|
* Copyright (c) 2004-2005 The Trustees of the University of Tennessee.
|
|
* All rights reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
*
|
|
* RSH FILEM component
|
|
*
|
|
*/
|
|
|
|
#ifndef MCA_FILEM_RSH_EXPORT_H
|
|
#define MCA_FILEM_RSH_EXPORT_H
|
|
|
|
#include "orte_config.h"
|
|
|
|
#include "opal/mca/mca.h"
|
|
#include "orte/mca/filem/filem.h"
|
|
|
|
#if defined(c_plusplus) || defined(__cplusplus)
|
|
extern "C" {
|
|
#endif
|
|
|
|
/*
 * Integer codes used by the RSH FILEM component.
 *
 * NOTE(review): this header does not show where these are consumed.
 * Presumably they are the message/state codes of the transfer-throttling
 * handshake (request permission, permission granted, transfer finished) --
 * confirm against the component implementation.
 */
#define ORTE_FILEM_RSH_ASK   0
#define ORTE_FILEM_RSH_ALLOW 1
#define ORTE_FILEM_RSH_DONE  2
|
|
|
|
/*
|
|
* Local Component structures
|
|
*/
|
|
struct orte_filem_rsh_component_t {
|
|
/** Base FILEM component */
|
|
orte_filem_base_component_t super;
|
|
|
|
/** RSH cp command: rsh = rcp, ssh = scp */
|
|
char * cp_command;
|
|
|
|
/** Unix cp command */
|
|
char * cp_local_command;
|
|
|
|
/** SSH remote login command */
|
|
char * remote_sh_command;
|
|
};
|
|
typedef struct orte_filem_rsh_component_t orte_filem_rsh_component_t;
|
|
/** The single instance of the RSH FILEM component (defined elsewhere). */
ORTE_MODULE_DECLSPEC extern orte_filem_rsh_component_t mca_filem_rsh_component;

/*
 * Connection limits (declared here, defined elsewhere).
 *
 * NOTE(review): presumably upper bounds on simultaneous incoming / outgoing
 * file-transfer connections, used for throttling -- confirm against the
 * component source. The spelling "incomming" is part of the exported symbol
 * name and must stay as-is for existing users of the symbol.
 */
extern int orte_filem_rsh_max_incomming;
extern int orte_filem_rsh_max_outgoing;
|
|
|
|
/**
 * Component query entry point.
 *
 * @param module   Output: receives a pointer to a module.
 * @param priority Output: receives an integer priority.
 * @return Integer status code.
 *
 * NOTE(review): the exact contract (which module is returned, how the
 * priority is chosen, which status codes are used) is defined by the
 * implementation and the MCA base, not by this header -- confirm there.
 */
int orte_filem_rsh_component_query(mca_base_module_t **module, int *priority);
|
|
|
|
/*
|
|
* Module functions
|
|
*/
|
|
int orte_filem_rsh_module_init(void);
|
|
int orte_filem_rsh_module_finalize(void);
|
|
|
|
int orte_filem_rsh_put(orte_filem_base_request_t *request);
|
|
int orte_filem_rsh_put_nb(orte_filem_base_request_t *request);
|
|
|
|
int orte_filem_rsh_get(orte_filem_base_request_t *request);
|
|
int orte_filem_rsh_get_nb(orte_filem_base_request_t *request);
|
|
|
|
int orte_filem_rsh_rm( orte_filem_base_request_t *request);
|
|
int orte_filem_rsh_rm_nb( orte_filem_base_request_t *request);
|
|
|
|
int orte_filem_rsh_wait( orte_filem_base_request_t *request);
|
|
int orte_filem_rsh_wait_all( opal_list_t *request_list);
|
|
|
|
#if defined(c_plusplus) || defined(__cplusplus)
|
|
}
|
|
#endif
|
|
|
|
#endif /* MCA_FILEM_RSH_EXPORT_H */
|