4c28c8cbd0
using the modex or RML to share sm initialization information, have node rank 0 create a file containing initialization information in a well-known place. Then during add_procs, the rest of the node processes requiring sm BTL initialization will just read from that file to complete their initialization. This commit was SVN r27789.
216 строки
8.1 KiB
C
216 строки
8.1 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2009-2010 Cisco Systems, Inc. All rights reserved.
|
|
* Copyright (c) 2010-2012 Los Alamos National Security, LLC.
|
|
* All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#ifndef _COMMON_SM_H_
|
|
#define _COMMON_SM_H_
|
|
|
|
#include "ompi_config.h"
|
|
|
|
#include "opal/mca/mca.h"
|
|
#include "opal/class/opal_object.h"
|
|
#include "opal/class/opal_list.h"
|
|
#include "opal/sys/atomic.h"
|
|
#include "opal/mca/shmem/shmem.h"
|
|
|
|
#include "ompi/mca/mpool/mpool.h"
|
|
#include "ompi/proc/proc.h"
|
|
#include "ompi/group/group.h"
|
|
#include "ompi/mca/btl/base/base.h"
|
|
#include "ompi/mca/btl/base/btl_base_error.h"
|
|
|
|
BEGIN_C_DECLS
|
|
|
|
struct mca_mpool_base_module_t;
|
|
|
|
typedef struct mca_common_sm_seg_header_t {
|
|
/* lock to control atomic access */
|
|
opal_atomic_lock_t seg_lock;
|
|
/* indicates whether or not the segment is ready for use */
|
|
volatile int32_t seg_inited;
|
|
/* number of local processes that are attached to the shared memory segment.
|
|
* this is primarily used as a way of determining whether or not it is safe
|
|
* to unlink the shared memory backing store. for example, once seg_att
|
|
* is equal to the number of local processes, then we can safely unlink.
|
|
*/
|
|
volatile size_t seg_num_procs_inited;
|
|
/* offset to next available memory location available for allocation */
|
|
size_t seg_offset;
|
|
/* total size of the segment */
|
|
size_t seg_size;
|
|
} mca_common_sm_seg_header_t;
|
|
|
|
typedef struct mca_common_sm_module_t {
|
|
/* double link list element */
|
|
opal_list_item_t super;
|
|
/* pointer to header embedded in the shared memory segment */
|
|
mca_common_sm_seg_header_t *module_seg;
|
|
/* base address of the segment */
|
|
unsigned char *module_seg_addr;
|
|
/* base address of data segment */
|
|
unsigned char *module_data_addr;
|
|
/* shared memory backing facility object that encapsulates shmem info */
|
|
opal_shmem_ds_t shmem_ds;
|
|
} mca_common_sm_module_t;
|
|
|
|
OBJ_CLASS_DECLARATION(mca_common_sm_module_t);
|
|
|
|
/**
|
|
* This routine reorders procs array to have all the local procs at the
|
|
* beginning and returns the number of local procs through out_num_local_procs.
|
|
* The proc with the lowest name is at the beginning of the reordered procs
|
|
* array.
|
|
*
|
|
* @returnvalue OMPI_SUCCESS on success, something else, otherwise.
|
|
*/
|
|
OMPI_DECLSPEC extern int
|
|
mca_common_sm_local_proc_reorder(ompi_proc_t **procs,
|
|
size_t num_procs,
|
|
size_t *out_num_local_procs);
|
|
|
|
/**
|
|
* This routine is used to create and attach to a shared memory segment
|
|
* (whether it's an mmaped file or a SYSV IPC segment). It is assumed that
|
|
* the shared memory segment does not exist before this call.
|
|
*
|
|
* @returnvalue pointer to control structure at head of shared memory segment.
|
|
* Returns NULL if an error occurred.
|
|
*/
|
|
OMPI_DECLSPEC extern mca_common_sm_module_t *
|
|
mca_common_sm_module_create_and_attach(size_t size,
|
|
char *file_name,
|
|
size_t size_ctl_structure,
|
|
size_t data_seg_alignment);
|
|
|
|
/**
|
|
* This routine is used to attach to the shared memory segment associated with
|
|
* *seg_meta. It is assumed that the shared memory segment associated with
|
|
* *seg_meta was already created with mca_common_sm_module_create.
|
|
*
|
|
* @seg_meta points to shared memory information used for initialization and setup.
|
|
*
|
|
* @returnvalue pointer to control structure at head of shared memory segment.
|
|
* Returns NULL if an error occurred.
|
|
*/
|
|
OMPI_DECLSPEC extern mca_common_sm_module_t *
|
|
mca_common_sm_module_attach(opal_shmem_ds_t *seg_meta,
|
|
size_t size_ctl_structure,
|
|
size_t data_seg_alignment);
|
|
|
|
/**
|
|
* A thin wrapper around opal_shmem_unlink.
|
|
*
|
|
* @ modp points to an initialized mca_common_sm_module_t.
|
|
*
|
|
* @returnvalue OMPI_SUCCESS if the operation completed successfully,
|
|
* OMPI_ERROR otherwise.
|
|
*/
|
|
OMPI_DECLSPEC extern int
|
|
mca_common_sm_module_unlink(mca_common_sm_module_t *modp);
|
|
|
|
/**
|
|
* This routine is used to set up a shared memory segment (whether
|
|
* it's an mmaped file or a SYSV IPC segment). It is assumed that
|
|
* the shared memory segment does not exist before any of the current
|
|
* set of processes try and open it.
|
|
*
|
|
* @param procs - array of (ompi_proc_t *)'s to create this shared
|
|
* memory segment for. This array must be writable; it may be edited
|
|
* (in undefined ways) if the array contains procs that are not on
|
|
* this host. It is assumed that the caller will simply free this
|
|
* array upon return. (INOUT)
|
|
*
|
|
* @param num_procs - length of the procs array (IN)
|
|
*
|
|
* @param size - size of the segment, in bytes (IN)
|
|
*
|
|
* @param name - unique string identifier of this segment (IN)
|
|
*
|
|
* @param size_ctl_structure size of the control structure at
|
|
* the head of the segment. The control structure
|
|
* is assumed to have mca_common_sm_seg_header_t
|
|
* as its first segment (IN)
|
|
*
|
|
* @param data_set_alignment alignment of the data segment. this
|
|
* follows the control structure. If this
|
|
* value if 0, then assume that there will
|
|
* be no data segment following the control
|
|
* structure. (IN)
|
|
*
|
|
* @returnvalue pointer to control structure at head of shared memory segment.
|
|
*/
|
|
OMPI_DECLSPEC extern mca_common_sm_module_t *
|
|
mca_common_sm_init(ompi_proc_t **procs,
|
|
size_t num_procs,
|
|
size_t size,
|
|
char *file_name,
|
|
size_t size_ctl_structure,
|
|
size_t data_seg_alignment);
|
|
|
|
/**
|
|
* This routine is used to set up a shared memory segment (whether
|
|
* it's an mmaped file or a SYSV IPC segment). It is assumed that
|
|
* the shared memory segment does not exist before any of the current
|
|
* set of processes try and open it.
|
|
*
|
|
* This routine is the same as mca_common_sm_mmap_init() except that
|
|
* it takes an (ompi_group_t *) parameter to specify the peers rather
|
|
* than an array of procs. Unlike mca_common_sm_mmap_init(), the
|
|
* group must contain *only* local peers, or this function will return
|
|
* NULL and not create any shared memory segment.
|
|
*/
|
|
OMPI_DECLSPEC extern mca_common_sm_module_t *
|
|
mca_common_sm_init_group(ompi_group_t *group,
|
|
size_t size,
|
|
char *file_name,
|
|
size_t size_ctl_structure,
|
|
size_t data_seg_alignment);
|
|
|
|
/**
|
|
* callback from the sm mpool
|
|
*/
|
|
OMPI_DECLSPEC extern void *
|
|
mca_common_sm_seg_alloc(struct mca_mpool_base_module_t *mpool,
|
|
size_t *size,
|
|
mca_mpool_base_registration_t **registration);
|
|
|
|
/**
|
|
* This function will release all local resources attached to the
|
|
* shared memory segment. We assume that the operating system will
|
|
* release the memory resources when the last process release it.
|
|
*
|
|
* @param mca_common_sm_module - instance that is shared between
|
|
* components that use shared memory.
|
|
*
|
|
* @return OMPI_SUCCESS if everything was okay, otherwise return OMPI_ERROR.
|
|
*/
|
|
|
|
OMPI_DECLSPEC extern int
|
|
mca_common_sm_fini(mca_common_sm_module_t *mca_common_sm_module);
|
|
|
|
/**
|
|
* instance that is shared between components that use shared memory.
|
|
*/
|
|
OMPI_DECLSPEC extern mca_common_sm_module_t *mca_common_sm_module;
|
|
|
|
END_C_DECLS
|
|
|
|
#endif /* _COMMON_SM_H_ */
|