check point.
This commit was SVN r17457.
Этот коммит содержится в:
родитель
58bf7f5a1d
Коммит
292d930eea
@ -20,7 +20,10 @@ not_used_yet =
|
|||||||
|
|
||||||
sources = \
|
sources = \
|
||||||
coll_sm2.h \
|
coll_sm2.h \
|
||||||
coll_sm2_component.c
|
coll_sm2_component.c \
|
||||||
|
coll_sm2_module.c \
|
||||||
|
coll_sm2_allreduce.c \
|
||||||
|
coll_sm2_barrier.c
|
||||||
|
|
||||||
# Make the output library in this directory, and name it either
|
# Make the output library in this directory, and name it either
|
||||||
# mca_<type>_<name>.la (for DSO builds) or libmca_<type>_<name>.la
|
# mca_<type>_<name>.la (for DSO builds) or libmca_<type>_<name>.la
|
||||||
|
@ -28,6 +28,7 @@
|
|||||||
#include "ompi/mca/coll/coll.h"
|
#include "ompi/mca/coll/coll.h"
|
||||||
#include "ompi/mca/mpool/mpool.h"
|
#include "ompi/mca/mpool/mpool.h"
|
||||||
#include "ompi/mca/common/sm/common_sm_mmap.h"
|
#include "ompi/mca/common/sm/common_sm_mmap.h"
|
||||||
|
#include "ompi/request/request.h"
|
||||||
|
|
||||||
BEGIN_C_DECLS
|
BEGIN_C_DECLS
|
||||||
|
|
||||||
@ -96,6 +97,9 @@ BEGIN_C_DECLS
|
|||||||
/** MCA parameter: number of regions per memory bank */
|
/** MCA parameter: number of regions per memory bank */
|
||||||
size_t sm2_num_regions_per_bank;
|
size_t sm2_num_regions_per_bank;
|
||||||
|
|
||||||
|
/** MCA parameter: order of barrier tree */
|
||||||
|
int order_barrier_tree;
|
||||||
|
|
||||||
};
|
};
|
||||||
|
|
||||||
/**
|
/**
|
||||||
@ -104,6 +108,67 @@ BEGIN_C_DECLS
|
|||||||
typedef struct mca_coll_sm2_component_t mca_coll_sm2_component_t;
|
typedef struct mca_coll_sm2_component_t mca_coll_sm2_component_t;
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* N-order tree node description
|
||||||
|
*/
|
||||||
|
struct tree_node_t {
|
||||||
|
int my_rank;
|
||||||
|
int tree_size;
|
||||||
|
int n_parents;
|
||||||
|
int n_children;
|
||||||
|
int parent_rank;
|
||||||
|
int *children_ranks;
|
||||||
|
};
|
||||||
|
typedef struct tree_node_t tree_node_t;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Barrier request objects
|
||||||
|
*/
|
||||||
|
|
||||||
|
/* shared memory data strucutures */
|
||||||
|
struct mca_coll_sm2_nb_request_process_shared_mem_t {
|
||||||
|
/* flag used to indicate the status of this memory region */
|
||||||
|
long long flag;
|
||||||
|
|
||||||
|
/* pading */
|
||||||
|
char padding[CACHE_LINE_SIZE-sizeof(long long)];
|
||||||
|
};
|
||||||
|
typedef struct mca_coll_sm2_nb_request_process_shared_mem_t
|
||||||
|
mca_coll_sm2_nb_request_process_shared_mem_t;
|
||||||
|
|
||||||
|
|
||||||
|
/* enum for phase at which the nb barrier is in */
|
||||||
|
enum{
|
||||||
|
NB_BARRIER_FAN_IN,
|
||||||
|
NB_BARRIER_FAN_OUT,
|
||||||
|
/* done and not started are the same for all practicle
|
||||||
|
* purposes, as the init funtion always sets this flag
|
||||||
|
*/
|
||||||
|
NB_BARRIER_DONE
|
||||||
|
};
|
||||||
|
/* process private data structures */
|
||||||
|
struct mca_coll_sm2_nb_request_process_private_mem_t {
|
||||||
|
struct ompi_request_t super;
|
||||||
|
/* tag that will be used as unique barrier identifier */
|
||||||
|
long long tag;
|
||||||
|
|
||||||
|
/* pointer to module */
|
||||||
|
/* shared memory strucuture index - will be flip-flopping between structures */
|
||||||
|
int sm_index;
|
||||||
|
|
||||||
|
/* this processes base address of the barrier shared memory region */
|
||||||
|
mca_coll_sm2_nb_request_process_shared_mem_t *barrier_base_address[2];
|
||||||
|
|
||||||
|
/* module pointer */
|
||||||
|
mca_coll_sm2_module_t *coll_sm2_module;
|
||||||
|
|
||||||
|
/* barrier phase */
|
||||||
|
sm2_barrier_phase;
|
||||||
|
|
||||||
|
};
|
||||||
|
typedef struct mca_coll_sm2_nb_request_process_private_mem_t
|
||||||
|
mca_coll_sm2_nb_request_process_private_mem_t;
|
||||||
|
|
||||||
struct mca_coll_sm2_module_t {
|
struct mca_coll_sm2_module_t {
|
||||||
/* base structure */
|
/* base structure */
|
||||||
mca_coll_base_module_1_1_0_t super;
|
mca_coll_base_module_1_1_0_t super;
|
||||||
@ -117,12 +182,65 @@ BEGIN_C_DECLS
|
|||||||
/* Memory pointer to shared file */
|
/* Memory pointer to shared file */
|
||||||
char *shared_memory_region;
|
char *shared_memory_region;
|
||||||
|
|
||||||
|
/* Pointer to the collective buffers */
|
||||||
|
char *collective_buffer_region;
|
||||||
|
|
||||||
|
/* size of memory region, per process, for memory bank management */
|
||||||
|
size_t sm2_size_management_region_per_proc;
|
||||||
|
|
||||||
|
/* size of each memory segment */
|
||||||
|
size_t segment_size;
|
||||||
|
|
||||||
|
/* size, per process, of each memory segment */
|
||||||
|
size_t segement_size_per_process;
|
||||||
|
|
||||||
|
/* number of memory banks */
|
||||||
|
int sm2_module_num_memory_banks;
|
||||||
|
|
||||||
|
/* number of buffers per memory bank */
|
||||||
|
int sm2_module_num_regions_per_bank;
|
||||||
|
|
||||||
|
/* total number of working buffers */
|
||||||
|
int sm2_module_num_buffers;
|
||||||
|
|
||||||
|
/* allocated buffer index - local counter */
|
||||||
|
int sm2_allocated_buffer_index;
|
||||||
|
|
||||||
|
/* freed allocated buffer index - local counter */
|
||||||
|
int sm2_freed_buffer_index;
|
||||||
|
|
||||||
|
/* index of first buffer in next memory bank - need to
|
||||||
|
* make sure next bank is ready for use, before we use it.
|
||||||
|
* We complete the non-blocking barrier before allocating
|
||||||
|
* this buffer.
|
||||||
|
*/
|
||||||
|
int sm2_first_buffer_index_next_bank;
|
||||||
|
|
||||||
|
/* index of last buffer in this memory bank -
|
||||||
|
* We start the non-blocking barrier after allocating
|
||||||
|
* this buffer.
|
||||||
|
*/
|
||||||
|
int sm2_last_buffer_index_this_bank;
|
||||||
|
|
||||||
|
/* communicator - there is a one-to-one association between
|
||||||
|
* the communicator and the module
|
||||||
|
*/
|
||||||
|
struct ompi_communicator_t *module_comm;
|
||||||
|
|
||||||
|
/* non-blocking barrier strcutres used for mangeing the shared
|
||||||
|
* buffers */
|
||||||
|
tree_node_t barrier_tree;
|
||||||
|
|
||||||
|
mca_coll_sm2_nb_request_process_private_mem_t *barrier_request;
|
||||||
|
|
||||||
|
/* unique tag used for non-blocking collectives */
|
||||||
|
long long nb_barrier_tag;
|
||||||
|
|
||||||
};
|
};
|
||||||
|
|
||||||
typedef struct mca_coll_sm2_module_t mca_coll_sm2_module_t;
|
typedef struct mca_coll_sm2_module_t mca_coll_sm2_module_t;
|
||||||
OBJ_CLASS_DECLARATION(mca_coll_sm2_module_t);
|
OBJ_CLASS_DECLARATION(mca_coll_sm2_module_t);
|
||||||
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Global component instance
|
* Global component instance
|
||||||
*/
|
*/
|
||||||
@ -145,6 +263,11 @@ BEGIN_C_DECLS
|
|||||||
struct mca_coll_base_module_1_1_0_t *
|
struct mca_coll_base_module_1_1_0_t *
|
||||||
mca_coll_sm2_comm_query(struct ompi_communicator_t *comm, int *priority);
|
mca_coll_sm2_comm_query(struct ompi_communicator_t *comm, int *priority);
|
||||||
|
|
||||||
|
/* non-blocking barrier - init function */
|
||||||
|
int mca_coll_sm2_nbbarrier_intra(struct ompi_communicator_t *comm,
|
||||||
|
mca_coll_sm2_nb_request_process_private_mem_t *request,
|
||||||
|
struct mca_coll_base_module_1_1_0_t *module);
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Macro to setup flag usage
|
* Macro to setup flag usage
|
||||||
*/
|
*/
|
||||||
|
@ -41,7 +41,7 @@
|
|||||||
/*
|
/*
|
||||||
* Public string showing the coll ompi_sm V2 component version number
|
* Public string showing the coll ompi_sm V2 component version number
|
||||||
*/
|
*/
|
||||||
const char *mca_coll_sm_component_version_string =
|
const char *mca_coll_sm2_component_version_string =
|
||||||
"Open MPI sm-V2 collective MCA component version " OMPI_VERSION;
|
"Open MPI sm-V2 collective MCA component version " OMPI_VERSION;
|
||||||
|
|
||||||
|
|
||||||
@ -58,20 +58,6 @@ static int sm2_module_enable(struct mca_coll_base_module_1_1_0_t *module,
|
|||||||
static int sm2_open(void);
|
static int sm2_open(void);
|
||||||
static int sm2_close(void);
|
static int sm2_close(void);
|
||||||
|
|
||||||
static bool have_local_peers(ompi_group_t *group, size_t size)
|
|
||||||
{
|
|
||||||
size_t i;
|
|
||||||
ompi_proc_t *proc;
|
|
||||||
|
|
||||||
for (i = 0; i < size; ++i) {
|
|
||||||
proc = ompi_group_peer_lookup(group,i);
|
|
||||||
if (0 == (proc->proc_flags & OMPI_PROC_FLAG_LOCAL)) {
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return true;
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline int mca_coll_sm2_param_register_int(
|
static inline int mca_coll_sm2_param_register_int(
|
||||||
const char* param_name, int default_value)
|
const char* param_name, int default_value)
|
||||||
{
|
{
|
||||||
@ -81,142 +67,6 @@ static inline int mca_coll_sm2_param_register_int(
|
|||||||
return param_value;
|
return param_value;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
|
||||||
* Create mmaped shared file
|
|
||||||
*/
|
|
||||||
|
|
||||||
static int allocate_shared_file(size_t size, char *file_name,
|
|
||||||
struct ompi_communicator_t *comm, char **sm_backing_file)
|
|
||||||
{
|
|
||||||
int fd = -1;
|
|
||||||
int group_size,my_rank;
|
|
||||||
|
|
||||||
bool i_create_shared_file=false;
|
|
||||||
size_t p;
|
|
||||||
int rc=0, sm_file_inited=0;
|
|
||||||
struct iovec iov[2];
|
|
||||||
int sm_file_created;
|
|
||||||
ompi_proc_t **comm_proc_list;
|
|
||||||
|
|
||||||
/* get the list of procs */
|
|
||||||
comm_proc_list=comm->c_local_group->grp_proc_pointers;
|
|
||||||
|
|
||||||
group_size=ompi_comm_size(comm);
|
|
||||||
my_rank=ompi_comm_rank(comm);
|
|
||||||
|
|
||||||
/* determine who will actually create the file */
|
|
||||||
if( my_rank == 0 ) {
|
|
||||||
i_create_shared_file=true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* open the backing file. */
|
|
||||||
if( i_create_shared_file ) {
|
|
||||||
/* process initializing the file */
|
|
||||||
fd = open(file_name, O_CREAT|O_RDWR, 0600);
|
|
||||||
if (fd < 0) {
|
|
||||||
opal_output(0,"mca_common_sm_mmap_init: open %s failed with errno=%d\n",
|
|
||||||
file_name, errno);
|
|
||||||
goto file_opened;
|
|
||||||
}
|
|
||||||
/* map the file and initialize segment state */
|
|
||||||
*sm_backing_file = (char *)
|
|
||||||
mmap(NULL, size, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
|
|
||||||
if( (void*)-1 == sm_backing_file ) {
|
|
||||||
opal_output(0, "mca_common_sm_mmap_init: mmap failed with errno=%d\n",
|
|
||||||
errno);
|
|
||||||
goto file_opened;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* truncate the file to the requested size */
|
|
||||||
if(ftruncate(fd, size) != 0) {
|
|
||||||
opal_output(0,
|
|
||||||
"mca_common_sm_mmap_init: ftruncate failed with errno=%d\n",
|
|
||||||
errno);
|
|
||||||
goto file_opened;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* if we got this far, the file has been initialized correctly */
|
|
||||||
sm_file_inited=1;
|
|
||||||
|
|
||||||
file_opened:
|
|
||||||
|
|
||||||
/* signal the rest of the local procs that the backing file
|
|
||||||
* has been created - not very scalable, but for small shared
|
|
||||||
* memory nodes is adequate for now
|
|
||||||
*/
|
|
||||||
for(p=1 ; p < group_size ; p++ ) {
|
|
||||||
sm_file_created=OMPI_RML_TAG_COLL_SM2_BACK_FILE_CREATED;
|
|
||||||
iov[0].iov_base=&sm_file_created;
|
|
||||||
iov[0].iov_len=sizeof(sm_file_created);
|
|
||||||
iov[1].iov_base=&sm_file_inited;
|
|
||||||
iov[1].iov_len=sizeof(sm_file_inited);
|
|
||||||
rc=orte_rml.send(&(comm_proc_list[p]->proc_name),iov,2,
|
|
||||||
OMPI_RML_TAG_COLL_SM2_BACK_FILE_CREATED,0);
|
|
||||||
if( rc < 0 ) {
|
|
||||||
opal_output(0,
|
|
||||||
"allocate_shared_file: orte_rml.send failed to %lu with errno=%d\n",
|
|
||||||
(unsigned long)p, errno);
|
|
||||||
goto return_error;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
if ( 0 == sm_file_inited ) {
|
|
||||||
/* error - the sm backing file did not get opened correctly */
|
|
||||||
goto return_error;
|
|
||||||
}
|
|
||||||
} else {
|
|
||||||
/* all other procs wait for the file to be initialized
|
|
||||||
before using the backing file */
|
|
||||||
iov[0].iov_base=&sm_file_created;
|
|
||||||
iov[0].iov_len=sizeof(sm_file_created);
|
|
||||||
iov[1].iov_base=&sm_file_inited;
|
|
||||||
iov[1].iov_len=sizeof(sm_file_inited);
|
|
||||||
rc=orte_rml.recv(&(comm_proc_list[0]->proc_name),iov,2,
|
|
||||||
OMPI_RML_TAG_COLL_SM2_BACK_FILE_CREATED,0);
|
|
||||||
if( rc < 0 ) {
|
|
||||||
opal_output(0, "allocate_shared_file: orte_rml.recv failed from %ld with errno=%d\n",
|
|
||||||
0L, errno);
|
|
||||||
goto return_error;
|
|
||||||
}
|
|
||||||
/* check to see if file inited correctly */
|
|
||||||
if( 0 == sm_file_inited ) {
|
|
||||||
goto return_error;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* open backing file */
|
|
||||||
fd = open(file_name, O_RDWR, 0600);
|
|
||||||
if (fd < 0) {
|
|
||||||
opal_output(0,"mca_common_sm_mmap_init: open %s failed with errno=%d\n",
|
|
||||||
file_name, errno);
|
|
||||||
goto return_error;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* map the file and initialize segment state */
|
|
||||||
*sm_backing_file = (char *)
|
|
||||||
mmap(NULL, size, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
|
|
||||||
if( (void*)-1 == sm_backing_file ) {
|
|
||||||
opal_output(0, "mca_common_sm_mmap_init: mmap failed with errno=%d\n",
|
|
||||||
errno);
|
|
||||||
goto return_error;
|
|
||||||
}
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
/* enable access by other processes on this host */
|
|
||||||
close(fd);
|
|
||||||
|
|
||||||
return OMPI_SUCCESS;
|
|
||||||
|
|
||||||
return_error:
|
|
||||||
if( -1 != fd ) {
|
|
||||||
close(fd);
|
|
||||||
}
|
|
||||||
|
|
||||||
if( NULL != sm_backing_file ) munmap((void*) sm_backing_file,size);
|
|
||||||
|
|
||||||
return OMPI_ERROR;
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Instantiate the public struct with all of our public information
|
* Instantiate the public struct with all of our public information
|
||||||
* and pointers to our public functions in it
|
* and pointers to our public functions in it
|
||||||
@ -265,34 +115,10 @@ mca_coll_sm2_component_t mca_coll_sm2_component = {
|
|||||||
/* sm-component specifc information */
|
/* sm-component specifc information */
|
||||||
|
|
||||||
/* (default) priority */
|
/* (default) priority */
|
||||||
/* JMS temporarily lowered until we can get more testing */
|
|
||||||
0,
|
0,
|
||||||
|
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
static void
|
|
||||||
mca_coll_sm2_module_construct(mca_coll_sm2_module_t *module)
|
|
||||||
{
|
|
||||||
/* debug */
|
|
||||||
fprintf(stderr," sm2 constructor called \n");
|
|
||||||
fflush(stderr);
|
|
||||||
/* end debug */
|
|
||||||
}
|
|
||||||
|
|
||||||
static void
|
|
||||||
mca_coll_sm2_module_destruct(mca_coll_sm2_module_t *module)
|
|
||||||
{
|
|
||||||
int ret;
|
|
||||||
/* remove shared memory backing file */
|
|
||||||
if( module->shared_memory_region) {
|
|
||||||
ret=munmap(module->shared_memory_region,
|
|
||||||
module->size_sm2_backing_file);
|
|
||||||
/* this is cleanup, no recovery will be done */
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Open the component
|
* Open the component
|
||||||
*/
|
*/
|
||||||
@ -339,6 +165,10 @@ static int sm2_open(void)
|
|||||||
cs->sm2_num_regions_per_bank=
|
cs->sm2_num_regions_per_bank=
|
||||||
mca_coll_sm2_param_register_int("sm2_num_regions_per_bank",8);
|
mca_coll_sm2_param_register_int("sm2_num_regions_per_bank",8);
|
||||||
|
|
||||||
|
/* Order of Barrier Tree */
|
||||||
|
cs->order_barrier_tree=
|
||||||
|
mca_coll_sm2_param_register_int("order_barrier_tree",2);
|
||||||
|
|
||||||
return OMPI_SUCCESS;
|
return OMPI_SUCCESS;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -362,212 +192,3 @@ int mca_coll_sm2_init_query(bool enable_progress_threads,
|
|||||||
/* done */
|
/* done */
|
||||||
return OMPI_SUCCESS;
|
return OMPI_SUCCESS;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
/* query to see if the module is available for use on the given
|
|
||||||
* communicator, and if so, what it's priority is. This is where
|
|
||||||
* the backing shared-memory file is created.
|
|
||||||
*/
|
|
||||||
struct mca_coll_base_module_1_1_0_t *
|
|
||||||
mca_coll_sm2_comm_query(struct ompi_communicator_t *comm, int *priority)
|
|
||||||
{
|
|
||||||
/* local variables */
|
|
||||||
mca_coll_sm2_module_t *sm_module;
|
|
||||||
int group_size,ret;
|
|
||||||
size_t alignment,size,size_tot,size_tot_per_proc_per_seg;
|
|
||||||
size_t tot_size_per_bank,size_tot_per_segment;
|
|
||||||
size_t tot_size_mem_banks;
|
|
||||||
size_t ctl_memory_per_proc_per_segment;
|
|
||||||
size_t mem_management_per_proc_per_block;
|
|
||||||
size_t mem_management_per_proc;
|
|
||||||
size_t mem_management_total;
|
|
||||||
size_t size_sm2_backing_file;
|
|
||||||
size_t len;
|
|
||||||
|
|
||||||
/*
|
|
||||||
* This is activated only for intra-communicators
|
|
||||||
*/
|
|
||||||
if (OMPI_COMM_IS_INTER(comm) ) {
|
|
||||||
return NULL;
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
|
||||||
* Use only if more than on proc in the communicator
|
|
||||||
*/
|
|
||||||
if (1 == ompi_comm_size(comm) ) {
|
|
||||||
return NULL;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* check to see if all procs are on the same node, and therefore
|
|
||||||
* can communicate using shared memory
|
|
||||||
*/
|
|
||||||
if ( !have_local_peers(comm->c_local_group, ompi_comm_size(comm))) {
|
|
||||||
return NULL;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Get our priority */
|
|
||||||
*priority = mca_coll_sm2_component.sm2_priority;
|
|
||||||
|
|
||||||
/* allocate and initialize an sm-v2 module */
|
|
||||||
sm_module = OBJ_NEW(mca_coll_sm2_module_t);
|
|
||||||
|
|
||||||
sm_module->super.coll_module_enable = sm2_module_enable;
|
|
||||||
sm_module->super.ft_event = NULL;
|
|
||||||
sm_module->super.coll_allgather = NULL;
|
|
||||||
sm_module->super.coll_allgatherv = NULL;
|
|
||||||
sm_module->super.coll_allreduce = NULL;
|
|
||||||
sm_module->super.coll_alltoall = NULL;
|
|
||||||
sm_module->super.coll_alltoallv = NULL;
|
|
||||||
sm_module->super.coll_alltoallw = NULL;
|
|
||||||
sm_module->super.coll_barrier = NULL;
|
|
||||||
sm_module->super.coll_bcast = NULL;
|
|
||||||
sm_module->super.coll_exscan = NULL;
|
|
||||||
sm_module->super.coll_gather = NULL;
|
|
||||||
sm_module->super.coll_gatherv = NULL;
|
|
||||||
sm_module->super.coll_reduce = NULL;
|
|
||||||
sm_module->super.coll_reduce_scatter = NULL;
|
|
||||||
sm_module->super.coll_scan = NULL;
|
|
||||||
sm_module->super.coll_scatter = NULL;
|
|
||||||
sm_module->super.coll_scatterv = NULL;
|
|
||||||
|
|
||||||
/*
|
|
||||||
* create backing file
|
|
||||||
*/
|
|
||||||
|
|
||||||
/*
|
|
||||||
* set group size
|
|
||||||
*/
|
|
||||||
group_size=ompi_comm_size(comm);
|
|
||||||
|
|
||||||
/*
|
|
||||||
* get control region size
|
|
||||||
*/
|
|
||||||
/* just enough place for one flag per process */
|
|
||||||
ctl_memory_per_proc_per_segment=sizeof(int);
|
|
||||||
if( mca_coll_sm2_component.sm2_ctl_size_per_proc > ctl_memory_per_proc_per_segment )
|
|
||||||
ctl_memory_per_proc_per_segment=mca_coll_sm2_component.sm2_ctl_size_per_proc;
|
|
||||||
ctl_memory_per_proc_per_segment=ctl_memory_per_proc_per_segment * group_size ;
|
|
||||||
|
|
||||||
/* pad this up to the alignment needed by the data segment, as the
|
|
||||||
* that data segment will directly follow the control segment in
|
|
||||||
* memory.
|
|
||||||
*/
|
|
||||||
alignment=mca_coll_sm2_component.sm2_data_alignment;
|
|
||||||
ctl_memory_per_proc_per_segment=
|
|
||||||
(alignment + ctl_memory_per_proc_per_segment -1) / alignment;
|
|
||||||
ctl_memory_per_proc_per_segment*=alignment;
|
|
||||||
mca_coll_sm2_component.sm2_ctl_size_allocated=ctl_memory_per_proc_per_segment;
|
|
||||||
|
|
||||||
/* get data region size - allocation happens on a page granularity, with
|
|
||||||
* a minimum of a page allocated per proc, so adjust to this
|
|
||||||
*/
|
|
||||||
size=mca_coll_sm2_component.sm2_data_seg_size;
|
|
||||||
if( size > mca_coll_sm2_component.sm2_max_data_seg_size )
|
|
||||||
size=mca_coll_sm2_component.sm2_max_data_seg_size;
|
|
||||||
size_tot_per_proc_per_seg=size+ mca_coll_sm2_component.sm2_ctl_size_allocated;
|
|
||||||
if( size_tot_per_proc_per_seg < getpagesize())
|
|
||||||
size_tot_per_proc_per_seg=getpagesize();
|
|
||||||
/* round this up to the nearest integer page-size multiple */
|
|
||||||
size_tot_per_proc_per_seg= ( size_tot_per_proc_per_seg + getpagesize() - 1)/
|
|
||||||
getpagesize();
|
|
||||||
size_tot_per_proc_per_seg*=getpagesize();
|
|
||||||
|
|
||||||
/* compute segment memory needed */
|
|
||||||
size_tot_per_segment=group_size * size_tot_per_proc_per_seg ;
|
|
||||||
|
|
||||||
/* compute memory per bank */
|
|
||||||
tot_size_per_bank=size_tot_per_segment*mca_coll_sm2_component.sm2_num_regions_per_bank;
|
|
||||||
|
|
||||||
/* compute total memory in the memory banks */
|
|
||||||
tot_size_mem_banks=tot_size_per_bank*mca_coll_sm2_component.sm2_num_mem_banks;
|
|
||||||
|
|
||||||
/* compute the amount of memory needed for the anynchromous barriers used to
|
|
||||||
* manage the memory resources.
|
|
||||||
*/
|
|
||||||
/* for each bank, 2 sets of barrier buffers */
|
|
||||||
mem_management_per_proc_per_block= 2 * CACHE_LINE_SIZE ;
|
|
||||||
/* add in number of banks */
|
|
||||||
mem_management_per_proc= mem_management_per_proc_per_block *
|
|
||||||
mca_coll_sm2_component.sm2_num_mem_banks;
|
|
||||||
/* round up to page multiples */
|
|
||||||
mem_management_per_proc=(mem_management_per_proc +
|
|
||||||
getpagesize() -1 ) / getpagesize();
|
|
||||||
mem_management_per_proc*=getpagesize();
|
|
||||||
|
|
||||||
/* total memory management required */
|
|
||||||
mem_management_total=mem_management_per_proc * group_size;
|
|
||||||
|
|
||||||
/* total size of backing file */
|
|
||||||
size_sm2_backing_file=mem_management_total+tot_size_mem_banks;
|
|
||||||
sm_module->size_sm2_backing_file=size_sm2_backing_file;
|
|
||||||
|
|
||||||
/* set file name */
|
|
||||||
len=asprintf(&(sm_module->coll_sm2_file_name),
|
|
||||||
"%s"OPAL_PATH_SEP"sm_coll_v2%s_%0d",orte_process_info.job_session_dir,
|
|
||||||
orte_system_info.nodename,ompi_comm_get_cid(comm));
|
|
||||||
if( 0 > len ) {
|
|
||||||
goto CLEANUP;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* allocate backing file */
|
|
||||||
ret=allocate_shared_file(size_sm2_backing_file,
|
|
||||||
sm_module->coll_sm2_file_name, comm,
|
|
||||||
&(sm_module->shared_memory_region));
|
|
||||||
if( MPI_SUCCESS != ret ) {
|
|
||||||
goto CLEANUP;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* debug */
|
|
||||||
fprintf(stderr," GGGG file %s len %ld prt %p \n",
|
|
||||||
sm_module->coll_sm2_file_name,
|
|
||||||
sm_module->size_sm2_backing_file,
|
|
||||||
sm_module->shared_memory_region);
|
|
||||||
fflush(stderr);
|
|
||||||
/* end debug */
|
|
||||||
|
|
||||||
/* initialize local counters */
|
|
||||||
|
|
||||||
/* set pointers */
|
|
||||||
|
|
||||||
/* touch pages to apply memory affinity - Note: do we really need this or will
|
|
||||||
* the algorithms do this */
|
|
||||||
|
|
||||||
/* return */
|
|
||||||
return &(sm_module->super);
|
|
||||||
|
|
||||||
|
|
||||||
CLEANUP:
|
|
||||||
OBJ_RELEASE(sm_module);
|
|
||||||
|
|
||||||
if( NULL == sm_module->coll_sm2_file_name ) {
|
|
||||||
free(sm_module->coll_sm2_file_name);
|
|
||||||
}
|
|
||||||
|
|
||||||
return NULL;
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
|
||||||
* Init module on the communicator
|
|
||||||
*/
|
|
||||||
static int
|
|
||||||
sm2_module_enable(struct mca_coll_base_module_1_1_0_t *module,
|
|
||||||
struct ompi_communicator_t *comm)
|
|
||||||
{
|
|
||||||
/* local variables */
|
|
||||||
char output_buffer[2*MPI_MAX_OBJECT_NAME];
|
|
||||||
|
|
||||||
memset(&output_buffer[0],0,sizeof(output_buffer));
|
|
||||||
snprintf(output_buffer,sizeof(output_buffer),"%s (cid %d)", comm->c_name,
|
|
||||||
comm->c_contextid);
|
|
||||||
opal_output_verbose(10, mca_coll_base_output,
|
|
||||||
"coll:sm2:enable: new communicator: %s", output_buffer);
|
|
||||||
|
|
||||||
/* All done */
|
|
||||||
return OMPI_SUCCESS;
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
OBJ_CLASS_INSTANCE(mca_coll_sm2_module_t,
|
|
||||||
mca_coll_base_module_1_1_0_t,
|
|
||||||
mca_coll_sm2_module_construct,
|
|
||||||
mca_coll_sm2_module_destruct);
|
|
||||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user