/* * Copyright (c) 2004-2007 The Trustees of Indiana University and Indiana * University Research and Technology * Corporation. All rights reserved. * Copyright (c) 2004-2006 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. * Copyright (c) 2007 Sun Microsystems, Inc. All rights reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ */ #include "ompi_config.h" #if HAVE_UNISTD_H #include #endif /* HAVE_UNISTD_H*/ #ifdef HAVE_STDLIB_H #include #endif /* HAVE_STDLIB_H */ #include #include "opal/util/output.h" #include "opal/mca/base/base.h" #include "opal/mca/base/mca_base_param.h" #include "ompi/mca/allocator/base/base.h" #include "mpool_sm.h" #include "ompi/mca/common/sm/common_sm_mmap.h" #include "orte/util/proc_info.h" #include "orte/util/sys_info.h" #include "ompi/proc/proc.h" /* * Local functions */ static int mca_mpool_sm_open(void); static int mca_mpool_sm_close( void ); static mca_mpool_base_module_t* mca_mpool_sm_init( struct mca_mpool_base_resources_t* resources); mca_mpool_sm_component_t mca_mpool_sm_component = { { /* First, the mca_base_component_t struct containing meta information about the component itself */ { /* Indicate that we are a mpool v1.0.0 component (which also implies a specific MCA version) */ MCA_MPOOL_BASE_VERSION_1_0_0, "sm", /* MCA component name */ OMPI_MAJOR_VERSION, /* MCA component major version */ OMPI_MINOR_VERSION, /* MCA component minor version */ OMPI_RELEASE_VERSION, /* MCA component release version */ mca_mpool_sm_open, /* component open */ mca_mpool_sm_close }, /* Next the MCA v1.0.0 component meta data */ { /* The component is not checkpoint ready */ MCA_BASE_METADATA_PARAM_NONE }, mca_mpool_sm_init } }; static char *max_size_param, *min_size_param, *peer_size_param; static long default_max, default_min, default_peer; /** * component open/close/init function */ static int mca_mpool_sm_open(void) { int value = 0; char *size_str = NULL; default_max = 512*1024*1024; default_min = 128*1024*1024; default_peer = 32*1024*1024; /* register SM component parameters */ mca_base_param_reg_string(&mca_mpool_sm_component.super.mpool_version, "allocator", "Name of allocator component to use with sm mpool", false, false, "bucket", &mca_mpool_sm_component.sm_allocator_name); /* register values as string instead of int. A string-converted * signed long int allows the max_size or the sm_size * to be set up to 2GB-1 for 32 bit and much greater for 64 bit. */ asprintf(&size_str, "%ld", default_max); mca_base_param_reg_string(&mca_mpool_sm_component.super.mpool_version, "max_size", "Maximum size of the sm mpool shared memory file", false, false, size_str, &max_size_param); free(size_str); asprintf(&size_str, "%ld", default_min); mca_base_param_reg_string(&mca_mpool_sm_component.super.mpool_version, "min_size", "Minimum size of the sm mpool shared memory file", false, false, size_str, &min_size_param); free(size_str); asprintf(&size_str, "%ld", default_peer); mca_base_param_reg_string(&mca_mpool_sm_component.super.mpool_version, "per_peer_size", "Size (in bytes) to allocate per local peer in " "the sm mpool shared memory file, bounded by " "min_size and max_size", false, false, size_str, &peer_size_param); free(size_str); mca_base_param_reg_int(&mca_mpool_sm_component.super.mpool_version, "verbose", "Enable verbose output for mpool sm component", false, false, 0, &value); if (value != 0) { mca_mpool_sm_component.verbose = opal_output_open(NULL); } else { mca_mpool_sm_component.verbose = -1; } mca_mpool_sm_component.sm_size = 0; return OMPI_SUCCESS; } static int mca_mpool_sm_close( void ) { if( NULL != mca_common_sm_mmap ) { if( OMPI_SUCCESS == mca_common_sm_mmap_fini( mca_common_sm_mmap ) ) { unlink( mca_common_sm_mmap->map_path ); } OBJ_RELEASE( mca_common_sm_mmap ); } return OMPI_SUCCESS; } static mca_mpool_base_module_t* mca_mpool_sm_init( struct mca_mpool_base_resources_t* resources) { char *file_name; int len; mca_mpool_sm_module_t* mpool_module; mca_allocator_base_component_t* allocator_component; long max_size, min_size, peer_size; ompi_proc_t **procs; size_t num_all_procs, i, num_local_procs = 0; /* README: this needs to change if procs in different jobs (even spawned ones) are to talk using shared memory */ procs = ompi_proc_world(&num_all_procs); for (i = 0 ; i < num_all_procs ; ++i) { if (procs[i]->proc_flags & OMPI_PROC_FLAG_LOCAL) { num_local_procs++; } } free(procs); /* parse the max, min and peer sizes, and validate them */ /* absolutely necessary to reset errno each time */ errno = 0; max_size = strtol(max_size_param, (char **)NULL, 10); if (errno == ERANGE) { opal_output(0, "mca_mpool_sm_init: max_size overflows! set to default (%ld)", default_max); max_size = default_max; } else if (errno == EINVAL) { opal_output(0, "mca_mpool_sm_init: invalid max_size entered. set it to (%ld)", default_max); max_size = default_max; } errno = 0; min_size = strtol(min_size_param, (char **)NULL, 10); if (errno == ERANGE) { opal_output(0, "mca_mpool_sm_init: min_size overflows! set to default (%ld)", default_min); min_size = default_min; } else if (errno == EINVAL) { opal_output(0, "mca_mpool_sm_init: invalid min_size entered. set it to (%ld)", default_min); min_size = default_min; } errno = 0; peer_size = strtol(peer_size_param, (char **)NULL, 10); if (errno == ERANGE) { opal_output(0, "mca_mpool_sm_init: peer_size overflows! set to default (%ld)", default_peer); peer_size = default_peer; } else if (errno == EINVAL) { opal_output(0, "mca_mpool_sm_init: invalid peer_size entered. set it to (%ld)", default_peer); peer_size = default_peer; } /* more checks... */ if (min_size > max_size) { opal_output(0, "mca_mpool_sm_init: adjusting max_size to be min_size (%ld)", min_size); max_size = min_size; } /* sm_size is a product of peer_size * num_local_procs. To prevent the * sm_size from overflowing SIZE_MAX, we first calculate the quotient. * If quotient is less than the peer_size, it means the product * (peer_size * num_local_procs) is going to overflow SIZE_MAX, then we'll * set sm_size to max_size. */ if ((double)LONG_MAX / num_local_procs < peer_size) { /* enable verbose would show if sm_size overflows */ opal_output(mca_mpool_sm_component.verbose, "mca_mpool_sm_init: sm_size overflows, set sm_size to max_size (%ld)", LONG_MAX); mca_mpool_sm_component.sm_size = max_size; } else { mca_mpool_sm_component.sm_size = peer_size * num_local_procs; } if (min_size > mca_mpool_sm_component.sm_size) { mca_mpool_sm_component.sm_size = min_size; } if (max_size < mca_mpool_sm_component.sm_size) { mca_mpool_sm_component.sm_size = max_size; } allocator_component = mca_allocator_component_lookup( mca_mpool_sm_component.sm_allocator_name); /* if specified allocator cannot be loaded - look for an alternative */ if(NULL == allocator_component) { if(opal_list_get_size(&mca_allocator_base_components) == 0) { mca_base_component_list_item_t* item = (mca_base_component_list_item_t*) opal_list_get_first(&mca_allocator_base_components); allocator_component = (mca_allocator_base_component_t*)item->cli_component; opal_output(0, "mca_mpool_sm_init: unable to locate allocator: %s - using %s\n", mca_mpool_sm_component.sm_allocator_name, allocator_component->allocator_version.mca_component_name); } else { opal_output(0, "mca_mpool_sm_init: unable to locate allocator: %s\n", mca_mpool_sm_component.sm_allocator_name); return NULL; } } mpool_module = (mca_mpool_sm_module_t*)malloc(sizeof(mca_mpool_sm_module_t)); mca_mpool_sm_module_init(mpool_module); /* create initial shared memory mapping */ len = asprintf( &file_name, "%s"OPAL_PATH_SEP"shared_mem_pool.%s", orte_process_info.job_session_dir, orte_system_info.nodename ); if ( 0 > len ) { return NULL; } opal_output(mca_mpool_sm_component.verbose, "mca_mpool_sm_init: shared memory size used: (%ld)", mca_mpool_sm_component.sm_size); if(NULL == (mca_common_sm_mmap = mca_common_sm_mmap_init(mca_mpool_sm_component.sm_size, file_name,sizeof(mca_common_sm_mmap_t), 8 ) )) { opal_output(0, "mca_mpool_sm_init: unable to create shared memory mapping (%s)", file_name); free(file_name); return NULL; } free(file_name); /* setup allocator */ mpool_module->sm_allocator = allocator_component->allocator_init(true, mca_common_sm_mmap_seg_alloc, NULL, NULL); if(NULL == mpool_module->sm_allocator) { opal_output(0, "mca_mpool_sm_init: unable to initialize allocator"); return NULL; } return &mpool_module->super; }