5ccab7bcda
- Move mca_btl_udapl_error/mca_btl_module_init to mca_btl_udapl.c and rename it - White space cleanups - Free the uDAPL evd and ia handles in mca_btl_udapl_finalize This commit was SVN r8705.
349 строки
11 KiB
C
349 строки
11 KiB
C
/*
|
|
* Copyright (c) 2004-2006 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
|
|
#include "ompi_config.h"
|
|
#include "ompi/include/constants.h"
|
|
#include "opal/event/event.h"
|
|
#include "opal/util/if.h"
|
|
#include "opal/util/argv.h"
|
|
#include "opal/util/output.h"
|
|
#include "ompi/mca/pml/pml.h"
|
|
#include "ompi/mca/btl/btl.h"
|
|
|
|
#include "opal/mca/base/mca_base_param.h"
|
|
#include "mca/errmgr/errmgr.h"
|
|
#include "mca/mpool/base/base.h"
|
|
#include "btl_udapl.h"
|
|
#include "btl_udapl_frag.h"
|
|
#include "btl_udapl_endpoint.h"
|
|
#include "ompi/mca/btl/base/base.h"
|
|
#include "ompi/mca/btl/base/btl_base_error.h"
|
|
#include "ompi/datatype/convertor.h"
|
|
#include "btl_udapl_endpoint.h"
|
|
#include "orte/util/proc_info.h"
|
|
#include "ompi/mca/pml/base/pml_base_module_exchange.h"
|
|
|
|
mca_btl_udapl_component_t mca_btl_udapl_component = {
|
|
{
|
|
/* First, the mca_base_component_t struct containing meta information
|
|
about the component itself */
|
|
|
|
{
|
|
/* Indicate that we are a pml v1.0.0 component (which also implies a
|
|
specific MCA version) */
|
|
|
|
MCA_BTL_BASE_VERSION_1_0_0,
|
|
|
|
"udapl", /* MCA component name */
|
|
OMPI_MAJOR_VERSION, /* MCA component major version */
|
|
OMPI_MINOR_VERSION, /* MCA component minor version */
|
|
OMPI_RELEASE_VERSION, /* MCA component release version */
|
|
mca_btl_udapl_component_open, /* component open */
|
|
mca_btl_udapl_component_close /* component close */
|
|
},
|
|
|
|
/* Next the MCA v1.0.0 component meta data */
|
|
|
|
{
|
|
/* Whether the component is checkpointable or not */
|
|
|
|
false
|
|
},
|
|
|
|
mca_btl_udapl_component_init,
|
|
mca_btl_udapl_component_progress,
|
|
}
|
|
};
|
|
|
|
|
|
/*
|
|
* utility routines for parameter registration
|
|
*/
|
|
|
|
static inline char* mca_btl_udapl_param_register_string(
|
|
const char* param_name,
|
|
const char* default_value)
|
|
{
|
|
char *param_value;
|
|
int id = mca_base_param_register_string("btl","udapl",param_name,NULL,default_value);
|
|
mca_base_param_lookup_string(id, ¶m_value);
|
|
return param_value;
|
|
}
|
|
|
|
static inline int mca_btl_udapl_param_register_int(
|
|
const char* param_name,
|
|
int default_value)
|
|
{
|
|
int id = mca_base_param_register_int("btl","udapl",param_name,NULL,default_value);
|
|
int param_value = default_value;
|
|
mca_base_param_lookup_int(id,¶m_value);
|
|
return param_value;
|
|
}
|
|
|
|
/*
|
|
* Called by MCA framework to open the component, registers
|
|
* component parameters.
|
|
*/
|
|
|
|
int mca_btl_udapl_component_open(void)
|
|
{
|
|
int param, value;
|
|
|
|
opal_output(0, "udapl_component_open\n");
|
|
|
|
/* initialize state */
|
|
mca_btl_udapl_component.udapl_num_btls=0;
|
|
mca_btl_udapl_component.udapl_btls=NULL;
|
|
|
|
/* initialize objects */
|
|
OBJ_CONSTRUCT(&mca_btl_udapl_component.udapl_procs, opal_list_t);
|
|
OBJ_CONSTRUCT(&mca_btl_udapl_component.udapl_lock, opal_mutex_t);
|
|
|
|
/* register uDAPL component parameters */
|
|
mca_btl_udapl_component.udapl_free_list_num =
|
|
mca_btl_udapl_param_register_int ("free_list_num", 8);
|
|
mca_btl_udapl_component.udapl_free_list_max =
|
|
mca_btl_udapl_param_register_int ("free_list_max", -1);
|
|
mca_btl_udapl_component.udapl_free_list_inc =
|
|
mca_btl_udapl_param_register_int ("free_list_inc", 8);
|
|
mca_btl_udapl_component.udapl_debug =
|
|
mca_btl_udapl_param_register_int("debug", 1);
|
|
mca_btl_udapl_component.udapl_mpool_name =
|
|
mca_btl_udapl_param_register_string("mpool", "udapl");
|
|
mca_btl_udapl_component.udapl_max_btls =
|
|
mca_btl_udapl_param_register_int("max_modules", 4);
|
|
mca_btl_udapl_component.udapl_evd_qlen =
|
|
mca_btl_udapl_param_register_int("evd_qlen", 8);
|
|
mca_btl_udapl_component.udapl_num_high_priority =
|
|
mca_btl_udapl_param_register_int("num_high_priority", 8);
|
|
mca_btl_udapl_component.udapl_num_repost =
|
|
mca_btl_udapl_param_register_int("num_repost", 4);
|
|
mca_btl_udapl_component.udapl_num_mru =
|
|
mca_btl_udapl_param_register_int("num_mru", 64);
|
|
mca_btl_udapl_component.udapl_port_name=
|
|
mca_btl_udapl_param_register_string("port_name", "OMPI");
|
|
|
|
/* register uDAPL module parameters */
|
|
mca_btl_udapl_module.super.btl_exclusivity =
|
|
mca_btl_udapl_param_register_int ("exclusivity", MCA_BTL_EXCLUSIVITY_DEFAULT - 10);
|
|
mca_btl_udapl_module.super.btl_eager_limit =
|
|
mca_btl_udapl_param_register_int ("eager_limit", 32*1024);
|
|
mca_btl_udapl_module.super.btl_min_send_size =
|
|
mca_btl_udapl_param_register_int ("min_send_size", 32*1024);
|
|
mca_btl_udapl_module.super.btl_max_send_size =
|
|
mca_btl_udapl_param_register_int ("max_send_size", 64*1024);
|
|
mca_btl_udapl_module.super.btl_min_rdma_size =
|
|
mca_btl_udapl_param_register_int("min_rdma_size", 512*1024);
|
|
mca_btl_udapl_module.super.btl_max_rdma_size =
|
|
mca_btl_udapl_param_register_int("max_rdma_size", 128*1024);
|
|
mca_btl_udapl_module.super.btl_bandwidth =
|
|
mca_btl_udapl_param_register_int("bandwidth", 225);
|
|
|
|
/* compute the eager frag size */
|
|
#if 0
|
|
mca_btl_udapl_component.udapl_eager_frag_size =
|
|
udapl_min_size_for_length(mca_btl_udapl_module.super.btl_eager_limit) - 1;
|
|
mca_btl_udapl_module.super.btl_eager_limit =
|
|
udapl_max_length_for_size(mca_btl_udapl_component.udapl_eager_frag_size) -
|
|
sizeof(mca_btl_base_header_t);
|
|
#endif
|
|
|
|
/* compute the max frag size */
|
|
#if 0
|
|
mca_btl_udapl_component.udapl_max_frag_size =
|
|
udapl_min_size_for_length(mca_btl_udapl_module.super.btl_max_send_size) - 1;
|
|
mca_btl_udapl_module.super.btl_max_send_size =
|
|
udapl_max_length_for_size(mca_btl_udapl_component.udapl_max_frag_size) -
|
|
sizeof(mca_btl_base_header_t);
|
|
#endif
|
|
|
|
/* leave pinned option */
|
|
value = 0;
|
|
param = mca_base_param_find("mpi", NULL, "leave_pinned");
|
|
mca_base_param_lookup_int(param, &value);
|
|
mca_btl_udapl_component.leave_pinned = value;
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
|
|
/*
|
|
* component cleanup - sanity checking of queue lengths
|
|
*/
|
|
|
|
int mca_btl_udapl_component_close(void)
|
|
{
|
|
opal_output(0, "udapl_component_close\n");
|
|
|
|
/* TODO - what needs to be done here? */
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
|
|
/*
|
|
* Register uDAPL component addressing information. The MCA framework
|
|
* will make this available to all peers.
|
|
*/
|
|
|
|
static int
|
|
mca_btl_udapl_modex_send(void)
|
|
{
|
|
int rc;
|
|
size_t i;
|
|
size_t size;
|
|
mca_btl_udapl_addr_t *addrs = NULL;
|
|
|
|
opal_output(0, "udapl_modex_send\n");
|
|
|
|
size = mca_btl_udapl_component.udapl_num_btls * sizeof (mca_btl_udapl_addr_t);
|
|
if (0 != size) {
|
|
addrs = (mca_btl_udapl_addr_t *)malloc (size);
|
|
if (NULL == addrs) {
|
|
return OMPI_ERR_OUT_OF_RESOURCE;
|
|
}
|
|
|
|
for (i = 0; i < mca_btl_udapl_component.udapl_num_btls; i++) {
|
|
mca_btl_udapl_module_t *btl = mca_btl_udapl_component.udapl_btls[i];
|
|
addrs[i] = btl->udapl_addr;
|
|
}
|
|
}
|
|
rc = mca_pml_base_modex_send (&mca_btl_udapl_component.super.btl_version, addrs, size);
|
|
if (NULL != addrs) {
|
|
free (addrs);
|
|
}
|
|
return rc;
|
|
}
|
|
|
|
|
|
/*
|
|
* Initialize the uDAPL component,
|
|
* check how many interfaces are available and create a btl module for each.
|
|
*/
|
|
|
|
mca_btl_base_module_t **
|
|
mca_btl_udapl_component_init (int *num_btl_modules,
|
|
bool enable_progress_threads,
|
|
bool enable_mpi_threads)
|
|
{
|
|
DAT_PROVIDER_INFO* datinfo;
|
|
mca_btl_base_module_t **btls;
|
|
mca_btl_udapl_module_t *btl;
|
|
size_t i;
|
|
|
|
opal_output(0, "udapl_component_init\n");
|
|
|
|
/* enumerate uDAPL interfaces */
|
|
datinfo = malloc(mca_btl_udapl_component.udapl_max_btls * sizeof(DAT_PROVIDER_INFO));
|
|
if(NULL == datinfo) {
|
|
return NULL;
|
|
}
|
|
if(DAT_SUCCESS != dat_registry_list_providers(mca_btl_udapl_component.udapl_max_btls,
|
|
(DAT_COUNT*)&mca_btl_udapl_component.udapl_num_btls, &datinfo)) {
|
|
free(datinfo);
|
|
return NULL;
|
|
}
|
|
|
|
/* Make sure we have some interfaces */
|
|
if(0 == mca_btl_udapl_component.udapl_num_btls) {
|
|
mca_btl_base_error_no_nics("uDAPL", "NIC");
|
|
free(datinfo);
|
|
return NULL;
|
|
}
|
|
|
|
/* create a BTL module for each interface */
|
|
mca_btl_udapl_component.udapl_btls =
|
|
malloc(mca_btl_udapl_component.udapl_num_btls *
|
|
sizeof(mca_btl_udapl_module_t *));
|
|
if(NULL == mca_btl_udapl_component.udapl_btls) {
|
|
free(datinfo);
|
|
return NULL;
|
|
}
|
|
|
|
for(i = 0; i < mca_btl_udapl_component.udapl_num_btls; i++) {
|
|
opal_output(0, "udapl creating btl for %s\n", datinfo[i].ia_name);
|
|
|
|
btl = malloc(sizeof(mca_btl_udapl_module_t));
|
|
if(NULL == btl) {
|
|
free(datinfo);
|
|
free(mca_btl_udapl_component.udapl_btls);
|
|
return NULL;
|
|
}
|
|
|
|
/* copy default values into the new BTL */
|
|
memcpy(btl, &mca_btl_udapl_module, sizeof(mca_btl_udapl_module_t));
|
|
|
|
if(OMPI_SUCCESS != mca_btl_udapl_init(datinfo[i].ia_name, btl)) {
|
|
opal_output(0, "udapl module init for %s failed\n",
|
|
datinfo[i].ia_name);
|
|
/*TODO - how do i correctly handle an error here? */
|
|
free(btl);
|
|
}
|
|
|
|
/* successful btl creation */
|
|
mca_btl_udapl_component.udapl_btls[i] = btl;
|
|
}
|
|
|
|
/* finished with datinfo */
|
|
free(datinfo);
|
|
|
|
/* publish uDAPL parameters with the MCA framework */
|
|
if (OMPI_SUCCESS != mca_btl_udapl_modex_send()) {
|
|
return NULL;
|
|
}
|
|
|
|
/* return array of BTLs */
|
|
btls = (mca_btl_base_module_t**) malloc (
|
|
mca_btl_udapl_component.udapl_num_btls * sizeof(mca_btl_base_module_t *));
|
|
if (NULL == btls) {
|
|
return NULL;
|
|
}
|
|
|
|
memcpy(btls, mca_btl_udapl_component.udapl_btls,
|
|
mca_btl_udapl_component.udapl_num_btls * sizeof(mca_btl_udapl_module_t *));
|
|
*num_btl_modules = mca_btl_udapl_component.udapl_num_btls;
|
|
return btls;
|
|
}
|
|
|
|
|
|
/*
|
|
* uDAPL component progress.
|
|
*/
|
|
|
|
|
|
int mca_btl_udapl_component_progress()
|
|
{
|
|
static int32_t inprogress = 0;
|
|
int count = 0;
|
|
size_t i;
|
|
|
|
opal_output(0, "udapl_component_progress\n");
|
|
|
|
/* could get into deadlock in this case as we post recvs after callback completes */
|
|
if(OPAL_THREAD_ADD32(&inprogress, 1) > 1) {
|
|
OPAL_THREAD_ADD32(&inprogress, -1);
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
for( i = 0; i < mca_btl_udapl_component.udapl_num_btls; ) {
|
|
|
|
}
|
|
OPAL_THREAD_ADD32(&inprogress, -1);
|
|
return count;
|
|
}
|
|
|