275 строки
10 KiB
C
275 строки
10 KiB
C
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
|
/*
|
|
* Copyright (c) 2004-2007 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2009 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2007-2010 Cisco Systems, Inc. All rights reserved.
|
|
* Copyright (c) 2010 Oracle and/or its affiliates. All rights reserved.
|
|
* Copyright (c) 2014 Research Organization for Information Science
|
|
* and Technology (RIST). All rights reserved.
|
|
* Copyright (c) 2015 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "ompi_config.h"
|
|
#include "opal/mca/event/event.h"
|
|
#include "mpi.h"
|
|
#include "ompi/runtime/params.h"
|
|
#include "ompi/mca/pml/pml.h"
|
|
#include "ompi/mca/pml/base/pml_base_bsend.h"
|
|
#include "pml_bfo.h"
|
|
#include "pml_bfo_hdr.h"
|
|
#include "pml_bfo_sendreq.h"
|
|
#include "pml_bfo_recvreq.h"
|
|
#include "pml_bfo_rdmafrag.h"
|
|
#include "pml_bfo_recvfrag.h"
|
|
#include "ompi/mca/bml/base/base.h"
|
|
#include "pml_bfo_component.h"
|
|
#include "opal/mca/allocator/base/base.h"
|
|
#include "opal/runtime/opal_params.h"
|
|
|
|
OBJ_CLASS_INSTANCE( mca_pml_bfo_pckt_pending_t,
|
|
ompi_free_list_item_t,
|
|
NULL,
|
|
NULL );
|
|
|
|
static int mca_pml_bfo_component_register(void);
|
|
static int mca_pml_bfo_component_open(void);
|
|
static int mca_pml_bfo_component_close(void);
|
|
static mca_pml_base_module_t*
|
|
mca_pml_bfo_component_init( int* priority, bool enable_progress_threads,
|
|
bool enable_mpi_threads );
|
|
static int mca_pml_bfo_component_fini(void);
|
|
int mca_pml_bfo_output = 0;
|
|
static int mca_pml_bfo_verbose = 0;
|
|
|
|
mca_pml_base_component_2_0_0_t mca_pml_bfo_component = {
|
|
|
|
/* First, the mca_base_component_t struct containing meta
|
|
information about the component itself */
|
|
|
|
.pmlm_version = {
|
|
MCA_PML_BASE_VERSION_2_0_0,
|
|
|
|
.mca_component_name = "bfo",
|
|
MCA_BASE_MAKE_VERSION(component, OMPI_MAJOR_VERSION, OMPI_MINOR_VERSION,
|
|
OMPI_RELEASE_VERSION),
|
|
.mca_open_component = mca_pml_bfo_component_open,
|
|
.mca_close_component = mca_pml_bfo_component_close,
|
|
.mca_register_component_params = mca_pml_bfo_component_register,
|
|
},
|
|
.pmlm_data = {
|
|
/* The component is checkpoint ready */
|
|
MCA_BASE_METADATA_PARAM_CHECKPOINT
|
|
},
|
|
|
|
.pmlm_init = mca_pml_bfo_component_init,
|
|
.pmlm_finalize = mca_pml_bfo_component_fini,
|
|
};
|
|
|
|
void *mca_pml_bfo_seg_alloc( struct mca_mpool_base_module_t* mpool,
|
|
size_t* size,
|
|
mca_mpool_base_registration_t** registration);
|
|
|
|
void mca_pml_bfo_seg_free( struct mca_mpool_base_module_t* mpool,
|
|
void* segment );
|
|
|
|
static inline int mca_pml_bfo_param_register_int(
|
|
const char* param_name,
|
|
int default_value,
|
|
int *storage)
|
|
{
|
|
*storage = default_value;
|
|
(void) mca_base_component_var_register(&mca_pml_bfo_component.pmlm_version, param_name,
|
|
NULL, MCA_BASE_VAR_TYPE_INT, NULL, 0, 0,
|
|
OPAL_INFO_LVL_9,
|
|
MCA_BASE_VAR_SCOPE_READONLY, storage);
|
|
|
|
return *storage;
|
|
}
|
|
|
|
static inline unsigned int mca_pml_bfo_param_register_uint(
|
|
const char* param_name,
|
|
unsigned int default_value,
|
|
unsigned int *storage)
|
|
{
|
|
*storage = default_value;
|
|
(void) mca_base_component_var_register(&mca_pml_bfo_component.pmlm_version, param_name,
|
|
NULL, MCA_BASE_VAR_TYPE_UNSIGNED_INT, NULL, 0, 0,
|
|
OPAL_INFO_LVL_9,
|
|
MCA_BASE_VAR_SCOPE_READONLY, storage);
|
|
|
|
return *storage;
|
|
}
|
|
|
|
static int mca_pml_bfo_component_register(void)
|
|
{
|
|
int default_priority;
|
|
|
|
#if PML_BFO
|
|
default_priority = 5;
|
|
#else /* PML_BFO */
|
|
default_priority = 20;
|
|
mca_pml_bfo_param_register_int("priority", 20);
|
|
#endif /* PML_BFO */
|
|
|
|
(void) mca_pml_bfo_param_register_int("verbose", 0, &mca_pml_bfo_verbose);
|
|
(void) mca_pml_bfo_param_register_int("free_list_num", 4, &mca_pml_bfo.free_list_num);
|
|
(void) mca_pml_bfo_param_register_int("free_list_max", -1, &mca_pml_bfo.free_list_max);
|
|
(void) mca_pml_bfo_param_register_int("free_list_inc", 64, &mca_pml_bfo.free_list_inc);
|
|
(void) mca_pml_bfo_param_register_int("priority", default_priority, &mca_pml_bfo.priority);
|
|
(void) mca_pml_bfo_param_register_uint("send_pipeline_depth", 3, &mca_pml_bfo.send_pipeline_depth);
|
|
(void) mca_pml_bfo_param_register_uint("recv_pipeline_depth", 4, &mca_pml_bfo.recv_pipeline_depth);
|
|
(void) mca_pml_bfo_param_register_uint("rdma_put_retries_limit", 5, &mca_pml_bfo.rdma_put_retries_limit);
|
|
(void) mca_pml_bfo_param_register_int("max_rdma_per_request", 4, &mca_pml_bfo.max_rdma_per_request);
|
|
(void) mca_pml_bfo_param_register_int("max_send_per_range", 4, &mca_pml_bfo.max_send_per_range);
|
|
(void) mca_pml_bfo_param_register_uint("unexpected_limit", 128, &mca_pml_bfo.unexpected_limit);
|
|
|
|
mca_pml_bfo.allocator_name = "bucket";
|
|
(void) mca_base_component_var_register(&mca_pml_bfo_component.pmlm_version,
|
|
"allocator",
|
|
"Name of allocator component for unexpected messages",
|
|
MCA_BASE_VAR_TYPE_STRING, NULL, 0, 0,
|
|
OPAL_INFO_LVL_9,
|
|
MCA_BASE_VAR_SCOPE_READONLY,
|
|
&mca_pml_bfo.allocator_name);
|
|
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
static int mca_pml_bfo_component_open(void)
|
|
{
|
|
mca_pml_bfo_output = opal_output_open(NULL);
|
|
opal_output_set_verbosity(mca_pml_bfo_output, mca_pml_bfo_verbose);
|
|
|
|
mca_pml_bfo.enabled = false;
|
|
return mca_base_framework_open(&ompi_bml_base_framework, 0);
|
|
}
|
|
|
|
|
|
static int mca_pml_bfo_component_close(void)
|
|
{
|
|
int rc;
|
|
|
|
if (OMPI_SUCCESS != (rc = mca_base_framework_close(&ompi_bml_base_framework))) {
|
|
return rc;
|
|
}
|
|
opal_output_close(mca_pml_bfo_output);
|
|
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
|
|
static mca_pml_base_module_t*
|
|
mca_pml_bfo_component_init( int* priority,
|
|
bool enable_progress_threads,
|
|
bool enable_mpi_threads )
|
|
{
|
|
mca_allocator_base_component_t* allocator_component;
|
|
|
|
opal_output_verbose( 10, mca_pml_bfo_output,
|
|
"in bfo, my priority is %d\n", mca_pml_bfo.priority);
|
|
|
|
if((*priority) > mca_pml_bfo.priority) {
|
|
*priority = mca_pml_bfo.priority;
|
|
return NULL;
|
|
}
|
|
*priority = mca_pml_bfo.priority;
|
|
|
|
allocator_component = mca_allocator_component_lookup( mca_pml_bfo.allocator_name );
|
|
if(NULL == allocator_component) {
|
|
opal_output(0, "mca_pml_bfo_component_init: can't find allocator: %s\n", mca_pml_bfo.allocator_name);
|
|
return NULL;
|
|
}
|
|
|
|
mca_pml_bfo.allocator = allocator_component->allocator_init(true,
|
|
mca_pml_bfo_seg_alloc,
|
|
mca_pml_bfo_seg_free, NULL);
|
|
if(NULL == mca_pml_bfo.allocator) {
|
|
opal_output(0, "mca_pml_bfo_component_init: unable to initialize allocator\n");
|
|
return NULL;
|
|
}
|
|
|
|
|
|
if(OMPI_SUCCESS != mca_bml_base_init( enable_progress_threads,
|
|
enable_mpi_threads)) {
|
|
return NULL;
|
|
}
|
|
|
|
/* Set this here (vs in component_open()) because
|
|
opal_leave_pinned* may have been set after MCA params were
|
|
read (e.g., by the openib btl) */
|
|
mca_pml_bfo.leave_pinned = (1 == opal_leave_pinned);
|
|
mca_pml_bfo.leave_pinned_pipeline = (int) opal_leave_pinned_pipeline;
|
|
|
|
return &mca_pml_bfo.super;
|
|
}
|
|
|
|
int mca_pml_bfo_component_fini(void)
|
|
{
|
|
int rc;
|
|
|
|
/* Shutdown BML */
|
|
if(OMPI_SUCCESS != (rc = mca_bml.bml_finalize()))
|
|
return rc;
|
|
|
|
if(!mca_pml_bfo.enabled)
|
|
return OMPI_SUCCESS; /* never selected.. return success.. */
|
|
mca_pml_bfo.enabled = false; /* not anymore */
|
|
|
|
OBJ_DESTRUCT(&mca_pml_bfo.rdma_pending);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.pckt_pending);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.recv_pending);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.send_pending);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.non_existing_communicator_pending);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.buffers);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.pending_pckts);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.recv_frags);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.rdma_frags);
|
|
OBJ_DESTRUCT(&mca_pml_bfo.lock);
|
|
|
|
if(OMPI_SUCCESS != (rc = mca_pml_bfo.allocator->alc_finalize(mca_pml_bfo.allocator))) {
|
|
return rc;
|
|
}
|
|
|
|
#if 0
|
|
if (mca_pml_base_send_requests.fl_num_allocated !=
|
|
mca_pml_base_send_requests.super.opal_list_length) {
|
|
opal_output(0, "bfo send requests: %d allocated %d returned\n",
|
|
mca_pml_base_send_requests.fl_num_allocated,
|
|
mca_pml_base_send_requests.super.opal_list_length);
|
|
}
|
|
if (mca_pml_base_recv_requests.fl_num_allocated !=
|
|
mca_pml_base_recv_requests.super.opal_list_length) {
|
|
opal_output(0, "bfo recv requests: %d allocated %d returned\n",
|
|
mca_pml_base_recv_requests.fl_num_allocated,
|
|
mca_pml_base_recv_requests.super.opal_list_length);
|
|
}
|
|
#endif
|
|
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|
|
void *mca_pml_bfo_seg_alloc( struct mca_mpool_base_module_t* mpool,
|
|
size_t* size,
|
|
mca_mpool_base_registration_t** registration) {
|
|
return malloc(*size);
|
|
}
|
|
|
|
/**
 * Segment release callback: hands the segment back to free().
 *
 * @param mpool    not used by this implementation
 * @param segment  pointer to release; passed to free() unchanged
 */
void mca_pml_bfo_seg_free( struct mca_mpool_base_module_t* mpool,
                           void* segment )
{
    (void) mpool;

    free(segment);
}
|