1
1
openmpi/ompi/mca/mpool/openib/mpool_openib_module.c
Gleb Natapov 91f48f9a79 Merge with gleb-pml branch. Add out of resource handling support to PML layer.
If resource is not available request is added to one of the pending list and retried later.

This commit was SVN r10900.
2006-07-20 14:44:35 +00:00

249 строки
7.6 KiB
C

/*
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
* University Research and Technology
* Corporation. All rights reserved.
* Copyright (c) 2004-2005 The University of Tennessee and The University
* of Tennessee Research Foundation. All rights
* reserved.
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2005 The Regents of the University of California.
* All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "ompi_config.h"
#include <string.h>
#include "opal/util/output.h"
#include "ompi/mca/mpool/openib/mpool_openib.h"
#include <infiniband/verbs.h>
#include <errno.h>
#include <string.h>
#include "ompi/mca/rcache/rcache.h"
#include "ompi/mca/rcache/base/base.h"
#include "ompi/mca/mpool/base/base.h"
extern uint32_t mca_mpool_base_page_size;
extern uint32_t mca_mpool_base_page_size_log;
/*
 * Prepare an openib mpool module for use.
 *
 * Fills in the base-module function table with the openib implementations,
 * creates the registration cache named by the component's rcache_name, and
 * builds the free list from which registration descriptors are drawn.
 */
void mca_mpool_openib_module_init(mca_mpool_openib_module_t* mpool)
{
    mca_mpool_base_module_t *base = &mpool->super;

    base->mpool_component = &mca_mpool_openib_component.super;
    base->mpool_base = NULL;        /* this mpool has no base address */
    base->mpool_finalize = NULL;    /* no finalize hook is installed */

    /* allocation entry points */
    base->mpool_alloc = mca_mpool_openib_alloc;
    base->mpool_realloc = mca_mpool_openib_realloc;
    base->mpool_free = mca_mpool_openib_free;

    /* registration entry points */
    base->mpool_register = mca_mpool_openib_register;
    base->mpool_deregister = mca_mpool_openib_deregister;
    base->mpool_find = mca_mpool_openib_find;
    base->mpool_retain = mca_mpool_openib_retain;
    base->mpool_release = mca_mpool_openib_release;

    base->rcache =
        mca_rcache_base_module_create(mca_mpool_openib_component.rcache_name);
    base->flags = MCA_MPOOL_FLAGS_MPI_ALLOC_MEM;

    /* NOTE(review): the trailing arguments (0, -1, 32, NULL) presumably mean
     * "start empty, no upper bound, grow 32 at a time, no backing mpool" --
     * confirm against ompi_free_list_init(). */
    OBJ_CONSTRUCT(&mpool->reg_list, ompi_free_list_t);
    ompi_free_list_init(&mpool->reg_list,
                        sizeof(mca_mpool_openib_registration_t),
                        OBJ_CLASS(mca_mpool_openib_registration_t),
                        0, -1, 32, NULL);
}
/**
 * Allocate a buffer aligned to mca_mpool_base_page_size and register it
 * through the module's mpool_register hook.
 *
 * @param mpool         module whose mpool_register hook is invoked
 * @param size          number of bytes to allocate
 * @param align         not consulted; alignment is always the mpool page size
 * @param flags         forwarded unchanged to mpool_register
 * @param registration  [out] set by mpool_register; on success its
 *                      alloc_base records the pointer to hand to free()
 *
 * @return the allocated buffer, or NULL when either the allocation or the
 *         registration fails (the buffer is released in the latter case)
 */
void* mca_mpool_openib_alloc(
    mca_mpool_base_module_t* mpool,
    size_t size,
    size_t align,
    uint32_t flags,
    mca_mpool_base_registration_t** registration)
{
    void* addr_malloc = (void*)memalign(mca_mpool_base_page_size, size);

    /* Out of memory: do not try to register a NULL buffer. */
    if(NULL == addr_malloc) {
        return NULL;
    }

    if(OMPI_SUCCESS != mpool->mpool_register(mpool, addr_malloc, size, flags, registration)) {
        free(addr_malloc);
        return NULL;
    }

    /* Remember the raw allocation so the free path can release it. */
    (*registration)->alloc_base = addr_malloc;
    return addr_malloc;
}
/*
 * Register a memory region with the module's protection domain.
 *
 * A registration descriptor is taken from the module's free list, the
 * requested range is widened to page boundaries (base rounded down, bound
 * rounded up to the last byte of its page), and the widened range is
 * registered with ibv_reg_mr() for local write, remote write and remote
 * read access.  When flags contains MCA_MPOOL_FLAGS_CACHE or
 * MCA_MPOOL_FLAGS_PERSIST the registration is also inserted into the
 * module's rcache.  One reference is taken on the registration before
 * returning.
 *
 * mpool         module performing the registration
 * addr          start of the region to register
 * size          length of the region in bytes
 * flags         MCA_MPOOL_FLAGS_* bits, stored in the registration
 * registration  [out] receives the new registration on success only; it is
 *               left untouched on failure
 *
 * Returns OMPI_SUCCESS, the error reported by OMPI_FREE_LIST_GET when no
 * descriptor is available, or OMPI_ERROR when ibv_reg_mr() fails.
 */
int mca_mpool_openib_register(mca_mpool_base_module_t* mpool,
                              void *addr,
                              size_t size,
                              uint32_t flags,
                              mca_mpool_base_registration_t** registration)
{
    mca_mpool_openib_module_t * mpool_module = (mca_mpool_openib_module_t*) mpool;
    mca_mpool_openib_registration_t * vapi_reg;
    ompi_free_list_item_t *item;
    int rc;

    OMPI_FREE_LIST_GET(&mpool_module->reg_list, item, rc);
    if(OMPI_SUCCESS != rc) {
        return rc;
    }
    vapi_reg = (mca_mpool_openib_registration_t*) item;

    vapi_reg->base_reg.mpool = mpool;
    vapi_reg->base_reg.base = down_align_addr(addr, mca_mpool_base_page_size_log);
    vapi_reg->base_reg.bound = up_align_addr((void*) ((char*) addr + size - 1),
                                             mca_mpool_base_page_size_log);
    /* bound is inclusive, hence the +1 when computing the pinned length */
    size = vapi_reg->base_reg.bound - vapi_reg->base_reg.base + 1;

    vapi_reg->mr = ibv_reg_mr(
        mpool_module->resources.ib_pd,
        vapi_reg->base_reg.base,
        size,
        IBV_ACCESS_LOCAL_WRITE | IBV_ACCESS_REMOTE_WRITE | IBV_ACCESS_REMOTE_READ);
    if(NULL == vapi_reg->mr) {
        /* Hand the descriptor back so a failed registration does not leak
         * a free-list item; the caller's pointer is not published. */
        OMPI_FREE_LIST_RETURN(&mpool_module->reg_list, item);
        return OMPI_ERROR;
    }

    /* Publish the registration only once the memory is actually pinned. */
    *registration = &vapi_reg->base_reg;

    /* NOTE(review): the result of rcache_insert is not examined here. */
    if(flags & (MCA_MPOOL_FLAGS_CACHE | MCA_MPOOL_FLAGS_PERSIST)) {
        mpool->rcache->rcache_insert(mpool->rcache,
                                     &vapi_reg->base_reg,
                                     flags);
    }
    vapi_reg->base_reg.flags = flags;

    mca_mpool_openib_retain(mpool, &vapi_reg->base_reg);
    return OMPI_SUCCESS;
}
/*
 * Deregister memory.
 *
 * A registration flagged MCA_MPOOL_FLAGS_CACHE or MCA_MPOOL_FLAGS_PERSIST
 * is first removed from the module's rcache and has its flags cleared.
 * In every case one reference is then dropped via
 * mca_mpool_openib_release(), whose result is returned.
 */
int mca_mpool_openib_deregister(mca_mpool_base_module_t* mpool,
                                mca_mpool_base_registration_t* registration)
{
    const int in_rcache =
        (registration->flags & (MCA_MPOOL_FLAGS_CACHE | MCA_MPOOL_FLAGS_PERSIST)) ? 1 : 0;

    if(in_rcache) {
        mpool->rcache->rcache_delete(mpool->rcache, registration, registration->flags);
        registration->flags = 0;
    }

    return mca_mpool_openib_release(mpool, registration);
}
/**
 * Reallocate a registered buffer.
 *
 * A new buffer of the requested size is obtained through the module's
 * mpool_alloc hook (alignment 0, flags 0), the old contents are copied
 * across, and the old buffer is released through mpool_free.
 *
 * @param mpool         module providing the mpool_alloc / mpool_free hooks
 * @param addr          buffer currently described by *registration
 * @param size          requested size of the new buffer in bytes
 * @param registration  [in,out] on entry the registration of addr; on
 *                      success the registration of the returned buffer
 *
 * @return the new buffer, or NULL if it could not be allocated; in that
 *         case addr and its registration remain valid and *registration
 *         is restored to the old registration
 */
void* mca_mpool_openib_realloc(
    mca_mpool_base_module_t* mpool,
    void* addr,
    size_t size,
    mca_mpool_base_registration_t** registration)
{
    mca_mpool_base_registration_t* old_reg = *registration;
    size_t copy_len;
    void* new_mem = mpool->mpool_alloc(mpool, size, 0, 0, registration);

    if(NULL == new_mem) {
        /* Keep the caller's view consistent: the old block is still live. */
        *registration = old_reg;
        return NULL;
    }

    /* bound is the last registered byte (inclusive), so the registered
     * span is bound - base + 1.  Never copy more than the new buffer can
     * hold, otherwise shrinking would write past its end.
     * NOTE(review): the span is page-rounded and may exceed the size that
     * was originally requested for addr; the original size is not recorded
     * in the registration, so it cannot be used here. */
    copy_len = (size_t)(old_reg->bound - old_reg->base) + 1;
    if(copy_len > size) {
        copy_len = size;
    }
    memcpy(new_mem, addr, copy_len);

    mpool->mpool_free(mpool, addr, old_reg);
    return new_mem;
}
/**
 * Deregister a buffer and release its memory.
 *
 * @param mpool         module whose mpool_deregister hook is invoked
 * @param addr          not consulted; the pointer released is the
 *                      alloc_base recorded in the registration
 * @param registration  registration describing the buffer
 */
void mca_mpool_openib_free(mca_mpool_base_module_t* mpool, void * addr,
                           mca_mpool_base_registration_t* registration)
{
    /* Deregistering may drop the last reference and hand the descriptor
     * back to the free list, so read alloc_base before that happens. */
    void* alloc_base = registration->alloc_base;

    mpool->mpool_deregister(mpool, registration);
    free(alloc_base);
}
/*
 * Look up registrations for [addr, addr + size) by delegating to the
 * module's rcache; regs and cnt are passed straight through to
 * rcache_find and its return code is returned unchanged.
 */
int mca_mpool_openib_find(
    struct mca_mpool_base_module_t* mpool,
    void* addr,
    size_t size,
    ompi_pointer_array_t *regs,
    uint32_t *cnt
    )
{
    int rc;

    rc = mpool->rcache->rcache_find(mpool->rcache, addr, size, regs, cnt);
    return rc;
}
/*
 * Drop one reference on a registration.
 *
 * While references remain nothing else happens.  When the count reaches
 * zero (or below) the memory region is deregistered with ibv_dereg_mr()
 * and the descriptor is returned to the module's free list.
 *
 * Returns OMPI_SUCCESS, or OMPI_ERROR if ibv_dereg_mr() reports a failure
 * (the descriptor is not returned to the free list in that case).
 */
int mca_mpool_openib_release(
    struct mca_mpool_base_module_t* mpool,
    mca_mpool_base_registration_t* registration
    )
{
    mca_mpool_openib_module_t* owner;
    mca_mpool_openib_registration_t* reg;

    /* Still referenced elsewhere: nothing to tear down. */
    if(0 < OPAL_THREAD_ADD32(&registration->ref_count, -1)) {
        return OMPI_SUCCESS;
    }

    owner = (mca_mpool_openib_module_t*) mpool;
    reg = (mca_mpool_openib_registration_t*) registration;

    if(0 != ibv_dereg_mr(reg->mr)) {
        opal_output(0, "%s: error unpinning openib memory errno says %s\n", __func__, strerror(errno));
        return OMPI_ERROR;
    }

    OMPI_FREE_LIST_RETURN(&owner->reg_list, (ompi_free_list_item_t*) reg);
    return OMPI_SUCCESS;
}
/*
 * Take one additional reference on a registration by incrementing its
 * ref_count through OPAL_THREAD_ADD32.  The mpool argument is not used.
 * Always returns OMPI_SUCCESS.
 */
int mca_mpool_openib_retain(struct mca_mpool_base_module_t* mpool,
                            mca_mpool_base_registration_t* registration
                            )
{
    OPAL_THREAD_ADD32(&(registration->ref_count), 1);

    return OMPI_SUCCESS;
}