1
1
openmpi/ompi/mca/mpool/openib/mpool_openib_module.c
Galen Shipman b8cb6e1c64 modified mpool module to contain flags - used to determine if the mpool will
be used in MPI_Alloc_mem operations. Note that we found an interesting bug in
which if memory was allocated by the sm mpool (via mmap) and then registered
via the mvapi mpool, the registration would fail on certain systems. 

Added the MCA parameter mpool_base_use_mem_hooks; set it to 1 to enable the memory hooks
so that memory is deregistered if the user frees it behind our back. This is
only useful if the MCA parameter mpi_leave_pinned is also set to 1; otherwise all
registrations are deregistered within the MPI library or via
MPI_Free_mem. After testing we should probably make both mpi_leave_pinned and
mpool_base_use_mem_hooks default to 1.

This commit was SVN r7415.
2005-09-16 22:22:03 +00:00

227 строки
6.7 KiB
C

/*
* Copyright (c) 2004-2005 The Trustees of Indiana University.
* All rights reserved.
* Copyright (c) 2004-2005 The Trustees of the University of Tennessee.
* All rights reserved.
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2005 The Regents of the University of California.
* All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "ompi_config.h"
#include <string.h>
#include "opal/util/output.h"
#include "mca/mpool/openib/mpool_openib.h"
#include <infiniband/verbs.h>
#include <errno.h>
#include <string.h>
#include "mca/rcache/rcache.h"
#include "mca/rcache/base/base.h"
/*
 * Fill in the base-module function table and bookkeeping fields of an
 * openib mpool module.
 *
 * Every entry point is pointed at the openib implementation, except
 * mpool_finalize, which is left NULL.  The registration cache is created
 * from the component's configured rcache_name, and the module is flagged
 * with MCA_MPOOL_FLAGS_MPI_ALLOC_MEM.
 *
 * @param mpool  module instance to initialize
 */
void mca_mpool_openib_module_init(mca_mpool_openib_module_t* mpool)
{
    mca_mpool_base_module_t* base = &mpool->super;

    /* identity of the module */
    base->mpool_component = &mca_mpool_openib_component.super;
    base->mpool_base = NULL; /* no base .. */

    /* allocation entry points */
    base->mpool_alloc = mca_mpool_openib_alloc;
    base->mpool_realloc = mca_mpool_openib_realloc;
    base->mpool_free = mca_mpool_openib_free;

    /* registration entry points */
    base->mpool_register = mca_mpool_openib_register;
    base->mpool_deregister = mca_mpool_openib_deregister;
    base->mpool_find = mca_mpool_openib_find;
    base->mpool_retain = mca_mpool_openib_retain;
    base->mpool_release = mca_mpool_openib_release;

    /* no finalize hook is provided */
    base->mpool_finalize = NULL;

    /* NOTE(review): the result of the rcache creation is stored unchecked */
    base->rcache =
        mca_rcache_base_module_create(mca_mpool_openib_component.rcache_name);
    base->flags = MCA_MPOOL_FLAGS_MPI_ALLOC_MEM;
}
/**
 * Allocate a buffer and register it through the module's register callback.
 *
 * The buffer is obtained with memalign(), aligned to
 * mca_mpool_openib_component.page_size.  The caller-supplied `align` and
 * `flags` arguments are currently not used: registration is always
 * requested with flags == 0.
 * NOTE(review): confirm whether `flags` should be forwarded to the
 * register callback.
 *
 * @param mpool         module providing the register callback
 * @param size          number of bytes to allocate and register
 * @param align         requested alignment (ignored)
 * @param flags         registration flags (ignored)
 * @param registration  out: registration describing the new buffer; on
 *                      success its alloc_base is set to the buffer
 *
 * @return the allocated buffer, or NULL if the allocation or the
 *         registration failed (the buffer is freed in the latter case)
 */
void* mca_mpool_openib_alloc(
    mca_mpool_base_module_t* mpool,
    size_t size,
    size_t align,
    uint32_t flags,
    mca_mpool_base_registration_t** registration)
{
    void* addr_malloc = (void*)memalign(mca_mpool_openib_component.page_size, size);

    /* Out of memory: do not hand a NULL buffer to the register callback. */
    if(NULL == addr_malloc) {
        return NULL;
    }

    if(OMPI_SUCCESS != mpool->mpool_register(mpool, addr_malloc, size, 0, registration)) {
        free(addr_malloc);
        return NULL;
    }

    /* Remember the pointer that must eventually be passed to free(). */
    (*registration)->alloc_base = addr_malloc;
    return addr_malloc;
}
/*
 * Register (pin) a memory region with the module's protection domain.
 *
 * A new mca_mpool_openib_registration_t is created, the region is
 * registered with ibv_reg_mr() for local write, remote write and remote
 * read access, and the registration's base/bound are recorded (bound is
 * the address of the last byte of the region).  If `flags` contains
 * MCA_MPOOL_FLAGS_CACHE or MCA_MPOOL_FLAGS_PERSIST the registration is
 * also inserted into the module's rcache.  One reference is taken on the
 * registration before returning.
 *
 * @param mpool         module whose protection domain is used
 * @param addr          start of the region
 * @param size          length of the region in bytes
 * @param flags         MCA_MPOOL_FLAGS_* controlling caching
 * @param registration  out: the new registration on success, NULL on failure
 *
 * @return OMPI_SUCCESS, or OMPI_ERROR if the registration object could not
 *         be created or ibv_reg_mr() failed
 */
int mca_mpool_openib_register(mca_mpool_base_module_t* mpool,
                              void *addr,
                              size_t size,
                              uint32_t flags,
                              mca_mpool_base_registration_t** registration){
    mca_mpool_openib_module_t * mpool_module = (mca_mpool_openib_module_t*) mpool;
    mca_mpool_openib_registration_t * vapi_reg;

    vapi_reg = (mca_mpool_openib_registration_t*) OBJ_NEW(mca_mpool_openib_registration_t);
    if(NULL == vapi_reg) {
        *registration = NULL;
        return OMPI_ERROR;
    }

    vapi_reg->base_reg.mpool = mpool;
    vapi_reg->mr = ibv_reg_mr(
                              mpool_module->resources.ib_pd,
                              addr,
                              size,
                              IBV_ACCESS_LOCAL_WRITE | IBV_ACCESS_REMOTE_WRITE | IBV_ACCESS_REMOTE_READ
                              );

    if(NULL == vapi_reg->mr){
        /* Report first so that errno is not clobbered by the cleanup. */
        opal_output(0, "%s: error registering openib memory of size %lu errno says %s\n", __func__, (unsigned long) size, strerror(errno));
        /* Do not leak the half-built object or expose it to the caller. */
        OBJ_RELEASE(vapi_reg);
        *registration = NULL;
        return OMPI_ERROR;
    }

    vapi_reg->base_reg.base = addr;
    vapi_reg->base_reg.bound = (void*) ((char*) addr + size - 1);

    if(flags & (MCA_MPOOL_FLAGS_CACHE | MCA_MPOOL_FLAGS_PERSIST)) {
        mpool->rcache->rcache_insert(mpool->rcache,
                                     (mca_mpool_base_registration_t*) vapi_reg,
                                     flags);
    }

    vapi_reg->base_reg.flags = flags;
    *registration = (mca_mpool_base_registration_t*) vapi_reg;

    mca_mpool_openib_retain(mpool,
                            (mca_mpool_base_registration_t*) vapi_reg);
    return OMPI_SUCCESS;
}
/*
 * Deregister (unpin) a previously registered memory region.
 *
 * The memory region is released with ibv_dereg_mr().  When that succeeds
 * and the registration carries MCA_MPOOL_FLAGS_CACHE or
 * MCA_MPOOL_FLAGS_PERSIST, the registration is also removed from the
 * module's rcache.
 *
 * @param mpool         module owning the rcache
 * @param registration  registration to tear down
 *
 * @return OMPI_SUCCESS, or OMPI_ERROR if ibv_dereg_mr() reported a failure
 *         (in which case the rcache is left untouched)
 */
int mca_mpool_openib_deregister(mca_mpool_base_module_t* mpool,
                                mca_mpool_base_registration_t* registration){
    mca_mpool_openib_registration_t * openib_reg =
        (mca_mpool_openib_registration_t*) registration;

    if(0 != ibv_dereg_mr(openib_reg->mr)){
        opal_output(0, "%s: error unpinning openib memory errno says %s\n", __func__, strerror(errno));
        return OMPI_ERROR;
    }

    /* Registrations that were never cached have nothing left to undo. */
    if(0 == (registration->flags & (MCA_MPOOL_FLAGS_CACHE | MCA_MPOOL_FLAGS_PERSIST))) {
        return OMPI_SUCCESS;
    }

    mpool->rcache->rcache_delete(mpool->rcache,
                                 registration,
                                 registration->flags);
    return OMPI_SUCCESS;
}
/**
 * Reallocate a registered buffer.
 *
 * A new buffer of `size` bytes is obtained through the module's
 * mpool_alloc callback, the old contents are copied over, and the old
 * buffer is released through mpool_free.
 *
 * The old buffer's length is derived from its registration.  The register
 * path in this file stores `bound` as the address of the LAST byte of the
 * region, so the length is (bound - base + 1).  At most `size` bytes are
 * copied so that shrinking does not overrun the new buffer.
 * NOTE(review): assumes `addr` is the start of the region described by
 * *registration - confirm against callers.
 *
 * @param mpool         module providing the alloc/free callbacks
 * @param addr          buffer to reallocate
 * @param size          requested new size in bytes
 * @param registration  in: registration of `addr`;
 *                      out: registration of the returned buffer
 *
 * @return the new buffer, or NULL if the allocation failed; on failure the
 *         old buffer is left intact and *registration is restored to the
 *         old registration
 */
void* mca_mpool_openib_realloc(
    mca_mpool_base_module_t* mpool,
    void* addr,
    size_t size,
    mca_mpool_base_registration_t** registration)
{
    mca_mpool_base_registration_t* old_reg = *registration;
    /* bound is inclusive, hence the + 1 */
    size_t old_size = (size_t) ((char*) old_reg->bound - (char*) old_reg->base) + 1;
    size_t copy_size = (size < old_size) ? size : old_size;
    void* new_mem = mpool->mpool_alloc(mpool, size, 0, 0, registration);

    if(NULL == new_mem) {
        /* The alloc path may have overwritten *registration; undo that. */
        *registration = old_reg;
        return NULL;
    }

    memcpy(new_mem, addr, copy_size);
    mpool->mpool_free(mpool, addr, old_reg);
    return new_mem;
}
/**
 * Release a buffer obtained from this mpool.
 *
 * The registration is torn down through the module's mpool_deregister
 * callback (its return value is not inspected), then the pointer recorded
 * in the registration's alloc_base is handed to free().  The `addr`
 * argument itself is not used.
 *
 * @param mpool         module providing the deregister callback
 * @param addr          buffer being freed (unused)
 * @param registration  registration describing the buffer
 */
void mca_mpool_openib_free(mca_mpool_base_module_t* mpool, void * addr,
                           mca_mpool_base_registration_t* registration)
{
    void* backing;

    mpool->mpool_deregister(mpool, registration);

    /* Read alloc_base only after deregistration, then release the memory. */
    backing = registration->alloc_base;
    free(backing);
}
/*
 * Look up registrations for a memory range.
 *
 * Thin wrapper: the query is forwarded unchanged to the rcache_find
 * callback of the module's rcache, and its result is returned as-is.
 *
 * @param mpool  module whose rcache is queried
 * @param addr   start of the range
 * @param size   length of the range
 * @param regs   passed through to rcache_find
 * @param cnt    passed through to rcache_find
 *
 * @return whatever rcache_find returns
 */
int mca_mpool_openib_find(
    struct mca_mpool_base_module_t* mpool,
    void* addr,
    size_t size,
    ompi_pointer_array_t *regs,
    uint32_t *cnt
    ){
    int rc = mpool->rcache->rcache_find(mpool->rcache, addr, size, regs, cnt);

    return rc;
}
/*
 * Drop one reference on a registration.
 *
 * The reference count is decremented with OPAL_THREAD_ADD32; when the
 * result is zero the registration is torn down through the module's
 * mpool_deregister callback.  The callback's return value is not
 * propagated.
 *
 * @param mpool         module providing the deregister callback
 * @param registration  registration to release
 *
 * @return always OMPI_SUCCESS
 */
int mca_mpool_openib_release(
    struct mca_mpool_base_module_t* mpool,
    mca_mpool_base_registration_t* registration
    ){
    /* Still referenced elsewhere: nothing more to do. */
    if(0 != OPAL_THREAD_ADD32(&registration->ref_count, -1)) {
        return OMPI_SUCCESS;
    }

    mpool->mpool_deregister(mpool, registration);
    return OMPI_SUCCESS;
}
/*
 * Take one additional reference on a registration.
 *
 * The reference count is incremented with OPAL_THREAD_ADD32; the `mpool`
 * argument is not used.
 *
 * @param mpool         owning module (unused)
 * @param registration  registration to retain
 *
 * @return always OMPI_SUCCESS
 */
int mca_mpool_openib_retain(struct mca_mpool_base_module_t* mpool,
                            mca_mpool_base_registration_t* registration
                            ){
    (void) OPAL_THREAD_ADD32(&registration->ref_count, 1);

    return OMPI_SUCCESS;
}