/*
 * Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
 *                         University Research and Technology
 *                         Corporation.  All rights reserved.
 * Copyright (c) 2004-2005 The University of Tennessee and The University
 *                         of Tennessee Research Foundation.  All rights
 *                         reserved.
 * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
 *                         University of Stuttgart.  All rights reserved.
 * Copyright (c) 2004-2005 The Regents of the University of California.
 *                         All rights reserved.
 * Copyright (c) 2006      Cisco Systems, Inc.  All rights reserved.
 * $COPYRIGHT$
 *
 * Additional copyrights may follow
 *
 * $HEADER$
 */

#include "ompi_config.h"
#include "opal/util/output.h"
#include "ompi/mca/mpool/openib/mpool_openib.h"
#include <infiniband/verbs.h>
#include <errno.h>
#include <stdlib.h>
#include <string.h>
#include <malloc.h>
#include "ompi/mca/rcache/rcache.h"
#include "ompi/mca/rcache/base/base.h"
#include "ompi/mca/mpool/base/base.h"

extern uint32_t mca_mpool_base_page_size;
extern uint32_t mca_mpool_base_page_size_log;

/*
 *  Initializes the mpool module.
 *
 *  Fills in the function table of the base module, creates the
 *  registration cache named by the component, and sets up the free
 *  list from which registration descriptors are drawn.
 */
void mca_mpool_openib_module_init(mca_mpool_openib_module_t* mpool)
{
    mpool->super.mpool_component = &mca_mpool_openib_component.super;
    mpool->super.mpool_base = NULL; /* no base .. */
    mpool->super.mpool_alloc = mca_mpool_openib_alloc;
    mpool->super.mpool_realloc = mca_mpool_openib_realloc;
    mpool->super.mpool_free = mca_mpool_openib_free;
    mpool->super.mpool_register = mca_mpool_openib_register;
    mpool->super.mpool_deregister = mca_mpool_openib_deregister;
    mpool->super.mpool_find = mca_mpool_openib_find;
    mpool->super.mpool_retain = mca_mpool_openib_retain;
    mpool->super.mpool_release = mca_mpool_openib_release;
    mpool->super.mpool_finalize = NULL;
    /* NOTE(review): the result of the rcache creation is not checked
     * here; confirm whether it can be NULL for an unknown rcache name. */
    mpool->super.rcache =
        mca_rcache_base_module_create(mca_mpool_openib_component.rcache_name);
    mpool->super.flags = MCA_MPOOL_FLAGS_MPI_ALLOC_MEM;

    OBJ_CONSTRUCT(&mpool->reg_list, ompi_free_list_t);
    ompi_free_list_init(&mpool->reg_list,
                        sizeof(mca_mpool_openib_registration_t),
                        OBJ_CLASS(mca_mpool_openib_registration_t),
                        0, -1, 32, NULL);
}


/**
 * allocate function
 *
 * Allocates `size` bytes aligned to the mpool page size and registers
 * them through the module's register entry point.
 *
 * @param mpool         mpool module performing the allocation
 * @param size          number of bytes requested
 * @param align         not consulted; the buffer is always page aligned
 * @param flags         passed through to the register function
 * @param registration  (OUT) registration describing the new buffer
 *
 * @return the new buffer, or NULL if either the allocation or the
 *         registration failed (nothing is leaked in that case).
 */
void* mca_mpool_openib_alloc(
    mca_mpool_base_module_t* mpool,
    size_t size,
    size_t align,
    uint32_t flags,
    mca_mpool_base_registration_t** registration)
{
    void* addr_malloc = memalign(mca_mpool_base_page_size, size);

    /* Do not attempt to register a buffer we failed to obtain. */
    if(NULL == addr_malloc) {
        return NULL;
    }

    if(OMPI_SUCCESS !=
       mpool->mpool_register(mpool, addr_malloc, size, flags, registration)) {
        free(addr_malloc);
        return NULL;
    }

    /* Remember the pointer to hand back to free() later. */
    (*registration)->alloc_base = addr_malloc;
    return addr_malloc;
}


/*
 * register memory
 *
 * Takes a registration descriptor from the module's free list, rounds
 * [addr, addr + size) out to page boundaries and registers that range
 * with ibv_reg_mr().  When MCA_MPOOL_FLAGS_CACHE or
 * MCA_MPOOL_FLAGS_PERSIST is set the registration is also inserted into
 * the rcache.  One reference is taken on behalf of the caller.
 *
 * Returns OMPI_SUCCESS, the free-list error code, or OMPI_ERROR when
 * ibv_reg_mr() fails.  *registration is written only on success.
 */
int mca_mpool_openib_register(
    mca_mpool_base_module_t* mpool,
    void *addr,
    size_t size,
    uint32_t flags,
    mca_mpool_base_registration_t** registration)
{
    mca_mpool_openib_module_t *mpool_module = (mca_mpool_openib_module_t*) mpool;
    mca_mpool_openib_registration_t *vapi_reg;
    ompi_free_list_item_t *item;
    int rc;

    OMPI_FREE_LIST_GET(&mpool_module->reg_list, item, rc);
    if(OMPI_SUCCESS != rc) {
        return rc;
    }
    vapi_reg = (mca_mpool_openib_registration_t*) item;

    vapi_reg->base_reg.mpool = mpool;
    vapi_reg->base_reg.base =
        down_align_addr(addr, mca_mpool_base_page_size_log);
    vapi_reg->base_reg.bound =
        up_align_addr((void*) ((char*) addr + size - 1),
                      mca_mpool_base_page_size_log);
    /* bound is inclusive, hence the +1 */
    size = vapi_reg->base_reg.bound - vapi_reg->base_reg.base + 1;

    vapi_reg->mr = ibv_reg_mr(
        mpool_module->resources.ib_pd,
        vapi_reg->base_reg.base,
        size,
        IBV_ACCESS_LOCAL_WRITE | IBV_ACCESS_REMOTE_WRITE | IBV_ACCESS_REMOTE_READ);

    if(NULL == vapi_reg->mr) {
        /* Give the descriptor back instead of leaking it, and leave the
         * caller's *registration untouched. */
        OMPI_FREE_LIST_RETURN(&mpool_module->reg_list, item);
        return OMPI_ERROR;
    }

    *registration = &vapi_reg->base_reg;

    if(flags & (MCA_MPOOL_FLAGS_CACHE | MCA_MPOOL_FLAGS_PERSIST)) {
        /* NOTE(review): the result of rcache_insert is ignored, as in
         * the original code; confirm whether it can fail. */
        mpool->rcache->rcache_insert(mpool->rcache,
                                     (mca_mpool_base_registration_t*) vapi_reg,
                                     flags);
    }

    vapi_reg->base_reg.flags = flags;
    mca_mpool_openib_retain(mpool, (mca_mpool_base_registration_t*) vapi_reg);

    return OMPI_SUCCESS;
}


/*
 * deregister memory
 *
 * Removes the registration from the rcache if it was inserted there
 * (CACHE or PERSIST flag set), clears its flags, and then drops one
 * reference via mca_mpool_openib_release().
 */
int mca_mpool_openib_deregister(
    mca_mpool_base_module_t* mpool,
    mca_mpool_base_registration_t* registration)
{
    if(registration->flags & (MCA_MPOOL_FLAGS_CACHE | MCA_MPOOL_FLAGS_PERSIST)) {
        mpool->rcache->rcache_delete(mpool->rcache,
                                     registration,
                                     registration->flags);
        registration->flags = 0;
    }
    return mca_mpool_openib_release(mpool, registration);
}


/**
 * realloc function
 *
 * Allocates and registers a new buffer of `size` bytes, copies the old
 * contents into it and frees the old buffer.
 *
 * @param mpool         mpool module owning the buffer
 * @param addr          buffer previously returned by the alloc function
 * @param size          requested new size in bytes
 * @param registration  (IN) registration of addr, (OUT) registration of
 *                      the returned buffer
 *
 * @return the new buffer, or NULL on failure, in which case the old
 *         buffer and *registration are left as they were.
 */
void* mca_mpool_openib_realloc(
    mca_mpool_base_module_t* mpool,
    void* addr,
    size_t size,
    mca_mpool_base_registration_t** registration)
{
    mca_mpool_base_registration_t* old_reg = *registration;
    size_t old_len;
    void* new_mem = mpool->mpool_alloc(mpool, size, 0, 0, registration);

    if(NULL == new_mem) {
        *registration = old_reg;
        return NULL;
    }

    /* The exact size of the old allocation is not recorded, so the
     * registered (inclusive) span is used as the old length; it is
     * clamped to the new size so a shrinking realloc cannot write past
     * the end of the new buffer. */
    old_len = (size_t) (old_reg->bound - old_reg->base) + 1;
    memcpy(new_mem, addr, old_len < size ? old_len : size);

    mpool->mpool_free(mpool, addr, old_reg);
    return new_mem;
}


/**
 * free function
 *
 * Deregisters the buffer and releases the memory that was obtained by
 * the alloc function.
 */
void mca_mpool_openib_free(
    mca_mpool_base_module_t* mpool,
    void * addr,
    mca_mpool_base_registration_t* registration)
{
    /* Deregistering may hand the descriptor back to the free list, so
     * read alloc_base before giving up our reference. */
    void *alloc_base = registration->alloc_base;

    mpool->mpool_deregister(mpool, registration);
    free(alloc_base);
}


/*
 * find registrations
 *
 * Forwards the lookup for [addr, addr + size) to the module's rcache
 * and returns its result.
 */
int mca_mpool_openib_find(
    struct mca_mpool_base_module_t* mpool,
    void* addr,
    size_t size,
    ompi_pointer_array_t *regs,
    uint32_t *cnt)
{
    return mpool->rcache->rcache_find(mpool->rcache, addr, size, regs, cnt);
}


/*
 * release a reference
 *
 * Decrements the reference count.  When it drops to zero (or below) the
 * memory region is deregistered with ibv_dereg_mr() and the descriptor
 * is returned to the module's free list.
 *
 * Returns OMPI_ERROR if ibv_dereg_mr() fails (the descriptor is then
 * not returned to the free list), OMPI_SUCCESS otherwise.
 */
int mca_mpool_openib_release(
    struct mca_mpool_base_module_t* mpool,
    mca_mpool_base_registration_t* registration)
{
    if(0 >= OPAL_THREAD_ADD32(&registration->ref_count, -1)) {
        mca_mpool_openib_registration_t *openib_reg;
        mca_mpool_openib_module_t *mpool_openib = (mca_mpool_openib_module_t*) mpool;

        openib_reg = (mca_mpool_openib_registration_t*) registration;
        if(ibv_dereg_mr(openib_reg->mr)) {
            opal_output(0, "%s: error unpinning openib memory errno says %s\n",
                        __func__, strerror(errno));
            return OMPI_ERROR;
        }
        OMPI_FREE_LIST_RETURN(&mpool_openib->reg_list,
                              (ompi_free_list_item_t*) openib_reg);
    }
    return OMPI_SUCCESS;
}


/*
 * retain a reference
 *
 * Increments the registration's reference count; always returns
 * OMPI_SUCCESS.
 */
int mca_mpool_openib_retain(
    struct mca_mpool_base_module_t* mpool,
    mca_mpool_base_registration_t* registration)
{
    OPAL_THREAD_ADD32(&registration->ref_count, 1);
    return OMPI_SUCCESS;
}