13643f5b6e
This commit makes the folowing changes: - Add support for the knem single-copy mechanism. Initially vader will only support the synchronous copy mode. Asynchronous copy support may be added int the future. - Improve Linux cross memory attach (CMA) when using restrictive ptrace settings. This will allow Open MPI to use CMA without modifying the system settings to support ptrace attach (see /etc/sysctl.d/10-ptrace.conf). - Allow runtime selection of the single copy mechanism. The default behavior is to use the best available. The priority list of single-copy mehanisms is as follows: xpmem, cma, and knem. - Allow disabling support for kernel-assisted single copy. - Some tuning and bug fixes.
137 строки
4.4 KiB
C
137 строки
4.4 KiB
C
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
|
/*
|
|
* Copyright (c) 2011-2014 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* Copyright (c) 2014 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "btl_vader.h"
|
|
|
|
#include "opal/include/opal/align.h"
|
|
#include "opal/mca/memchecker/base/base.h"
|
|
|
|
#if OPAL_BTL_VADER_HAVE_XPMEM
|
|
|
|
/* look up the remote pointer in the peer rcache and attach if
|
|
* necessary */
|
|
mca_mpool_base_registration_t *vader_get_registation (struct mca_btl_base_endpoint_t *ep, void *rem_ptr,
|
|
size_t size, int flags, void **local_ptr)
|
|
{
|
|
struct mca_rcache_base_module_t *rcache = ep->segment_data.xpmem.rcache;
|
|
mca_mpool_base_registration_t *regs[10], *reg = NULL;
|
|
xpmem_addr_t xpmem_addr;
|
|
uintptr_t base, bound;
|
|
int rc, i;
|
|
|
|
/* protect rcache access */
|
|
OPAL_THREAD_LOCK(&ep->lock);
|
|
|
|
/* use btl/self for self communication */
|
|
assert (ep->peer_smp_rank != MCA_BTL_VADER_LOCAL_RANK);
|
|
|
|
base = (uintptr_t) down_align_addr(rem_ptr, mca_btl_vader_component.log_attach_align);
|
|
bound = (uintptr_t) up_align_addr((void *)((uintptr_t) rem_ptr + size - 1),
|
|
mca_btl_vader_component.log_attach_align) + 1;
|
|
if (OPAL_UNLIKELY(bound > VADER_MAX_ADDRESS)) {
|
|
bound = VADER_MAX_ADDRESS;
|
|
}
|
|
|
|
/* several segments may match the base pointer */
|
|
rc = rcache->rcache_find_all (rcache, (void *) base, bound - base, regs, 10);
|
|
for (i = 0 ; i < rc ; ++i) {
|
|
if (bound <= (uintptr_t)regs[i]->bound && base >= (uintptr_t)regs[i]->base) {
|
|
(void)opal_atomic_add (®s[i]->ref_count, 1);
|
|
reg = regs[i];
|
|
goto reg_found;
|
|
}
|
|
|
|
if (regs[i]->flags & MCA_MPOOL_FLAGS_PERSIST) {
|
|
continue;
|
|
}
|
|
|
|
/* remove this pointer from the rcache and decrement its reference count
|
|
(so it is detached later) */
|
|
rc = rcache->rcache_delete (rcache, regs[i]);
|
|
if (OPAL_UNLIKELY(0 != rc)) {
|
|
/* someone beat us to it? */
|
|
break;
|
|
}
|
|
|
|
/* start the new segment from the lower of the two bases */
|
|
base = (uintptr_t) regs[i]->base < base ? (uintptr_t) regs[i]->base : base;
|
|
|
|
(void)opal_atomic_add (®s[i]->ref_count, -1);
|
|
|
|
if (OPAL_LIKELY(0 == regs[i]->ref_count)) {
|
|
/* this pointer is not in use */
|
|
(void) xpmem_detach (regs[i]->alloc_base);
|
|
OBJ_RELEASE(regs[i]);
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
reg = OBJ_NEW(mca_mpool_base_registration_t);
|
|
if (OPAL_LIKELY(NULL != reg)) {
|
|
/* stick around for awhile */
|
|
reg->ref_count = 2;
|
|
reg->base = (unsigned char *) base;
|
|
reg->bound = (unsigned char *) bound;
|
|
reg->flags = flags;
|
|
|
|
#if defined(HAVE_SN_XPMEM_H)
|
|
xpmem_addr.id = ep->segment_data.xpmem.apid;
|
|
#else
|
|
xpmem_addr.apid = ep->segment_data.xpmem.apid;
|
|
#endif
|
|
xpmem_addr.offset = base;
|
|
|
|
reg->alloc_base = xpmem_attach (xpmem_addr, bound - base, NULL);
|
|
if (OPAL_UNLIKELY((void *)-1 == reg->alloc_base)) {
|
|
OPAL_THREAD_UNLOCK(&ep->lock);
|
|
OBJ_RELEASE(reg);
|
|
return NULL;
|
|
}
|
|
|
|
opal_memchecker_base_mem_defined (reg->alloc_base, bound - base);
|
|
|
|
rcache->rcache_insert (rcache, reg, 0);
|
|
}
|
|
|
|
reg_found:
|
|
opal_atomic_wmb ();
|
|
*local_ptr = (void *) ((uintptr_t) reg->alloc_base +
|
|
(ptrdiff_t)((uintptr_t) rem_ptr - (uintptr_t) reg->base));
|
|
|
|
OPAL_THREAD_UNLOCK(&ep->lock);
|
|
|
|
return reg;
|
|
}
|
|
|
|
void vader_return_registration (mca_mpool_base_registration_t *reg, struct mca_btl_base_endpoint_t *ep)
|
|
{
|
|
struct mca_rcache_base_module_t *rcache = ep->segment_data.xpmem.rcache;
|
|
int32_t ref_count;
|
|
|
|
ref_count = opal_atomic_add_32 (®->ref_count, -1);
|
|
if (OPAL_UNLIKELY(0 == ref_count && !(reg->flags & MCA_MPOOL_FLAGS_PERSIST))) {
|
|
/* protect rcache access */
|
|
OPAL_THREAD_LOCK(&ep->lock);
|
|
rcache->rcache_delete (rcache, reg);
|
|
OPAL_THREAD_UNLOCK(&ep->lock);
|
|
|
|
opal_memchecker_base_mem_noaccess (reg->alloc_base, (uintptr_t)(reg->bound - reg->base));
|
|
(void)xpmem_detach (reg->alloc_base);
|
|
OBJ_RELEASE (reg);
|
|
}
|
|
}
|
|
|
|
#endif /* OPAL_BTL_VADER_HAVE_XPMEM */
|