552c9ca5a0
WHAT: Open our low-level communication infrastructure by moving all necessary components (btl/rcache/allocator/mpool) down into OPAL. All the components required for inter-process communications are currently deeply integrated in the OMPI layer. Several groups/institutions have expressed interest in having a more generic communication infrastructure, without all the OMPI layer dependencies. This communication layer should be made available at a different software level, available to all layers in the Open MPI software stack. As an example, our ORTE layer could replace the current OOB and instead use the BTL directly, gaining access to more reactive network interfaces than TCP. Similarly, external software libraries could take advantage of our highly optimized AM (active message) communication layer for their own purposes. UTK, with support from Sandia, developed a version of Open MPI where the entire communication infrastructure has been moved down to OPAL (btl/rcache/allocator/mpool). Most of the moved components have been updated to match the new schema, with few exceptions (mainly BTLs where I have no way of compiling/testing them). Thus, the completion of this RFC is tied to being able to complete this move for all BTLs. For this we need help from the rest of the Open MPI community, especially those supporting some of the BTLs. A non-exhaustive list of BTLs that qualify here is: mx, portals4, scif, udapl, ugni, usnic. This commit was SVN r32317.
109 строки
3.2 KiB
C
109 строки
3.2 KiB
C
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
|
/*
|
|
* Copyright (c) 2013 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#if !defined(MCA_BTL_SCIF_FRAG_H)
|
|
#define MCA_BTL_SCIF_FRAG_H
|
|
|
|
#include "btl_scif.h"
|
|
#include "btl_scif_endpoint.h"
|
|
|
|
typedef struct mca_btl_scif_segment_t {
|
|
mca_btl_base_segment_t base;
|
|
|
|
/* scif offset */
|
|
off_t scif_offset;
|
|
|
|
/* original pointer */
|
|
uint64_t orig_ptr;
|
|
} mca_btl_scif_segment_t;
|
|
|
|
/**
 * Header stored in every SCIF fragment.
 *
 * The member order is part of the layout and must not be changed. The
 * sequence number only exists in builds that define SCIF_USE_SEQ.
 */
typedef struct mca_btl_scif_frag_hdr_t {
#if defined(SCIF_USE_SEQ)
    uint32_t seq;     /* sequence number (only with SCIF_USE_SEQ) */
#endif
    uint8_t  tag;     /* NOTE(review): presumably the BTL active-message tag -- confirm */
    uint8_t  flags;   /* per-fragment flag bits */
    uint16_t size;    /* NOTE(review): presumably the payload size in bytes -- confirm */
} mca_btl_scif_frag_hdr_t;
|
|
|
|
/* Forward declaration so the callback type below can refer to the fragment. */
struct mca_btl_scif_base_frag_t;

/**
 * Signature of a fragment callback: receives the fragment and an integer
 * status value.
 * NOTE(review): no user of this type is visible in this header -- confirm the
 * meaning of the integer argument against the callers.
 */
typedef void (*frag_cb_t) (struct mca_btl_scif_base_frag_t *frag, int status);
|
|
|
|
typedef struct mca_btl_scif_base_frag_t {
|
|
mca_btl_base_descriptor_t base;
|
|
mca_btl_scif_frag_hdr_t hdr;
|
|
mca_btl_scif_segment_t segments[2];
|
|
mca_btl_base_endpoint_t *endpoint;
|
|
mca_btl_scif_reg_t *registration;
|
|
ompi_free_list_t *my_list;
|
|
} mca_btl_scif_base_frag_t;
|
|
|
|
/*
 * The DMA and eager fragment types share the layout of the base fragment;
 * each gets its own class declaration.
 */
typedef mca_btl_scif_base_frag_t mca_btl_scif_dma_frag_t;
typedef mca_btl_scif_base_frag_t mca_btl_scif_eager_frag_t;

OBJ_CLASS_DECLARATION(mca_btl_scif_dma_frag_t);
OBJ_CLASS_DECLARATION(mca_btl_scif_eager_frag_t);
|
|
|
|
static inline int mca_btl_scif_frag_alloc (mca_btl_base_endpoint_t *ep,
|
|
ompi_free_list_t *list,
|
|
mca_btl_scif_base_frag_t **frag)
|
|
{
|
|
ompi_free_list_item_t *item = NULL;
|
|
|
|
OMPI_FREE_LIST_GET_MT(list, item);
|
|
*frag = (mca_btl_scif_base_frag_t *) item;
|
|
if (OPAL_LIKELY(NULL != item)) {
|
|
(*frag)->my_list = list;
|
|
(*frag)->endpoint = ep;
|
|
return OPAL_SUCCESS;
|
|
}
|
|
|
|
return OPAL_ERR_OUT_OF_RESOURCE;
|
|
}
|
|
|
|
/**
 * Reset a fragment and hand it back to the free list it came from.
 *
 * Any memory registration still attached to the fragment is released through
 * the BTL's mpool first. The segments are then reset (first segment pointing
 * at the fragment's own buffer, both lengths zero) before the fragment is
 * pushed back onto frag->my_list.
 *
 * @param frag  fragment to release
 *
 * @return always OPAL_SUCCESS
 */
static inline int mca_btl_scif_frag_return (mca_btl_scif_base_frag_t *frag)
{
    if (NULL != frag->registration) {
        frag->endpoint->btl->super.btl_mpool->mpool_deregister(frag->endpoint->btl->super.btl_mpool,
                                                               &frag->registration->base);
        frag->registration = NULL;
    }

    /* leave the fragment in a clean state for its next user */
    frag->segments[1].base.seg_len = 0;
    frag->segments[0].base.seg_len = 0;
    frag->segments[0].base.seg_addr.pval = frag->base.super.ptr;

    OMPI_FREE_LIST_RETURN_MT(frag->my_list, (ompi_free_list_item_t *) frag);

    return OPAL_SUCCESS;
}
|
|
|
|
/**
 * Finish processing of a fragment.
 *
 * Invokes the descriptor's completion callback when
 * MCA_BTL_DES_SEND_ALWAYS_CALLBACK is set, then returns the fragment to its
 * free list when MCA_BTL_DES_FLAGS_BTL_OWNERSHIP is set.
 *
 * @param frag  fragment that has completed
 * @param rc    status code passed through unchanged to the callback
 */
static inline void mca_btl_scif_frag_complete (mca_btl_scif_base_frag_t *frag, int rc) {
    /* Snapshot the ownership bit before running the callback. The callback is
     * free to release or recycle the descriptor, so des_flags must not be
     * re-read once it has returned: a recycled fragment could carry different
     * flags and end up being returned to the free list twice. */
    const int btl_ownership = (frag->base.des_flags & MCA_BTL_DES_FLAGS_BTL_OWNERSHIP);

    BTL_VERBOSE(("frag complete. flags = %d", frag->base.des_flags));

    /* call callback if specified */
    if (frag->base.des_flags & MCA_BTL_DES_SEND_ALWAYS_CALLBACK) {
        frag->base.des_cbfunc(&frag->endpoint->btl->super, frag->endpoint, &frag->base, rc);
    }

    /* the BTL owns the fragment: release it here on behalf of the caller */
    if (btl_ownership) {
        mca_btl_scif_frag_return (frag);
    }
}
|
|
|
|
/*
 * Convenience wrappers around mca_btl_scif_frag_alloc() that pick the eager
 * or DMA free list of the endpoint's BTL module. Both evaluate to the
 * allocator's return code and store the fragment pointer in `frag`.
 * Note that `ep` is evaluated twice.
 */
#define MCA_BTL_SCIF_FRAG_ALLOC_EAGER(ep, frag) \
    mca_btl_scif_frag_alloc((ep), &(ep)->btl->eager_frags, &(frag))

#define MCA_BTL_SCIF_FRAG_ALLOC_DMA(ep, frag) \
    mca_btl_scif_frag_alloc((ep), &(ep)->btl->dma_frags, &(frag))
|
|
|
|
#endif /* MCA_BTL_SCIF_FRAG_H */
|