/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */ /* * Copyright (c) 2011-2016 Los Alamos National Security, LLC. All rights * reserved. * Copyright (c) 2011 UT-Battelle, LLC. All rights reserved. * Copyright (c) 2013 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ */ #if !defined(MCA_BTL_UGNI_FRAG_H) #define MCA_BTL_UGNI_FRAG_H #include "btl_ugni.h" #include "btl_ugni_endpoint.h" typedef struct mca_btl_ugni_send_frag_hdr_t { uint32_t lag; } mca_btl_ugni_send_frag_hdr_t; typedef struct mca_btl_ugni_send_ex_frag_hdr_t { mca_btl_ugni_send_frag_hdr_t send; uint8_t pml_header[128]; } mca_btl_ugni_send_ex_frag_hdr_t; typedef struct mca_btl_ugni_rdma_frag_hdr_t { void *ctx; } mca_btl_ugni_rdma_frag_hdr_t; typedef struct mca_btl_ugni_eager_frag_hdr_t { mca_btl_ugni_send_frag_hdr_t send; uint32_t size; uint64_t address; mca_btl_base_registration_handle_t memory_handle; void *ctx; } mca_btl_ugni_eager_frag_hdr_t; typedef struct mca_btl_ugni_eager_ex_frag_hdr_t { mca_btl_ugni_eager_frag_hdr_t eager; uint8_t pml_header[128]; } mca_btl_ugni_eager_ex_frag_hdr_t; typedef union mca_btl_ugni_frag_hdr_t { mca_btl_ugni_send_frag_hdr_t send; mca_btl_ugni_send_ex_frag_hdr_t send_ex; mca_btl_ugni_rdma_frag_hdr_t rdma; mca_btl_ugni_eager_frag_hdr_t eager; mca_btl_ugni_eager_ex_frag_hdr_t eager_ex; } mca_btl_ugni_frag_hdr_t; enum { MCA_BTL_UGNI_FRAG_BUFFERED = 1, /* frag data is buffered */ MCA_BTL_UGNI_FRAG_COMPLETE = 2, /* smsg complete for frag */ MCA_BTL_UGNI_FRAG_EAGER = 4, /* eager get frag */ MCA_BTL_UGNI_FRAG_IGNORE = 8, /* ignore local smsg completion */ MCA_BTL_UGNI_FRAG_SMSG_COMPLETE = 16, /* SMSG has completed for this message */ MCA_BTL_UGNI_FRAG_RESPONSE = 32, }; struct mca_btl_ugni_base_frag_t; typedef struct mca_btl_ugni_base_frag_t { mca_btl_base_descriptor_t base; volatile int32_t ref_cnt; uint32_t msg_id; uint16_t hdr_size; uint16_t flags; mca_btl_ugni_frag_hdr_t hdr; mca_btl_base_segment_t segments[2]; opal_common_ugni_post_desc_t post_desc; mca_btl_base_endpoint_t *endpoint; mca_btl_ugni_reg_t *registration; opal_free_list_t *my_list; mca_btl_base_registration_handle_t memory_handle; } mca_btl_ugni_base_frag_t; typedef struct mca_btl_ugni_base_frag_t mca_btl_ugni_smsg_frag_t; typedef struct mca_btl_ugni_base_frag_t mca_btl_ugni_rdma_frag_t; typedef struct mca_btl_ugni_base_frag_t mca_btl_ugni_eager_frag_t; #define MCA_BTL_UGNI_DESC_TO_FRAG(desc) \ ((mca_btl_ugni_base_frag_t *)((uintptr_t) (desc) - offsetof (mca_btl_ugni_base_frag_t, post_desc))) typedef struct mca_btl_ugni_post_descriptor_t { opal_free_list_item_t super; opal_common_ugni_post_desc_t desc; mca_btl_base_endpoint_t *endpoint; mca_btl_base_registration_handle_t *local_handle; mca_btl_base_rdma_completion_fn_t cbfunc; void *cbdata; void *ctx; } mca_btl_ugni_post_descriptor_t; OBJ_CLASS_DECLARATION(mca_btl_ugni_post_descriptor_t); #define MCA_BTL_UGNI_DESC_TO_PDESC(desc) \ ((mca_btl_ugni_post_descriptor_t *)((uintptr_t) (desc) - offsetof (mca_btl_ugni_post_descriptor_t, desc))) static inline void mca_btl_ugni_alloc_post_descriptor (mca_btl_base_endpoint_t *endpoint, mca_btl_base_registration_handle_t *local_handle, mca_btl_base_rdma_completion_fn_t cbfunc, void *cbcontext, void *cbdata, mca_btl_ugni_post_descriptor_t **desc) { *desc = (mca_btl_ugni_post_descriptor_t *) opal_free_list_get (&endpoint->btl->post_descriptors); if (NULL != *desc) { (*desc)->cbfunc = cbfunc; (*desc)->ctx = cbcontext; (*desc)->cbdata = cbdata; (*desc)->local_handle = local_handle; (*desc)->endpoint = endpoint; (void) OPAL_THREAD_ADD64(&endpoint->btl->active_rdma_count, 1); } } static inline void mca_btl_ugni_return_post_descriptor (mca_btl_ugni_module_t *module, mca_btl_ugni_post_descriptor_t *desc) { (void) OPAL_THREAD_ADD64(&module->active_rdma_count, -1); opal_free_list_return (&module->post_descriptors, &desc->super); } static inline void mca_btl_ugni_post_desc_complete (mca_btl_ugni_module_t *module, mca_btl_ugni_post_descriptor_t *desc, int rc) { BTL_VERBOSE(("RDMA/FMA/ATOMIC operation complete for post descriptor %p. rc = %d", (void *) desc, rc)); if (NULL != desc->cbfunc) { /* call the user's callback function */ desc->cbfunc (&module->super, desc->endpoint, (void *)(intptr_t) desc->desc.base.local_addr, desc->local_handle, desc->ctx, desc->cbdata, rc); } /* the descriptor is no longer needed */ mca_btl_ugni_return_post_descriptor (module, desc); } OBJ_CLASS_DECLARATION(mca_btl_ugni_smsg_frag_t); OBJ_CLASS_DECLARATION(mca_btl_ugni_rdma_frag_t); OBJ_CLASS_DECLARATION(mca_btl_ugni_eager_frag_t); int mca_btl_ugni_frag_init (mca_btl_ugni_base_frag_t *frag, mca_btl_ugni_module_t *ugni_module); static inline int mca_btl_ugni_frag_alloc (mca_btl_base_endpoint_t *ep, opal_free_list_t *list, mca_btl_ugni_base_frag_t **frag) { *frag = (mca_btl_ugni_base_frag_t *) opal_free_list_get (list); if (OPAL_LIKELY(NULL != *frag)) { (*frag)->my_list = list; (*frag)->endpoint = ep; (*frag)->ref_cnt = 1; return OPAL_SUCCESS; } return OPAL_ERR_OUT_OF_RESOURCE; } static inline int mca_btl_ugni_frag_return (mca_btl_ugni_base_frag_t *frag) { if (frag->registration) { frag->endpoint->btl->rcache->rcache_deregister (frag->endpoint->btl->rcache, (mca_rcache_base_registration_t *) frag->registration); frag->registration = NULL; } frag->flags = 0; opal_free_list_return (frag->my_list, (opal_free_list_item_t *) frag); return OPAL_SUCCESS; } static inline bool mca_btl_ugni_frag_del_ref (mca_btl_ugni_base_frag_t *frag, int rc) { int32_t ref_cnt; opal_atomic_mb (); ref_cnt = OPAL_THREAD_ADD32(&frag->ref_cnt, -1); if (ref_cnt) { assert (ref_cnt > 0); return false; } /* call callback if specified */ if (frag->base.des_flags & MCA_BTL_DES_SEND_ALWAYS_CALLBACK) { frag->base.des_cbfunc(&frag->endpoint->btl->super, frag->endpoint, &frag->base, rc); } if (frag->base.des_flags & MCA_BTL_DES_FLAGS_BTL_OWNERSHIP) { mca_btl_ugni_frag_return (frag); } return true; } static inline void mca_btl_ugni_frag_complete (mca_btl_ugni_base_frag_t *frag, int rc) { BTL_VERBOSE(("frag complete. flags = %d", frag->base.des_flags)); frag->flags |= MCA_BTL_UGNI_FRAG_COMPLETE; mca_btl_ugni_frag_del_ref (frag, rc); } static inline bool mca_btl_ugni_frag_check_complete (mca_btl_ugni_base_frag_t *frag) { return !!(MCA_BTL_UGNI_FRAG_COMPLETE & frag->flags); } #define MCA_BTL_UGNI_FRAG_ALLOC_SMSG(ep, frag) \ mca_btl_ugni_frag_alloc((ep), &(ep)->btl->smsg_frags, &(frag)) #define MCA_BTL_UGNI_FRAG_ALLOC_RDMA(ep, frag) \ mca_btl_ugni_frag_alloc((ep), &(ep)->btl->rdma_frags, &(frag)) #define MCA_BTL_UGNI_FRAG_ALLOC_RDMA_INT(ep, frag) \ mca_btl_ugni_frag_alloc((ep), &(ep)->btl->rdma_int_frags, &(frag)) #define MCA_BTL_UGNI_FRAG_ALLOC_EAGER_SEND(ep, frag) \ mca_btl_ugni_frag_alloc((ep), &(ep)->btl->eager_frags_send, &(frag)) #define MCA_BTL_UGNI_FRAG_ALLOC_EAGER_RECV(ep, frag) \ mca_btl_ugni_frag_alloc((ep), &(ep)->btl->eager_frags_recv, &(frag)) #endif /* MCA_BTL_UGNI_FRAG_H */