/* * Copyright (c) 2004-2006 The Trustees of Indiana University and Indiana * University Research and Technology * Corporation. All rights reserved. * Copyright (c) 2004-2007 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. * Copyright (c) 2010-2012 Sandia National Laboratories. All rights reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ */ #ifndef BTL_PORTALS_H_HAS_BEEN_INCLUDED #define BTL_PORTALS_H_HAS_BEEN_INCLUDED #include #include #include "opal/class/opal_free_list.h" #include "opal/class/opal_list.h" #include "opal/datatype/opal_convertor.h" #include "opal/mca/btl/btl.h" #include "opal/mca/btl/base/base.h" #include "opal/mca/btl/base/btl_base_error.h" BEGIN_C_DECLS /* * Portals BTL component. */ struct mca_btl_portals4_component_t { /* base BTL component */ mca_btl_base_component_2_0_0_t super; unsigned int num_btls; unsigned int max_btls; /* Maximum number of accepted Portals4 cards */ struct mca_btl_portals4_module_t** btls; /* array of available BTL modules */ /* initial size of free lists */ int portals_free_list_init_num; /* max size of free lists */ int portals_free_list_max_num; /* numer of elements to grow free lists */ int portals_free_list_inc_num; /* number of eager fragments */ int portals_free_list_eager_max_num; /* do I need a portals ACK? */ int portals_need_ack; /** Length of the receive event queues */ int recv_queue_size; /* number outstanding sends and local rdma */ int32_t portals_max_outstanding_ops; /* incoming send message receive memory descriptors */ int portals_recv_mds_num; int portals_recv_mds_size; /** Event queue handles table used in PtlEQPoll */ ptl_handle_eq_t *eqs_h; }; typedef struct mca_btl_portals4_component_t mca_btl_portals4_component_t; struct mca_btl_portals4_module_t { /* base BTL module interface */ mca_btl_base_module_t super; /* number of processes we're actively connected to. Needed to know when to do activation / shutdown */ int32_t portals_num_procs; /* number of the interface (btl) */ uint32_t interface_num; /* fragment free lists */ ompi_free_list_t portals_frag_eager; ompi_free_list_t portals_frag_max; ompi_free_list_t portals_frag_user; opal_list_t portals_recv_blocks; /** Length of the receive event queues */ int recv_queue_size; /** Event queue handle */ ptl_handle_eq_t recv_eq_h; /* number outstanding sends and local rdma */ volatile int32_t portals_outstanding_ops; int32_t portals_max_outstanding_ops; /* key to use for next rdma operation */ volatile int64_t portals_rdma_key; /* our portals network interface */ ptl_handle_ni_t portals_ni_h; /** portals index */ ptl_pt_index_t recv_idx; /** MD handle for sending ACKS */ ptl_handle_md_t zero_md_h; /** Send MD handle(s). Use opal_mtl_portals4_get_md() to get the right md */ #if OPAL_PORTALS4_MAX_MD_SIZE < OPAL_PORTALS4_MAX_VA_SIZE ptl_handle_md_t *send_md_hs; #else ptl_handle_md_t send_md_h; #endif /** long message receive overflow ME. Persistent ME, first in overflow list on the recv_idx portal table. */ ptl_handle_me_t long_overflow_me_h; }; typedef struct mca_btl_portals4_module_t mca_btl_portals4_module_t; /* match/ignore bit manipulation * * 0123 4567 01234567 01234567 01234567 01234567 01234567 01234567 01234567 * | | | * ^ | context id | source | message tag * | | | | * +---- protocol */ #define BTL_PORTALS4_PROTOCOL_MASK 0xF000000000000000ULL #define BTL_PORTALS4_CONTEXT_MASK 0x0FFF000000000000ULL #define BTL_PORTALS4_SOURCE_MASK 0x0000FFFF00000000ULL #define BTL_PORTALS4_TAG_MASK 0x00000000FFFFFFFFULL #define BTL_PORTALS4_PROTOCOL_IGNR BTL_PORTALS4_PROTOCOL_MASK #define BTL_PORTALS4_CONTEXT_IGNR BTL_PORTALS4_CONTEXT_MASK #define BTL_PORTALS4_SOURCE_IGNR BTL_PORTALS4_SOURCE_MASK #define BTL_PORTALS4_TAG_IGNR 0x000000007FFFFFFFULL #define BTL_PORTALS4_SHORT_MSG 0x1000000000000000ULL #define BTL_PORTALS4_LONG_MSG 0x2000000000000000ULL /* send posting */ #define BTL_PORTALS4_SET_SEND_BITS(match_bits, contextid, source, tag, type) \ { \ match_bits = contextid; \ match_bits = (match_bits << 16); \ match_bits |= source; \ match_bits = (match_bits << 32); \ match_bits |= (BTL_PORTALS4_TAG_MASK & tag) | type; \ } #define BTL_PORTALS4_SET_HDR_DATA(hdr_data, opcount, length, sync) \ { \ hdr_data = (sync) ? 1 : 0; \ hdr_data = (hdr_data << 15); \ hdr_data |= opcount & 0x7FFFULL; \ hdr_data = (hdr_data << 48); \ hdr_data |= (length & 0xFFFFFFFFFFFFULL); \ } /* * See note in ompi/mtl/portals4/mtl_portals4.h for how we deal with * platforms that don't allow us to crate an MD that covers all of * memory. */ static inline void opal_btl_portals4_get_md(const void *ptr, ptl_handle_md_t *md_h, void **base_ptr, mca_btl_portals4_module_t *portals4_btl) { #if OPAL_PORTALS4_MAX_MD_SIZE < OPAL_PORTALS4_MAX_VA_SIZE int mask = (1ULL << (OPAL_PORTALS4_MAX_VA_SIZE - OPAL_PORTALS4_MAX_MD_SIZE + 1)) - 1; int which = (((uintptr_t) ptr) >> (OPAL_PORTALS4_MAX_MD_SIZE - 1)) & mask; *md_h = portals4_btl->send_md_hs[which]; *base_ptr = (void*) (which * (1ULL << (OPAL_PORTALS4_MAX_MD_SIZE - 1))); #else *md_h = portals4_btl->send_md_h; *base_ptr = 0; #endif } static inline int mca_btl_portals4_get_num_mds(void) { #if OPAL_PORTALS4_MAX_MD_SIZE < OPAL_PORTALS4_MAX_VA_SIZE return (1 << (OPAL_PORTALS4_MAX_VA_SIZE - OPAL_PORTALS4_MAX_MD_SIZE + 1)); #else return 1; #endif } int mca_btl_portals4_component_progress(void); void mca_btl_portals4_free_module(mca_btl_portals4_module_t *portals4_btl); /* BTL interface functions */ int mca_btl_portals4_finalize(struct mca_btl_base_module_t* btl_base); int mca_btl_portals4_add_procs(struct mca_btl_base_module_t* btl_base, size_t nprocs, struct opal_proc_t **procs, struct mca_btl_base_endpoint_t** peers, opal_bitmap_t* reachable); int mca_btl_portals4_del_procs(struct mca_btl_base_module_t* btl_base, size_t nprocs, struct opal_proc_t **procs, struct mca_btl_base_endpoint_t** peers); mca_btl_base_descriptor_t* mca_btl_portals4_alloc(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* endpoint, uint8_t order, size_t size, uint32_t flags); int mca_btl_portals4_free(struct mca_btl_base_module_t* btl_base, mca_btl_base_descriptor_t* des); mca_btl_base_descriptor_t* mca_btl_portals4_prepare_src(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* peer, mca_mpool_base_registration_t* registration, struct opal_convertor_t* convertor, uint8_t order, size_t reserve, size_t* size, uint32_t flags); mca_btl_base_descriptor_t* mca_btl_portals4_prepare_dst(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* peer, mca_mpool_base_registration_t* registration, struct opal_convertor_t* convertor, uint8_t order, size_t reserve, size_t* size, uint32_t flags); int mca_btl_portals4_send(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* btl_peer, struct mca_btl_base_descriptor_t* descriptor, mca_btl_base_tag_t tag); int mca_btl_portals4_sendi(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* endpoint, struct opal_convertor_t* convertor, void* header, size_t header_size, size_t payload_size, uint8_t order, uint32_t flags, mca_btl_base_tag_t tag, mca_btl_base_descriptor_t** des); int mca_btl_portals4_put(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* btl_peer, struct mca_btl_base_descriptor_t* decriptor); int mca_btl_portals4_get(struct mca_btl_base_module_t* btl_base, struct mca_btl_base_endpoint_t* btl_peer, struct mca_btl_base_descriptor_t* decriptor); int mca_btl_portals4_get_error(int ptl_error); /* * global structures */ OPAL_MODULE_DECLSPEC extern mca_btl_portals4_component_t mca_btl_portals4_component; extern mca_btl_portals4_module_t mca_btl_portals4_module; /** * An abstraction that represents a connection to a endpoint process. * An instance of mca_btl_base_endpoint_t is associated w/ each process * and BTL pair at startup. However, connections to the endpoint * are established dynamically on an as-needed basis: */ struct mca_btl_base_endpoint_t { ptl_process_t ptl_proc; }; typedef struct mca_btl_base_endpoint_t mca_btl_base_endpoint_t; END_C_DECLS #endif /* BTL_PORTALS_H_HAS_BEEN_INCLUDED */