29f7b4deda
queue pairs. Tested on intel p2p with 16 procs - Passed. This commit was SVN r7119.
315 строки
12 KiB
C
315 строки
12 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University.
|
|
* All rights reserved.
|
|
* Copyright (c) 2004-2005 The Trustees of the University of Tennessee.
|
|
* All rights reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#ifndef MCA_BTL_IB_ENDPOINT_H
|
|
#define MCA_BTL_IB_ENDPOINT_H
|
|
|
|
#include "opal/class/opal_list.h"
|
|
#include "opal/event/event.h"
|
|
#include "mca/pml/pml.h"
|
|
#include "mca/btl/btl.h"
|
|
#include "btl_mvapi_frag.h"
|
|
#include "btl_mvapi.h"
|
|
|
|
#include <vapi.h>
|
|
#include <mtl_common.h>
|
|
#include <vapi_common.h>
|
|
|
|
|
|
#if defined(c_plusplus) || defined(__cplusplus)
|
|
extern "C" {
|
|
#endif
|
|
#define MAX_POST_RR (16)
|
|
OBJ_CLASS_DECLARATION(mca_btl_mvapi_endpoint_t);
|
|
|
|
|
|
struct mca_btl_mvapi_frag_t;
|
|
|
|
struct mca_btl_mvapi_addr_t {
|
|
uint32_t subnet;
|
|
};
|
|
typedef struct mca_btl_mvapi_addr_t mca_btl_mvapi_addr_t;
|
|
|
|
|
|
/**
|
|
* State of IB endpoint connection.
|
|
*/
|
|
|
|
typedef enum {
|
|
/* Defines the state in which this BTL instance
|
|
* has started the process of connection */
|
|
MCA_BTL_IB_CONNECTING,
|
|
|
|
/* Waiting for ack from endpoint */
|
|
MCA_BTL_IB_CONNECT_ACK,
|
|
|
|
/*Waiting for final connection ACK from endpoint */
|
|
MCA_BTL_IB_WAITING_ACK,
|
|
|
|
/* Connected ... both sender & receiver have
|
|
* buffers associated with this connection */
|
|
MCA_BTL_IB_CONNECTED,
|
|
|
|
/* Connection is closed, there are no resources
|
|
* associated with this */
|
|
MCA_BTL_IB_CLOSED,
|
|
|
|
/* Maximum number of retries have been used.
|
|
* Report failure on send to upper layer */
|
|
MCA_BTL_IB_FAILED
|
|
} mca_btl_mvapi_endpoint_state_t;
|
|
|
|
/**
|
|
* An abstraction that represents a connection to a endpoint process.
|
|
* An instance of mca_btl_base_endpoint_t is associated w/ each process
|
|
* and BTL pair at startup. However, connections to the endpoint
|
|
* are established dynamically on an as-needed basis:
|
|
*/
|
|
|
|
struct mca_btl_base_endpoint_t {
|
|
opal_list_item_t super;
|
|
|
|
struct mca_btl_mvapi_module_t* endpoint_btl;
|
|
/**< BTL instance that created this connection */
|
|
|
|
struct mca_btl_mvapi_proc_t* endpoint_proc;
|
|
/**< proc structure corresponding to endpoint */
|
|
|
|
mca_btl_mvapi_endpoint_state_t endpoint_state;
|
|
/**< current state of the connection */
|
|
|
|
size_t endpoint_retries;
|
|
/**< number of connection retries attempted */
|
|
|
|
double endpoint_tstamp;
|
|
/**< timestamp of when the first connection was attempted */
|
|
|
|
opal_mutex_t endpoint_send_lock;
|
|
/**< lock for concurrent access to endpoint state */
|
|
|
|
opal_mutex_t endpoint_recv_lock;
|
|
/**< lock for concurrent access to endpoint state */
|
|
|
|
opal_list_t pending_send_frags;
|
|
/**< list of pending send frags for this endpoint */
|
|
|
|
opal_list_t pending_frags_hp;
|
|
/**< list of pending high priority frags */
|
|
|
|
opal_list_t pending_frags_lp;
|
|
/**< list of pending low prioirty frags */
|
|
|
|
uint32_t wr_sq_tokens_hp;
|
|
/**< number of high priority frags that can be outstanding (down counter) */
|
|
|
|
|
|
uint32_t wr_sq_tokens_lp;
|
|
/**< number of low priority frags that can be outstanding (down counter) */
|
|
|
|
VAPI_qp_num_t rem_qp_num_high;
|
|
/* High priority remote side QP number */
|
|
|
|
VAPI_qp_num_t rem_qp_num_low;
|
|
/* Low prioirty remote size QP number */
|
|
|
|
IB_lid_t rem_lid;
|
|
/* Local identifier of the remote process */
|
|
|
|
VAPI_qp_hndl_t lcl_qp_hndl_high;
|
|
/* High priority local QP handle */
|
|
|
|
VAPI_qp_hndl_t lcl_qp_hndl_low;
|
|
/* Low priority local QP handle */
|
|
|
|
VAPI_qp_prop_t lcl_qp_prop_high;
|
|
/* High priority local QP properties */
|
|
|
|
VAPI_qp_prop_t lcl_qp_prop_low;
|
|
/* Low priority local QP properties */
|
|
|
|
|
|
uint32_t rr_posted_high; /**< number of high priority rr posted to the nic*/
|
|
uint32_t rr_posted_low; /**< number of low priority rr posted to the nic*/
|
|
|
|
mca_btl_mvapi_addr_t endpoint_addr;
|
|
|
|
};
|
|
|
|
typedef struct mca_btl_base_endpoint_t mca_btl_base_endpoint_t;
|
|
typedef mca_btl_base_endpoint_t mca_btl_mvapi_endpoint_t;
|
|
|
|
int mca_btl_mvapi_endpoint_send(mca_btl_base_endpoint_t* endpoint, struct mca_btl_mvapi_frag_t* frag);
|
|
int mca_btl_mvapi_endpoint_connect(mca_btl_base_endpoint_t*);
|
|
void mca_btl_mvapi_post_recv(void);
|
|
|
|
|
|
void mca_btl_mvapi_progress_send_frags(mca_btl_mvapi_endpoint_t*);
|
|
|
|
#define MCA_BTL_MVAPI_ENDPOINT_POST_RR_HIGH(post_rr_high_endpoint, \
|
|
post_rr_high_additional) \
|
|
{ \
|
|
mca_btl_mvapi_module_t * post_rr_high_mvapi_btl = post_rr_high_endpoint->endpoint_btl; \
|
|
OPAL_THREAD_LOCK(&post_rr_high_mvapi_btl->ib_lock); \
|
|
if(post_rr_high_endpoint->rr_posted_high <= mca_btl_mvapi_component.ib_rr_buf_min+post_rr_high_additional && \
|
|
post_rr_high_endpoint->rr_posted_high < mca_btl_mvapi_component.ib_rr_buf_max){ \
|
|
MCA_BTL_MVAPI_ENDPOINT_POST_RR_SUB(mca_btl_mvapi_component.ib_rr_buf_max - \
|
|
post_rr_high_endpoint->rr_posted_high, \
|
|
post_rr_high_endpoint, \
|
|
&post_rr_high_mvapi_btl->recv_free_eager, \
|
|
&post_rr_high_endpoint->rr_posted_high, \
|
|
post_rr_high_mvapi_btl->nic, \
|
|
post_rr_high_endpoint->lcl_qp_hndl_high); \
|
|
} \
|
|
OPAL_THREAD_UNLOCK(&post_rr_high_mvapi_btl->ib_lock); \
|
|
}
|
|
|
|
#define MCA_BTL_MVAPI_ENDPOINT_POST_RR_LOW(post_rr_low_endpoint, \
|
|
post_rr_low_additional) \
|
|
{ \
|
|
mca_btl_mvapi_module_t * post_rr_low_mvapi_btl = post_rr_low_endpoint->endpoint_btl; \
|
|
OPAL_THREAD_LOCK(&post_rr_low_mvapi_btl->ib_lock); \
|
|
if(post_rr_low_endpoint->rr_posted_low <= mca_btl_mvapi_component.ib_rr_buf_min+post_rr_low_additional && \
|
|
post_rr_low_endpoint->rr_posted_low < mca_btl_mvapi_component.ib_rr_buf_max){ \
|
|
MCA_BTL_MVAPI_ENDPOINT_POST_RR_SUB(mca_btl_mvapi_component.ib_rr_buf_max - \
|
|
post_rr_low_endpoint->rr_posted_low, \
|
|
post_rr_low_endpoint, \
|
|
&post_rr_low_mvapi_btl->recv_free_max, \
|
|
&post_rr_low_endpoint->rr_posted_low, \
|
|
post_rr_low_mvapi_btl->nic, \
|
|
post_rr_low_endpoint->lcl_qp_hndl_low); \
|
|
} \
|
|
OPAL_THREAD_UNLOCK(&post_rr_low_mvapi_btl->ib_lock); \
|
|
}
|
|
|
|
|
|
#define MCA_BTL_MVAPI_ENDPOINT_POST_RR_SUB(post_rr_sub_cnt, \
|
|
post_rr_sub_endpoint, \
|
|
post_rr_sub_frag_list, \
|
|
post_rr_sub_rr_posted, \
|
|
post_rr_sub_nic, \
|
|
post_rr_sub_qp ) \
|
|
{\
|
|
uint32_t post_rr_sub_i; \
|
|
int post_rr_sub_rc; \
|
|
opal_list_item_t* post_rr_sub_item; \
|
|
mca_btl_mvapi_frag_t* post_rr_sub_frag; \
|
|
mca_btl_mvapi_module_t *post_rr_sub_mvapi_btl = post_rr_sub_endpoint->endpoint_btl; \
|
|
VAPI_rr_desc_t* post_rr_sub_desc_post = post_rr_sub_mvapi_btl->rr_desc_post; \
|
|
for(post_rr_sub_i = 0; post_rr_sub_i < post_rr_sub_cnt; post_rr_sub_i++) { \
|
|
OMPI_FREE_LIST_WAIT(post_rr_sub_frag_list, post_rr_sub_item, post_rr_sub_rc); \
|
|
post_rr_sub_frag = (mca_btl_mvapi_frag_t*) post_rr_sub_item; \
|
|
post_rr_sub_frag->endpoint = post_rr_sub_endpoint; \
|
|
post_rr_sub_frag->sg_entry.len = post_rr_sub_frag->size + \
|
|
((unsigned char*) post_rr_sub_frag->segment.seg_addr.pval- \
|
|
(unsigned char*) post_rr_sub_frag->hdr); \
|
|
post_rr_sub_desc_post[post_rr_sub_i] = post_rr_sub_frag->rr_desc; \
|
|
}\
|
|
post_rr_sub_frag->ret = EVAPI_post_rr_list( post_rr_sub_nic, \
|
|
post_rr_sub_qp, \
|
|
post_rr_sub_cnt, \
|
|
post_rr_sub_desc_post); \
|
|
if(VAPI_OK != post_rr_sub_frag->ret) { \
|
|
BTL_ERROR(("error posting receive descriptors: %s",\
|
|
VAPI_strerror(post_rr_sub_frag->ret))); \
|
|
} else {\
|
|
OPAL_THREAD_ADD32(post_rr_sub_rr_posted, post_rr_sub_cnt); \
|
|
}\
|
|
}
|
|
|
|
/* static inline int mca_btl_mvapi_endpoint_post_rr_sub(int cnt, */
|
|
/* mca_btl_mvapi_endpoint_t* endpoint, */
|
|
/* ompi_free_list_t* frag_list, */
|
|
/* uint32_t* rr_posted, */
|
|
/* VAPI_hca_hndl_t nic, */
|
|
/* VAPI_qp_hndl_t qp_hndl */
|
|
/* ) */
|
|
/* { */
|
|
|
|
/* int rc, i; */
|
|
/* opal_list_item_t* item; */
|
|
/* mca_btl_mvapi_frag_t* frag; */
|
|
|
|
/* mca_btl_mvapi_module_t *mvapi_btl = endpoint->endpoint_btl; */
|
|
/* VAPI_rr_desc_t* rr_desc_post = mvapi_btl->rr_desc_post; */
|
|
|
|
/* /\* prepare frags and post receive requests *\/ */
|
|
/* for(i = 0; i < cnt; i++) { */
|
|
/* OMPI_FREE_LIST_WAIT(frag_list, item, rc); */
|
|
/* frag = (mca_btl_mvapi_frag_t*) item; */
|
|
/* frag->endpoint = endpoint; */
|
|
/* frag->sg_entry.len = frag->size + ((unsigned char*) frag->segment.seg_addr.pval- (unsigned char*) frag->hdr); /\* sizeof(mca_btl_mvapi_header_t); *\/ */
|
|
/* rr_desc_post[i] = frag->rr_desc; */
|
|
|
|
/* } */
|
|
|
|
/* frag->ret = EVAPI_post_rr_list(nic, */
|
|
/* qp_hndl, */
|
|
/* cnt, */
|
|
/* rr_desc_post); */
|
|
/* if(VAPI_OK != frag->ret) { */
|
|
/* BTL_ERROR(("error posting receive descriptors: %s", VAPI_strerror(frag->ret))); */
|
|
/* return OMPI_ERROR; */
|
|
/* } */
|
|
/* OPAL_THREAD_ADD32(rr_posted, cnt); */
|
|
/* return OMPI_SUCCESS; */
|
|
/* } */
|
|
|
|
/* static inline int mca_btl_mvapi_endpoint_post_rr( mca_btl_mvapi_endpoint_t * endpoint, int additional){ */
|
|
/* mca_btl_mvapi_module_t * mvapi_btl = endpoint->endpoint_btl; */
|
|
/* int rc; */
|
|
/* OPAL_THREAD_LOCK(&endpoint->ib_lock); */
|
|
|
|
/* if(endpoint->rr_posted_high <= mca_btl_mvapi_component.ib_rr_buf_min+additional && endpoint->rr_posted_high < mca_btl_mvapi_component.ib_rr_buf_max){ */
|
|
|
|
/* rc = mca_btl_mvapi_endpoint_post_rr_sub(mca_btl_mvapi_component.ib_rr_buf_max - endpoint->rr_posted_high, */
|
|
/* endpoint, */
|
|
/* &mvapi_btl->recv_free_eager, */
|
|
/* &endpoint->rr_posted_high, */
|
|
/* mvapi_btl->nic, */
|
|
/* endpoint->lcl_qp_hndl_high */
|
|
/* ); */
|
|
/* if(rc != OMPI_SUCCESS){ */
|
|
/* OPAL_THREAD_UNLOCK(&mvapi_btl->ib_lock); */
|
|
/* return rc; */
|
|
/* } */
|
|
/* } */
|
|
/* if(endpoint->rr_posted_low <= mca_btl_mvapi_component.ib_rr_buf_min+additional && endpoint->rr_posted_low < mca_btl_mvapi_component.ib_rr_buf_max){ */
|
|
|
|
/* rc = mca_btl_mvapi_endpoint_post_rr_sub(mca_btl_mvapi_component.ib_rr_buf_max - endpoint->rr_posted_low, */
|
|
/* endpoint, */
|
|
/* &mvapi_btl->recv_free_max, */
|
|
/* &endpoint->rr_posted_low, */
|
|
/* mvapi_btl->nic, */
|
|
/* endpoint->lcl_qp_hndl_low */
|
|
/* ); */
|
|
/* if(rc != OMPI_SUCCESS) { */
|
|
/* OPAL_THREAD_UNLOCK(&mvapi_btl->ib_lock); */
|
|
/* return rc; */
|
|
/* } */
|
|
|
|
/* } */
|
|
/* OPAL_THREAD_UNLOCK(&mvapi_btl->ib_lock); */
|
|
/* return OMPI_SUCCESS; */
|
|
|
|
|
|
/* } */
|
|
|
|
|
|
#if defined(c_plusplus) || defined(__cplusplus)
|
|
}
|
|
#endif
|
|
#endif
|