7bfac82ce7
time. UD is connectionless, and as long as peers are statically assigned to QPs, there is no reason to set up the addressing information lazily. Lots of code was axed, as endpoints no longer have state. Removed a number of other elements in the endpoint struct to make it as lightweight as possible. I was able to remove an entire function call/branch in the send path, which I believe is the main contributor to a 2us drop in NetPIPE latency. Some whitespace cleanups as well. Passes IBM test suite, and all but certain Intel tests that were failing before the change, over ob1 PML. This commit was SVN r10494.
73 строки
2.3 KiB
C
73 строки
2.3 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2006 Sandia National Laboratories. All rights
|
|
* reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#ifndef MCA_BTL_UD_PROC_H
|
|
#define MCA_BTL_UD_PROC_H
|
|
|
|
#include "orte/mca/ns/ns.h"
|
|
#include "opal/class/opal_object.h"
|
|
#include "ompi/proc/proc.h"
|
|
#include "btl_ud.h"
|
|
#include "btl_ud_endpoint.h"
|
|
|
|
#if defined(c_plusplus) || defined(__cplusplus)
|
|
extern "C" {
|
|
#endif
|
|
/* Class declaration for mca_btl_ud_proc_t.
 * NOTE(review): OBJ_CLASS_DECLARATION is presumably the OPAL object-system
 * macro from opal/class/opal_object.h that declares the class descriptor
 * for the named type -- confirm against that header. */
OBJ_CLASS_DECLARATION(mca_btl_ud_proc_t);
|
|
|
|
/**
|
|
* Represents the state of a remote process and the set of addresses
|
|
* that it exports. Also cache an instance of mca_btl_base_endpoint_t for
|
|
* each
|
|
* BTL instance that attempts to open a connection to the process.
|
|
*/
|
|
struct mca_btl_ud_proc_t {
|
|
opal_list_item_t super;
|
|
/**< allow proc to be placed on a list */
|
|
|
|
ompi_proc_t *proc_ompi;
|
|
/**< pointer to corresponding ompi_proc_t */
|
|
|
|
orte_process_name_t proc_guid;
|
|
/**< globally unique identifier for the process */
|
|
|
|
struct mca_btl_ud_addr_t* proc_addrs;
|
|
size_t proc_addr_count;
|
|
/**< number of addresses published by endpoint */
|
|
|
|
struct mca_btl_base_endpoint_t **proc_endpoints;
|
|
/**< array of endpoints that have been created to access this proc */
|
|
|
|
size_t proc_endpoint_count;
|
|
/**< number of endpoints */
|
|
|
|
opal_mutex_t proc_lock;
|
|
/**< lock to protect against concurrent access to proc state */
|
|
};
|
|
typedef struct mca_btl_ud_proc_t mca_btl_ud_proc_t;
|
|
|
|
mca_btl_ud_proc_t* mca_btl_ud_proc_create(ompi_proc_t* ompi_proc);
|
|
int mca_btl_ud_proc_insert(mca_btl_ud_proc_t*, mca_btl_base_endpoint_t*);
|
|
|
|
#if defined(c_plusplus) || defined(__cplusplus)
|
|
}
|
|
#endif
|
|
#endif
|