
- Add support for fallback to previous coll module on non-commutative operations (#30) - Replace mutexes by atomic operations. - Use the correct nbc request type (for both ibcast and ireduce) * coll/base: document type casts in ompi_coll_base_retain_* - add module-wide topology cache - use standard instead of synchronous send and add mca parameter to control mode of initial send in ireduce/ibcast - reduce number of memory allocations - call the default request completion. - Remove the requests from the Fortran lookup conversion tables before completing and free it. Signed-off-by: George Bosilca <bosilca@icl.utk.edu> Signed-off-by: Joseph Schuchart <schuchart@hlrs.de> Co-authored-by: Joseph Schuchart <schuchart@hlrs.de>
36 строки
901 B
C
36 строки
901 B
C
/*
|
|
* Copyright (c) 2014-2020 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#ifndef MCA_COLL_ADAPT_TOPOCACHE_H
|
|
#define MCA_COLL_ADAPT_TOPOCACHE_H
|
|
|
|
#include "opal/class/opal_list.h"
|
|
#include "ompi/mca/coll/coll.h"
|
|
#include "ompi/mca/coll/base/coll_base_topo.h"
|
|
|
|
typedef struct adapt_topology_cache_item_t {
|
|
opal_list_item_t super;
|
|
ompi_coll_tree_t *tree;
|
|
int root;
|
|
int algorithm;
|
|
} adapt_topology_cache_item_t;
|
|
|
|
OBJ_CLASS_DECLARATION(adapt_topology_cache_item_t);
|
|
|
|
|
|
OMPI_DECLSPEC ompi_coll_tree_t* adapt_module_cached_topology(
|
|
mca_coll_base_module_t *module,
|
|
struct ompi_communicator_t *comm,
|
|
int root,
|
|
ompi_coll_adapt_algorithm_t algorithm);
|
|
|
|
#endif /* MCA_COLL_ADAPT_TOPOCACHE_H */
|