Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
/**
  Copyright (c) 2011 Mellanox Technologies. All rights reserved.
  $COPYRIGHT$

  Additional copyrights may follow

  $HEADER$
 */
|
|
|
|
|
|
|
|
#ifndef MCA_COLL_FCA_H
|
|
|
|
#define MCA_COLL_FCA_H
|
|
|
|
|
|
|
|
#include "ompi_config.h"
|
|
|
|
|
|
|
|
#include "mpi.h"
|
|
|
|
#include "opal/mca/mca.h"
|
2014-05-17 23:49:43 +04:00
|
|
|
#include "opal/memoryhooks/memory.h"
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
#include "ompi/mca/coll/coll.h"
|
|
|
|
#include "ompi/request/request.h"
|
|
|
|
#include "ompi/mca/pml/pml.h"
|
|
|
|
#include "ompi/mca/coll/base/coll_tags.h"
|
|
|
|
#include "ompi/communicator/communicator.h"
|
2014-01-09 15:27:24 +04:00
|
|
|
#include "ompi/attribute/attribute.h"
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
#include "ompi/op/op.h"
|
|
|
|
|
|
|
|
#include "orte/runtime/orte_globals.h"
|
|
|
|
|
|
|
|
#include "hcoll_api.h"
|
|
|
|
#include "hcoll_constants.h"
|
|
|
|
|
|
|
|
|
|
|
|
#include "coll_hcoll_debug.h"
|
2014-05-17 23:49:43 +04:00
|
|
|
/*
 * Fallback definition, used only when the included hcoll headers do not
 * already provide HCOLL_VERSION.  Packs a (major, minor) pair into a single
 * integer by shifting each part by HCOLL_MAJOR_BIT / HCOLL_MINOR_BIT, which
 * must be defined elsewhere (presumably by hcoll_api.h or hcoll_constants.h
 * -- confirm).
 */
#ifndef HCOLL_VERSION
#define HCOLL_VERSION(major, minor) (((major)<<HCOLL_MAJOR_BIT)|((minor)<<HCOLL_MINOR_BIT))
#endif
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
BEGIN_C_DECLS
|
|
|
|
|
|
|
|
|
|
|
|
/**
 * Globally exported structure.
 *
 * A table of function pointers; an instance is embedded in the component
 * structure as its hcoll_ops member.
 * NOTE(review): the members are presumably bound to the corresponding
 * libhcoll entry points -- confirm against the code that fills the table.
 */
typedef struct mca_coll_hcoll_ops_t {
    /** No arguments; returns an int status. */
    int (*hcoll_init) (void);
    /** No arguments; returns an int status. */
    int (*hcoll_finalize) (void);
    /** Takes an opaque pointer and returns an opaque context pointer. */
    void * (*create_hcoll_context)(void *);
    /** Takes an opaque pointer (presumably an hcoll context -- confirm). */
    int (*hcoll_barrier)(void *);
} mca_coll_hcoll_ops_t;
|
|
|
|
|
2013-10-02 17:38:47 +04:00
|
|
|
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
struct mca_coll_hcoll_component_t {
|
|
|
|
/** Base coll component */
|
|
|
|
mca_coll_base_component_2_0_0_t super;
|
|
|
|
|
|
|
|
/** MCA parameter: Priority of this component */
|
|
|
|
int hcoll_priority;
|
|
|
|
|
|
|
|
/** MCA parameter: Verbose level of this component */
|
|
|
|
int hcoll_verbose;
|
|
|
|
|
|
|
|
/** MCA parameter: Enable FCA */
|
|
|
|
int hcoll_enable;
|
|
|
|
|
2014-06-26 22:14:41 +04:00
|
|
|
/** r/o MCA parameter: libhcoll compiletime version */
|
|
|
|
char* compiletime_version;
|
|
|
|
|
|
|
|
/** r/o MCA parameter: libhcoll runtime version */
|
|
|
|
const char* runtime_version;
|
|
|
|
|
2014-01-21 16:19:47 +04:00
|
|
|
/** MCA parameter: Minimal number of processes in the communicator
|
|
|
|
for the corresponding hcoll context to be created */
|
|
|
|
int hcoll_np;
|
|
|
|
|
|
|
|
/** Whether or not hcoll_init was ever called */
|
|
|
|
bool libhcoll_initialized;
|
|
|
|
|
2014-05-17 23:49:43 +04:00
|
|
|
bool using_mem_hooks;
|
|
|
|
|
2013-12-04 00:21:40 +04:00
|
|
|
/** MCA parameter: ON/OFF user defined datatype through HCOLL */
|
|
|
|
int hcoll_datatype_fallback;
|
|
|
|
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
/* FCA global stuff */
|
|
|
|
mca_coll_hcoll_ops_t hcoll_ops;
|
2015-02-19 23:41:41 +03:00
|
|
|
opal_free_list_t requests;
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
};
|
|
|
|
typedef struct mca_coll_hcoll_component_t mca_coll_hcoll_component_t;
|
|
|
|
|
|
|
|
OMPI_MODULE_DECLSPEC extern mca_coll_hcoll_component_t mca_coll_hcoll_component;
|
|
|
|
|
|
|
|
|
2013-12-04 00:21:40 +04:00
|
|
|
|
|
|
|
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
/**
|
|
|
|
* FCA enabled communicator
|
|
|
|
*/
|
|
|
|
struct mca_coll_hcoll_module_t {
|
|
|
|
mca_coll_base_module_t super;
|
|
|
|
|
2013-12-04 00:21:40 +04:00
|
|
|
ompi_communicator_t *comm;
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
int rank;
|
|
|
|
void *hcoll_context;
|
|
|
|
/* Saved handlers - for fallback */
|
|
|
|
mca_coll_base_module_reduce_fn_t previous_reduce;
|
|
|
|
mca_coll_base_module_t *previous_reduce_module;
|
|
|
|
mca_coll_base_module_allreduce_fn_t previous_allreduce;
|
|
|
|
mca_coll_base_module_t *previous_allreduce_module;
|
|
|
|
mca_coll_base_module_bcast_fn_t previous_bcast;
|
|
|
|
mca_coll_base_module_t *previous_bcast_module;
|
|
|
|
mca_coll_base_module_barrier_fn_t previous_barrier;
|
|
|
|
mca_coll_base_module_t *previous_barrier_module;
|
|
|
|
mca_coll_base_module_allgather_fn_t previous_allgather;
|
|
|
|
mca_coll_base_module_t *previous_allgather_module;
|
|
|
|
mca_coll_base_module_allgatherv_fn_t previous_allgatherv;
|
|
|
|
mca_coll_base_module_t *previous_allgatherv_module;
|
|
|
|
mca_coll_base_module_alltoall_fn_t previous_alltoall;
|
|
|
|
mca_coll_base_module_t *previous_alltoall_module;
|
|
|
|
mca_coll_base_module_alltoallv_fn_t previous_alltoallv;
|
|
|
|
mca_coll_base_module_t *previous_alltoallv_module;
|
|
|
|
mca_coll_base_module_alltoallw_fn_t previous_alltoallw;
|
|
|
|
mca_coll_base_module_t *previous_alltoallw_module;
|
|
|
|
mca_coll_base_module_gather_fn_t previous_gather;
|
|
|
|
mca_coll_base_module_t *previous_gather_module;
|
|
|
|
mca_coll_base_module_gatherv_fn_t previous_gatherv;
|
|
|
|
mca_coll_base_module_t *previous_gatherv_module;
|
|
|
|
mca_coll_base_module_reduce_scatter_fn_t previous_reduce_scatter;
|
|
|
|
mca_coll_base_module_t *previous_reduce_scatter_module;
|
2013-09-25 20:14:59 +04:00
|
|
|
mca_coll_base_module_ibcast_fn_t previous_ibcast;
|
|
|
|
mca_coll_base_module_t *previous_ibcast_module;
|
|
|
|
mca_coll_base_module_ibarrier_fn_t previous_ibarrier;
|
|
|
|
mca_coll_base_module_t *previous_ibarrier_module;
|
|
|
|
mca_coll_base_module_iallgather_fn_t previous_iallgather;
|
|
|
|
mca_coll_base_module_t *previous_iallgather_module;
|
|
|
|
mca_coll_base_module_iallreduce_fn_t previous_iallreduce;
|
|
|
|
mca_coll_base_module_t *previous_iallreduce_module;
|
2014-06-26 22:14:41 +04:00
|
|
|
mca_coll_base_module_igatherv_fn_t previous_igatherv;
|
|
|
|
mca_coll_base_module_t *previous_igatherv_module;
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
};
|
|
|
|
typedef struct mca_coll_hcoll_module_t mca_coll_hcoll_module_t;
|
|
|
|
|
|
|
|
OBJ_CLASS_DECLARATION(mca_coll_hcoll_module_t);
|
|
|
|
|
|
|
|
|
2013-12-04 00:21:40 +04:00
|
|
|
|
|
|
|
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
/* API functions */
|
|
|
|
/* Component init query.  Receives two flags telling whether progress threads
 * and MPI threads are enabled; returns an int status (presumably an OMPI
 * error code -- confirm against the definition). */
int mca_coll_hcoll_init_query(bool enable_progress_threads, bool enable_mpi_threads);
|
|
|
|
/* Per-communicator query.  Takes the communicator and an int pointer named
 * priority (presumably an out parameter -- confirm) and returns a pointer to
 * a coll base module. */
mca_coll_base_module_t *mca_coll_hcoll_comm_query(struct ompi_communicator_t *comm, int *priority);
|
|
|
|
/* NOTE(review): presumably sets up access to libhcoll and returns a status
 * code; the behaviour is not visible from this header -- confirm. */
int mca_coll_hcoll_get_lib(void);
|
|
|
|
/* NOTE(review): presumably installs the run-time-environment callbacks that
 * hcoll uses; the behaviour is not visible from this header -- confirm. */
void hcoll_rte_fns_setup(void);
|
|
|
|
|
|
|
|
|
|
|
|
int mca_coll_hcoll_barrier(struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
|
|
|
int mca_coll_hcoll_bcast(void *buff, int count,
|
|
|
|
struct ompi_datatype_t *datatype, int root,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
|
|
|
int mca_coll_hcoll_allgather(void *sbuf, int scount,
|
|
|
|
struct ompi_datatype_t *sdtype,
|
|
|
|
void *rbuf, int rcount,
|
|
|
|
struct ompi_datatype_t *rdtype,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
2013-12-04 00:21:40 +04:00
|
|
|
int mca_coll_hcoll_gather(void *sbuf, int scount,
|
|
|
|
struct ompi_datatype_t *sdtype,
|
|
|
|
void *rbuf, int rcount,
|
|
|
|
struct ompi_datatype_t *rdtype,
|
|
|
|
int root,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
int mca_coll_hcoll_allreduce(void *sbuf, void *rbuf, int count,
|
|
|
|
struct ompi_datatype_t *dtype,
|
|
|
|
struct ompi_op_t *op,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
|
|
|
int mca_coll_hcoll_alltoall(void *sbuf, int scount,
|
|
|
|
struct ompi_datatype_t *sdtype,
|
|
|
|
void* rbuf, int rcount,
|
|
|
|
struct ompi_datatype_t *rdtype,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
2014-06-26 22:14:41 +04:00
|
|
|
int mca_coll_hcoll_gatherv(void* sbuf, int scount,
|
|
|
|
struct ompi_datatype_t *sdtype,
|
|
|
|
void* rbuf, int *rcounts, int *displs,
|
|
|
|
struct ompi_datatype_t *rdtype,
|
|
|
|
int root,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
2013-09-25 20:14:59 +04:00
|
|
|
int mca_coll_hcoll_ibarrier(struct ompi_communicator_t *comm,
|
|
|
|
ompi_request_t** request,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
|
|
|
int mca_coll_hcoll_ibcast(void *buff, int count,
|
|
|
|
struct ompi_datatype_t *datatype, int root,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
ompi_request_t** request,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
|
|
|
int mca_coll_hcoll_iallgather(void *sbuf, int scount,
|
|
|
|
struct ompi_datatype_t *sdtype,
|
|
|
|
void *rbuf, int rcount,
|
|
|
|
struct ompi_datatype_t *rdtype,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
ompi_request_t** request,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
|
|
|
int mca_coll_hcoll_iallreduce(void *sbuf, void *rbuf, int count,
|
|
|
|
struct ompi_datatype_t *dtype,
|
|
|
|
struct ompi_op_t *op,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
ompi_request_t** request,
|
|
|
|
mca_coll_base_module_t *module);
|
2014-06-26 22:14:41 +04:00
|
|
|
|
|
|
|
int mca_coll_hcoll_igatherv(void* sbuf, int scount,
|
|
|
|
struct ompi_datatype_t *sdtype,
|
|
|
|
void* rbuf, int *rcounts, int *displs,
|
|
|
|
struct ompi_datatype_t *rdtype,
|
|
|
|
int root,
|
|
|
|
struct ompi_communicator_t *comm,
|
|
|
|
ompi_request_t ** request,
|
|
|
|
mca_coll_base_module_t *module);
|
|
|
|
|
2013-12-04 00:21:40 +04:00
|
|
|
/* Progress function of the component; takes no arguments and returns an int.
 * NOTE(review): presumably registered as a progress callback and used to
 * drive outstanding hcoll operations -- confirm. */
int mca_coll_hcoll_progress(void);
|
2014-05-17 23:49:43 +04:00
|
|
|
/* Memory-release callback.  Receives the buffer address and length, an
 * opaque callback-data pointer, and a from_alloc flag.
 * NOTE(review): presumably registered through the opal memory hooks
 * (opal/memoryhooks/memory.h is included by this header) -- confirm. */
void mca_coll_hcoll_mem_release_cb(void *buf, size_t length, void *cbdata, bool from_alloc);
|
Per the details and schedule outlined in the attached RFC, Mellanox Technologies would like to CMR the new 'coll/hcoll' component. This component enables Mellanox Technologies' latest HPC middleware offering - 'Hcoll'. 'Hcoll' is a high-performance, standalone collectives library with support for truly asynchronous, non-blocking, hierarchical collectives via hardware offload on supporting Mellanox HCAs (ConnectX-3 and above.) To build the component, libhcoll must first be installed on your system, then you must configure OMPI with the configure flag: '--with-hcoll=/path/to/libhcoll'. Subsequent to installing, you may select the 'coll/hcoll' component at runtime as you would any other coll component, e.g. '-mca coll hcoll,tuned,libnbc'. This has been reviewed by Josh Ladd and should be added to cmr:v1.7:reviewer=jladd
This commit was SVN r28694.
2013-07-02 02:39:43 +04:00
|
|
|
END_C_DECLS
|
|
|
|
|
|
|
|
#endif
|