/* * Copyright (c) 2004-2007 The Trustees of Indiana University and Indiana * University Research and Technology * Corporation. All rights reserved. * Copyright (c) 2004-2006 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. * Copyright (c) 2008-2009 Cisco Systems, Inc. All rights reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ */ #ifndef MCA_COLL_SYNC_EXPORT_H #define MCA_COLL_SYNC_EXPORT_H #include "ompi_config.h" #include "mpi.h" #include "opal/class/opal_object.h" #include "opal/mca/mca.h" #include "ompi/constants.h" #include "ompi/mca/coll/coll.h" #include "ompi/mca/coll/base/base.h" #include "ompi/communicator/communicator.h" BEGIN_C_DECLS /* API functions */ int mca_coll_sync_init_query(bool enable_progress_threads, bool enable_mpi_threads); mca_coll_base_module_t *mca_coll_sync_comm_query(struct ompi_communicator_t *comm, int *priority); int mca_coll_sync_module_enable(mca_coll_base_module_t *module, struct ompi_communicator_t *comm); int mca_coll_sync_allgather(void *sbuf, int scount, struct ompi_datatype_t *sdtype, void *rbuf, int rcount, struct ompi_datatype_t *rdtype, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_allgatherv(void *sbuf, int scount, struct ompi_datatype_t *sdtype, void *rbuf, int *rcounts, int *disps, struct ompi_datatype_t *rdtype, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_allreduce(void *sbuf, void *rbuf, int count, struct ompi_datatype_t *dtype, struct ompi_op_t *op, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_alltoall(void *sbuf, int scount, struct ompi_datatype_t *sdtype, void *rbuf, int rcount, struct ompi_datatype_t *rdtype, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_alltoallv(void *sbuf, int *scounts, int *sdisps, struct ompi_datatype_t *sdtype, void *rbuf, int *rcounts, int *rdisps, struct ompi_datatype_t *rdtype, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_alltoallw(void *sbuf, int *scounts, int *sdisps, struct ompi_datatype_t **sdtypes, void *rbuf, int *rcounts, int *rdisps, struct ompi_datatype_t **rdtypes, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_barrier(struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_bcast(void *buff, int count, struct ompi_datatype_t *datatype, int root, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_exscan(void *sbuf, void *rbuf, int count, struct ompi_datatype_t *dtype, struct ompi_op_t *op, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_gather(void *sbuf, int scount, struct ompi_datatype_t *sdtype, void *rbuf, int rcount, struct ompi_datatype_t *rdtype, int root, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_gatherv(void *sbuf, int scount, struct ompi_datatype_t *sdtype, void *rbuf, int *rcounts, int *disps, struct ompi_datatype_t *rdtype, int root, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_reduce(void *sbuf, void *rbuf, int count, struct ompi_datatype_t *dtype, struct ompi_op_t *op, int root, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_reduce_scatter(void *sbuf, void *rbuf, int *rcounts, struct ompi_datatype_t *dtype, struct ompi_op_t *op, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_scan(void *sbuf, void *rbuf, int count, struct ompi_datatype_t *dtype, struct ompi_op_t *op, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_scatter(void *sbuf, int scount, struct ompi_datatype_t *sdtype, void *rbuf, int rcount, struct ompi_datatype_t *rdtype, int root, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_scatterv(void *sbuf, int *scounts, int *disps, struct ompi_datatype_t *sdtype, void *rbuf, int rcount, struct ompi_datatype_t *rdtype, int root, struct ompi_communicator_t *comm, mca_coll_base_module_t *module); int mca_coll_sync_ft_event(int status); /* Types */ /* Module */ typedef struct mca_coll_sync_module_t { mca_coll_base_module_t super; /* Pointers to all the "real" collective functions */ mca_coll_base_comm_coll_t c_coll; /* How many ops we've executed */ int before_num_operations; /* How many ops we've executed (it's easier to have 2) */ int after_num_operations; /* Avoid recursion of syncs */ bool in_operation; } mca_coll_sync_module_t; OBJ_CLASS_DECLARATION(mca_coll_sync_module_t); /* Component */ typedef struct mca_coll_sync_component_t { mca_coll_base_component_2_0_0_t super; /* Priority of this component */ int priority; /* Do a sync *before* each Nth collective */ int barrier_before_nops; /* Do a sync *after* each Nth collective */ int barrier_after_nops; } mca_coll_sync_component_t; /* Globally exported variables */ OMPI_MODULE_DECLSPEC extern mca_coll_sync_component_t mca_coll_sync_component; /* Macro used in most of the collectives */ #define COLL_SYNC(module, op) \ do { \ int err = MPI_SUCCESS; \ s->in_operation = true; \ if (OPAL_UNLIKELY(++s->before_num_operations == \ mca_coll_sync_component.barrier_before_nops)) { \ s->before_num_operations = 0; \ err = s->c_coll.coll_barrier(comm, s->c_coll.coll_barrier_module); \ } \ if (OPAL_LIKELY(MPI_SUCCESS == err)) { \ err = op; \ } \ if (OPAL_UNLIKELY(++s->after_num_operations == \ mca_coll_sync_component.barrier_after_nops) && \ OPAL_LIKELY(MPI_SUCCESS == err)) { \ s->after_num_operations = 0; \ err = s->c_coll.coll_barrier(comm, s->c_coll.coll_barrier_module); \ } \ s->in_operation = false; \ return err; \ } while(0) END_C_DECLS #endif /* MCA_COLL_SYNC_EXPORT_H */