2004-05-21 19:36:19 +00:00
|
|
|
/*
|
|
|
|
* $HEADER$
|
|
|
|
*/
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
#include "ompi_config.h"
|
2004-05-21 19:36:19 +00:00
|
|
|
#include <string.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include "mpi.h"
|
|
|
|
|
|
|
|
#include "communicator/communicator.h"
|
|
|
|
#include "op/op.h"
|
|
|
|
#include "proc/proc.h"
|
|
|
|
#include "include/constants.h"
|
2004-06-07 15:33:53 +00:00
|
|
|
#include "class/ompi_pointer_array.h"
|
2004-05-21 19:36:19 +00:00
|
|
|
#include "mca/pcm/pcm.h"
|
|
|
|
#include "mca/pml/pml.h"
|
|
|
|
#include "mca/coll/coll.h"
|
|
|
|
#include "mca/coll/base/base.h"
|
2004-08-05 16:31:30 +00:00
|
|
|
#include "mca/oob/oob.h"
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-08-05 16:31:30 +00:00
|
|
|
#define OMPI_COLL_TAG_ALLREDUCE 31000
|
2004-05-21 19:36:19 +00:00
|
|
|
#define OMPI_MAX_COMM 32768
|
|
|
|
|
|
|
|
/**
|
|
|
|
* These functions make sure, that we determine the global result over
|
|
|
|
* an intra communicators (simple), an inter-communicator and a
|
|
|
|
* pseudo inter-communicator described by two separate intra-comms
|
|
|
|
* and a bridge-comm (intercomm-create scenario).
|
|
|
|
*/
|
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
typedef int ompi_comm_cid_allredfct (int *inbuf, int* outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *comm,
|
2004-06-07 15:33:53 +00:00
|
|
|
ompi_communicator_t *bridgecomm,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* lleader, void* rleader,
|
|
|
|
int send_first );
|
2004-06-16 22:37:03 +00:00
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_intra (int *inbuf, int* outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *intercomm,
|
2004-06-16 22:37:03 +00:00
|
|
|
ompi_communicator_t *bridgecomm,
|
2004-08-03 22:07:45 +00:00
|
|
|
void* local_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* remote_ledaer,
|
|
|
|
int send_first );
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_inter (int *inbuf, int *outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *intercomm,
|
|
|
|
ompi_communicator_t *bridgecomm,
|
|
|
|
void* local_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* remote_leader,
|
|
|
|
int send_first );
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_intra_bridge(int *inbuf, int* outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *intercomm,
|
2004-07-15 20:55:15 +00:00
|
|
|
ompi_communicator_t *bridgecomm,
|
2004-08-03 22:07:45 +00:00
|
|
|
void* local_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* remote_leader,
|
|
|
|
int send_first);
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_intra_oob (int *inbuf, int* outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *intercomm,
|
2004-07-15 20:55:15 +00:00
|
|
|
ompi_communicator_t *bridgecomm,
|
2004-08-03 22:07:45 +00:00
|
|
|
void* local_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* remote_leader,
|
|
|
|
int send_first );
|
2004-05-21 19:36:19 +00:00
|
|
|
|
|
|
|
|
2004-06-16 15:40:52 +00:00
|
|
|
int ompi_comm_nextcid ( ompi_communicator_t* newcomm,
|
|
|
|
ompi_communicator_t* comm,
|
|
|
|
ompi_communicator_t* bridgecomm,
|
2004-06-16 22:37:03 +00:00
|
|
|
void* local_leader,
|
|
|
|
void* remote_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
int mode, int send_first )
|
2004-05-21 19:36:19 +00:00
|
|
|
{
|
|
|
|
|
|
|
|
int nextlocal_cid;
|
|
|
|
int nextcid;
|
|
|
|
int done=0;
|
|
|
|
int response=0, glresponse=0;
|
|
|
|
int flag;
|
2004-06-07 15:33:53 +00:00
|
|
|
int start=ompi_mpi_communicators.lowest_free;
|
2004-05-21 19:36:19 +00:00
|
|
|
int i;
|
|
|
|
|
|
|
|
ompi_comm_cid_allredfct* allredfnct;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Determine which implementation of allreduce we have to use
|
|
|
|
* for the current scenario
|
|
|
|
*/
|
|
|
|
switch (mode)
|
|
|
|
{
|
2004-06-16 22:37:03 +00:00
|
|
|
case OMPI_COMM_CID_INTRA:
|
2004-08-03 22:07:45 +00:00
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_intra;
|
2004-05-21 19:36:19 +00:00
|
|
|
break;
|
2004-06-16 22:37:03 +00:00
|
|
|
case OMPI_COMM_CID_INTER:
|
2004-08-03 22:07:45 +00:00
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_inter;
|
2004-05-21 19:36:19 +00:00
|
|
|
break;
|
2004-06-16 22:37:03 +00:00
|
|
|
case OMPI_COMM_CID_INTRA_BRIDGE:
|
2004-08-03 22:07:45 +00:00
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_intra_bridge;
|
2004-06-16 22:37:03 +00:00
|
|
|
break;
|
|
|
|
case OMPI_COMM_CID_INTRA_OOB:
|
2004-08-03 22:07:45 +00:00
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_intra_oob;
|
2004-06-16 22:37:03 +00:00
|
|
|
break;
|
2004-05-21 19:36:19 +00:00
|
|
|
default:
|
|
|
|
return MPI_UNDEFINED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* This is the real algorithm described in the doc
|
|
|
|
*/
|
|
|
|
while ( !done ){
|
|
|
|
for (i=start; i<OMPI_MAX_COMM ;i++) {
|
2004-08-03 22:07:45 +00:00
|
|
|
flag=ompi_pointer_array_test_and_set_item(&ompi_mpi_communicators, i, comm);
|
2004-05-21 19:36:19 +00:00
|
|
|
if (true == flag) {
|
|
|
|
nextlocal_cid = i;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
(allredfnct)(&nextlocal_cid, &nextcid, 1, MPI_MAX, comm, bridgecomm,
|
2004-08-05 16:31:30 +00:00
|
|
|
local_leader, remote_leader, send_first );
|
2004-05-21 19:36:19 +00:00
|
|
|
if (nextcid == nextlocal_cid) {
|
|
|
|
response = 1; /* fine with me */
|
|
|
|
}
|
|
|
|
else {
|
2004-08-03 22:07:45 +00:00
|
|
|
ompi_pointer_array_set_item(&ompi_mpi_communicators,
|
|
|
|
nextlocal_cid, NULL);
|
|
|
|
flag = ompi_pointer_array_test_and_set_item(&ompi_mpi_communicators,
|
2004-05-21 19:36:19 +00:00
|
|
|
nextcid, comm );
|
|
|
|
if (true == flag) {
|
|
|
|
response = 1; /* works as well */
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
response = 0; /* nope, not acceptable */
|
|
|
|
start = nextcid+1; /* that's where we can start the next round */
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
(allredfnct)(&response, &glresponse, 1, MPI_MIN, comm, bridgecomm,
|
2004-08-05 16:31:30 +00:00
|
|
|
local_leader, remote_leader, send_first );
|
2004-05-21 19:36:19 +00:00
|
|
|
if (glresponse == 1) {
|
|
|
|
done = 1; /* we are done */
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2004-06-16 15:40:52 +00:00
|
|
|
/* set the according values to the newcomm */
|
|
|
|
newcomm->c_contextid = nextcid;
|
2004-07-15 20:55:15 +00:00
|
|
|
newcomm->c_f_to_c_index = newcomm->c_contextid;
|
2004-06-16 15:40:52 +00:00
|
|
|
ompi_pointer_array_set_item (&ompi_mpi_communicators, nextcid, newcomm);
|
|
|
|
|
|
|
|
return (MPI_SUCCESS);
|
2004-05-21 19:36:19 +00:00
|
|
|
}
|
|
|
|
|
2004-08-05 16:31:30 +00:00
|
|
|
/**************************************************************************/
|
|
|
|
/**************************************************************************/
|
|
|
|
/**************************************************************************/
|
|
|
|
/* This routine serves two purposes:
|
|
|
|
* - the allreduce acts as a kind of Barrier,
|
|
|
|
* which avoids, that we have incoming fragments
|
|
|
|
* on the new communicator before everybody has set
|
|
|
|
* up the comm structure.
|
|
|
|
* - some components (e.g. the collective MagPIe component
|
|
|
|
* might want to generate new communicators and communicate
|
|
|
|
* using the new comm. Thus, it can just be called after
|
|
|
|
* the 'barrier'.
|
|
|
|
*
|
|
|
|
* The reason that this routine is in comm_cid and not in
|
|
|
|
* comm.c is, that this file contains the allreduce implementations
|
|
|
|
* which are required, and thus we avoid having duplicate code...
|
|
|
|
*/
|
|
|
|
int ompi_comm_activate ( ompi_communicator_t* newcomm,
|
|
|
|
ompi_communicator_t* comm,
|
|
|
|
ompi_communicator_t* bridgecomm,
|
|
|
|
void* local_leader,
|
|
|
|
void* remote_leader,
|
|
|
|
int mode,
|
|
|
|
int send_first,
|
|
|
|
mca_base_component_t *collcomponent )
|
|
|
|
{
|
2004-08-06 15:46:44 +00:00
|
|
|
int ok=0, gok=0;
|
2004-08-05 16:31:30 +00:00
|
|
|
ompi_comm_cid_allredfct* allredfnct;
|
|
|
|
|
|
|
|
/* Step 1: the barrier, after which it is allowed to
|
|
|
|
* send messages over the new communicator
|
|
|
|
*/
|
|
|
|
switch (mode)
|
|
|
|
{
|
|
|
|
case OMPI_COMM_CID_INTRA:
|
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_intra;
|
|
|
|
break;
|
|
|
|
case OMPI_COMM_CID_INTER:
|
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_inter;
|
|
|
|
break;
|
|
|
|
case OMPI_COMM_CID_INTRA_BRIDGE:
|
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_intra_bridge;
|
|
|
|
break;
|
|
|
|
case OMPI_COMM_CID_INTRA_OOB:
|
|
|
|
allredfnct=(ompi_comm_cid_allredfct*)ompi_comm_allreduce_intra_oob;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return MPI_UNDEFINED;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
(allredfnct)(&ok, &gok, 1, MPI_MIN, comm, bridgecomm,
|
|
|
|
local_leader, remote_leader, send_first );
|
|
|
|
|
|
|
|
|
|
|
|
/* Step 2: call all functions, which might use the new communicator
|
|
|
|
* already.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* Initialize the coll components */
|
|
|
|
/* Let the collectives components fight over who will do
|
|
|
|
collective on this new comm. */
|
|
|
|
if (OMPI_ERROR == mca_coll_base_comm_select(newcomm, collcomponent)) {
|
|
|
|
return OMPI_ERROR;
|
|
|
|
}
|
|
|
|
|
|
|
|
return OMPI_SUCCESS;
|
|
|
|
}
|
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
/**************************************************************************/
|
|
|
|
/**************************************************************************/
|
|
|
|
/**************************************************************************/
|
2004-05-21 19:36:19 +00:00
|
|
|
/* Arguments not used in this implementation:
|
2004-06-16 22:37:03 +00:00
|
|
|
* - bridgecomm
|
|
|
|
* - local_leader
|
|
|
|
* - remote_leader
|
2004-08-05 16:31:30 +00:00
|
|
|
* - send_first
|
2004-06-16 22:37:03 +00:00
|
|
|
*/
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_intra ( int *inbuf, int *outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *comm,
|
|
|
|
ompi_communicator_t *bridgecomm,
|
|
|
|
void* local_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* remote_leader,
|
|
|
|
int send_first )
|
2004-05-21 19:36:19 +00:00
|
|
|
{
|
2004-08-03 22:07:45 +00:00
|
|
|
return comm->c_coll.coll_allreduce ( inbuf, outbuf, count, MPI_INT,
|
|
|
|
op,comm );
|
2004-05-21 19:36:19 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Arguments not used in this implementation:
|
2004-06-16 22:37:03 +00:00
|
|
|
* - bridgecomm
|
|
|
|
* - local_leader
|
|
|
|
* - remote_leader
|
2004-08-05 16:31:30 +00:00
|
|
|
* - send_first
|
2004-06-16 22:37:03 +00:00
|
|
|
*/
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_inter ( int *inbuf, int *outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *intercomm,
|
|
|
|
ompi_communicator_t *bridgecomm,
|
|
|
|
void* local_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* remote_leader,
|
|
|
|
int send_first )
|
2004-05-21 19:36:19 +00:00
|
|
|
{
|
2004-08-03 22:07:45 +00:00
|
|
|
int local_rank, rsize;
|
|
|
|
int i, rc;
|
|
|
|
int *sbuf;
|
|
|
|
int *tmpbuf=NULL;
|
|
|
|
int *rcounts=NULL, scount=0;
|
|
|
|
int *rdisps=NULL;
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( &ompi_mpi_op_sum != op && &ompi_mpi_op_prod != op &&
|
|
|
|
&ompi_mpi_op_max != op && &ompi_mpi_op_min != op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
return MPI_ERR_OP;
|
|
|
|
}
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( !OMPI_COMM_IS_INTER (intercomm)) {
|
2004-05-21 19:36:19 +00:00
|
|
|
return MPI_ERR_COMM;
|
|
|
|
}
|
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
/* Allocate temporary arrays */
|
|
|
|
rsize = ompi_comm_remote_size (intercomm);
|
2004-06-07 15:33:53 +00:00
|
|
|
local_rank = ompi_comm_rank ( intercomm );
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
tmpbuf = (int *) malloc ( count * sizeof(int));
|
|
|
|
rdisps = (int *) calloc ( rsize, sizeof(int));
|
|
|
|
rcounts = (int *) calloc ( rsize, sizeof(int) );
|
|
|
|
if ( NULL == tmpbuf || NULL == rdisps || NULL == rcounts ) {
|
|
|
|
return OMPI_ERR_OUT_OF_RESOURCE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Execute the inter-allreduce: the result of our group will
|
|
|
|
be in the buffer of the remote group */
|
2004-06-29 00:02:25 +00:00
|
|
|
rc = intercomm->c_coll.coll_allreduce ( inbuf, tmpbuf, count, MPI_INT,
|
|
|
|
op, intercomm );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ( 0 == local_rank ) {
|
|
|
|
MPI_Request req;
|
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
/* for the allgatherv later */
|
|
|
|
scount = count;
|
|
|
|
|
|
|
|
/* local leader exchange their data and determine the overall result
|
|
|
|
for both groups */
|
|
|
|
rc = mca_pml.pml_irecv (outbuf, count, MPI_INT, 0,
|
2004-08-05 16:31:30 +00:00
|
|
|
OMPI_COLL_TAG_ALLREDUCE
|
|
|
|
, intercomm, &req );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
2004-08-05 16:31:30 +00:00
|
|
|
rc = mca_pml.pml_send (tmpbuf, count, MPI_INT, 0,
|
|
|
|
OMPI_COLL_TAG_ALLREDUCE,
|
2004-05-21 19:36:19 +00:00
|
|
|
MCA_PML_BASE_SEND_STANDARD, intercomm );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
2004-08-03 22:07:45 +00:00
|
|
|
rc = mca_pml.pml_wait_all ( 1, &req, MPI_STATUS_IGNORE );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( &ompi_mpi_op_max == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
if (tmpbuf[i] > outbuf[i]) outbuf[i] = tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
else if ( &ompi_mpi_op_min == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
if (tmpbuf[i] < outbuf[i]) outbuf[i] = tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
else if ( &ompi_mpi_op_sum == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
outbuf[i] += tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
else if ( &ompi_mpi_op_prod == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
outbuf[i] *= tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2004-08-03 22:07:45 +00:00
|
|
|
|
|
|
|
/* distribute the overall result to all processes in the other group.
|
|
|
|
Instead of using bcast, we are using here allgatherv, to avoid the
|
|
|
|
possible deadlock. Else, we need an algorithm to determine,
|
|
|
|
which group sends first in the inter-bcast and which receives
|
|
|
|
the result first.
|
|
|
|
*/
|
|
|
|
rcounts[0] = count;
|
|
|
|
sbuf = outbuf;
|
|
|
|
rc = intercomm->c_coll.coll_allgatherv (sbuf, scount, MPI_INT, outbuf,
|
|
|
|
rcounts, rdisps, MPI_INT,
|
|
|
|
intercomm);
|
|
|
|
|
2004-05-21 19:36:19 +00:00
|
|
|
exit:
|
|
|
|
if ( NULL != tmpbuf ) {
|
|
|
|
free ( tmpbuf );
|
|
|
|
}
|
2004-08-03 22:07:45 +00:00
|
|
|
if ( NULL != rcounts ) {
|
|
|
|
free ( rcounts );
|
|
|
|
}
|
|
|
|
if ( NULL != rdisps ) {
|
|
|
|
free ( rdisps );
|
|
|
|
}
|
|
|
|
|
2004-05-21 19:36:19 +00:00
|
|
|
return (rc);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Arguments not used in this implementation:
|
2004-08-05 16:31:30 +00:00
|
|
|
* - send_first
|
|
|
|
*/
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_intra_bridge (int *inbuf, int *outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *comm,
|
|
|
|
ompi_communicator_t *bcomm,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* lleader, void* rleader,
|
|
|
|
int send_first )
|
2004-05-21 19:36:19 +00:00
|
|
|
{
|
|
|
|
int *tmpbuf=NULL;
|
|
|
|
int local_rank;
|
|
|
|
int i;
|
|
|
|
int rc;
|
2004-06-16 22:37:03 +00:00
|
|
|
int local_leader, remote_leader;
|
|
|
|
|
|
|
|
local_leader = (*((int*)lleader));
|
|
|
|
remote_leader = (*((int*)rleader));
|
2004-05-21 19:36:19 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( &ompi_mpi_op_sum != op && &ompi_mpi_op_prod != op &&
|
|
|
|
&ompi_mpi_op_max != op && &ompi_mpi_op_min != op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
return MPI_ERR_OP;
|
|
|
|
}
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
local_rank = ompi_comm_rank ( comm );
|
2004-05-21 19:36:19 +00:00
|
|
|
tmpbuf = (int *) malloc ( count * sizeof(int));
|
|
|
|
if ( NULL == tmpbuf ) {
|
|
|
|
return MPI_ERR_INTERN;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Intercomm_create */
|
2004-06-29 00:02:25 +00:00
|
|
|
rc = comm->c_coll.coll_allreduce ( inbuf, tmpbuf, count, MPI_INT,
|
|
|
|
op, comm );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (local_rank == local_leader ) {
|
|
|
|
MPI_Request req;
|
|
|
|
|
|
|
|
rc = mca_pml.pml_irecv ( outbuf, count, MPI_INT, remote_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
OMPI_COLL_TAG_ALLREDUCE,
|
|
|
|
bcomm, &req );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
rc = mca_pml.pml_send (tmpbuf, count, MPI_INT, remote_leader,
|
2004-08-05 16:31:30 +00:00
|
|
|
OMPI_COLL_TAG_ALLREDUCE,
|
2004-08-03 22:07:45 +00:00
|
|
|
MCA_PML_BASE_SEND_STANDARD, bcomm );
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
2004-08-03 22:07:45 +00:00
|
|
|
rc = mca_pml.pml_wait_all ( 1, &req, MPI_STATUS_IGNORE);
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if ( &ompi_mpi_op_max == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
if (tmpbuf[i] > outbuf[i]) outbuf[i] = tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
else if ( &ompi_mpi_op_min == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
if (tmpbuf[i] < outbuf[i]) outbuf[i] = tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
else if ( &ompi_mpi_op_sum == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
outbuf[i] += tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
else if ( &ompi_mpi_op_prod == op ) {
|
2004-05-21 19:36:19 +00:00
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
outbuf[i] *= tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2004-08-03 22:07:45 +00:00
|
|
|
rc = comm->c_coll.coll_bcast ( outbuf, count, MPI_INT, local_leader,
|
|
|
|
comm);
|
2004-05-21 19:36:19 +00:00
|
|
|
|
|
|
|
exit:
|
|
|
|
if (NULL != tmpbuf ) {
|
|
|
|
free (tmpbuf);
|
|
|
|
}
|
|
|
|
|
|
|
|
return (rc);
|
|
|
|
}
|
|
|
|
|
2004-06-16 22:37:03 +00:00
|
|
|
/* Arguments not used in this implementation:
|
|
|
|
* - bridgecomm
|
|
|
|
*
|
2004-08-05 16:31:30 +00:00
|
|
|
* lleader is the local rank of root in comm
|
|
|
|
* rleader is the OOB contact information of the
|
|
|
|
* root processes in the other world.
|
2004-06-16 22:37:03 +00:00
|
|
|
*/
|
2004-08-03 22:07:45 +00:00
|
|
|
static int ompi_comm_allreduce_intra_oob (int *inbuf, int *outbuf,
|
|
|
|
int count, ompi_op_t *op,
|
|
|
|
ompi_communicator_t *comm,
|
2004-06-16 22:37:03 +00:00
|
|
|
ompi_communicator_t *bridgecomm,
|
2004-08-05 16:31:30 +00:00
|
|
|
void* lleader, void* rleader,
|
|
|
|
int send_first )
|
2004-06-16 22:37:03 +00:00
|
|
|
{
|
|
|
|
int *tmpbuf=NULL;
|
|
|
|
int i;
|
|
|
|
int rc;
|
2004-08-05 16:31:30 +00:00
|
|
|
int local_leader, local_rank;
|
|
|
|
ompi_process_name_t *remote_leader=NULL;
|
2004-06-16 22:37:03 +00:00
|
|
|
|
2004-08-05 16:31:30 +00:00
|
|
|
local_leader = (*((int*)lleader));
|
|
|
|
remote_leader = (ompi_process_name_t*)rleader;
|
2004-06-16 22:37:03 +00:00
|
|
|
|
|
|
|
if ( &ompi_mpi_op_sum != op && &ompi_mpi_op_prod != op &&
|
|
|
|
&ompi_mpi_op_max != op && &ompi_mpi_op_min != op ) {
|
|
|
|
return MPI_ERR_OP;
|
|
|
|
}
|
|
|
|
|
2004-08-05 16:31:30 +00:00
|
|
|
|
|
|
|
local_rank = ompi_comm_rank ( comm );
|
2004-06-16 22:37:03 +00:00
|
|
|
tmpbuf = (int *) malloc ( count * sizeof(int));
|
|
|
|
if ( NULL == tmpbuf ) {
|
|
|
|
return MPI_ERR_INTERN;
|
|
|
|
}
|
|
|
|
|
2004-08-05 16:31:30 +00:00
|
|
|
/* comm is an intra-communicator */
|
|
|
|
rc = comm->c_coll.coll_allreduce(inbuf,tmpbuf,count,MPI_INT,op, comm );
|
2004-06-16 22:37:03 +00:00
|
|
|
if ( OMPI_SUCCESS != rc ) {
|
|
|
|
goto exit;
|
|
|
|
}
|
2004-08-05 16:31:30 +00:00
|
|
|
|
2004-06-16 22:37:03 +00:00
|
|
|
if (local_rank == local_leader ) {
|
2004-08-12 22:41:42 +00:00
|
|
|
ompi_buffer_t sbuf;
|
|
|
|
ompi_buffer_t rbuf;
|
2004-08-05 16:31:30 +00:00
|
|
|
|
2004-08-12 22:41:42 +00:00
|
|
|
ompi_buffer_init(&sbuf, count * sizeof(int));
|
|
|
|
ompi_pack(sbuf, tmpbuf, count, OMPI_INT32);
|
2004-08-05 16:31:30 +00:00
|
|
|
|
2004-08-12 22:41:42 +00:00
|
|
|
if ( send_first ) {
|
|
|
|
rc = mca_oob_send_packed(remote_leader, sbuf, 0, 0);
|
|
|
|
rc = mca_oob_recv_packed (remote_leader, &rbuf, NULL);
|
2004-08-05 16:31:30 +00:00
|
|
|
}
|
|
|
|
else {
|
2004-08-12 22:41:42 +00:00
|
|
|
rc = mca_oob_recv_packed(remote_leader, &rbuf, NULL);
|
|
|
|
rc = mca_oob_send_packed(remote_leader, sbuf, 0, 0);
|
2004-08-05 16:31:30 +00:00
|
|
|
}
|
|
|
|
|
2004-08-12 22:41:42 +00:00
|
|
|
ompi_unpack(rbuf, outbuf, count, OMPI_INT32);
|
|
|
|
ompi_buffer_free(sbuf);
|
|
|
|
ompi_buffer_free(rbuf);
|
|
|
|
|
2004-06-16 22:37:03 +00:00
|
|
|
if ( &ompi_mpi_op_max == op ) {
|
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
if (tmpbuf[i] > outbuf[i]) outbuf[i] = tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if ( &ompi_mpi_op_min == op ) {
|
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
if (tmpbuf[i] < outbuf[i]) outbuf[i] = tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if ( &ompi_mpi_op_sum == op ) {
|
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
outbuf[i] += tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if ( &ompi_mpi_op_prod == op ) {
|
|
|
|
for ( i = 0 ; i < count; i++ ) {
|
|
|
|
outbuf[i] *= tmpbuf[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2004-08-05 16:31:30 +00:00
|
|
|
rc = comm->c_coll.coll_bcast (outbuf, count, MPI_INT,
|
|
|
|
local_leader, comm);
|
2004-06-16 22:37:03 +00:00
|
|
|
|
|
|
|
exit:
|
|
|
|
if (NULL != tmpbuf ) {
|
|
|
|
free (tmpbuf);
|
|
|
|
}
|
|
|
|
|
|
|
|
return (rc);
|
|
|
|
}
|