366d64b7e5
As we changed the ABI (forcing a major release), we can limit the size of the predefined communicators by moving the collective structure outside the communicator. This might have a minimal, but unnoticeable, impact on performance. This approach has been discussed during the January 2017 devel meeting. Signed-off-by: George Bosilca <bosilca@icl.utk.edu> Signed-off-by: Joshua Hursey <jhursey@us.ibm.com>
184 строки
6.2 KiB
C
184 строки
6.2 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2017 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2013-2016 University of Houston. All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
|
|
#include "ompi_config.h"
|
|
#include "sharedfp_addproc.h"
|
|
|
|
#include "mpi.h"
|
|
#include "ompi/constants.h"
|
|
#include "ompi/mca/sharedfp/sharedfp.h"
|
|
#include "ompi/mca/sharedfp/base/base.h"
|
|
|
|
int mca_sharedfp_addproc_write (mca_io_ompio_file_t *fh,
|
|
const void *buf,
|
|
int count,
|
|
struct ompi_datatype_t *datatype,
|
|
ompi_status_public_t *status)
|
|
{
|
|
int ret = OMPI_SUCCESS;
|
|
OMPI_MPI_OFFSET_TYPE offset = 0;
|
|
long bytesRequested = 0;
|
|
size_t numofBytes;
|
|
struct mca_sharedfp_base_data_t *sh = NULL;
|
|
|
|
if(NULL == fh->f_sharedfp_data){
|
|
opal_output(0, "sharedfp_addproc_write: shared file pointer structure not initialized correctly\n");
|
|
return OMPI_ERROR;
|
|
}
|
|
|
|
/* Calculate the number of bytes to write*/
|
|
opal_datatype_type_size ( &datatype->super, &numofBytes);
|
|
bytesRequested = count * numofBytes;
|
|
|
|
/*Retrieve the shared file data structure */
|
|
sh = fh->f_sharedfp_data;
|
|
|
|
if ( mca_sharedfp_addproc_verbose ){
|
|
opal_output(ompi_sharedfp_base_framework.framework_output,
|
|
"sharedfp_addproc_write: sharedfp_addproc_write: Bytes Requested is %ld\n",
|
|
bytesRequested);
|
|
}
|
|
|
|
/*Request the offset to write bytesRequested bytes*/
|
|
ret = mca_sharedfp_addproc_request_position( sh, bytesRequested, &offset);
|
|
offset /= sh->sharedfh->f_etype_size;
|
|
if ( OMPI_SUCCESS == ret ) {
|
|
if ( mca_sharedfp_addproc_verbose ){
|
|
opal_output(ompi_sharedfp_base_framework.framework_output,
|
|
"sharedfp_addproc_write: Offset received is %lld\n",offset);
|
|
}
|
|
/* Write to the file */
|
|
ret = mca_common_ompio_file_write_at(sh->sharedfh,offset,buf,count,datatype,status);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
int mca_sharedfp_addproc_write_ordered (mca_io_ompio_file_t *fh,
|
|
const void *buf,
|
|
int count,
|
|
struct ompi_datatype_t *datatype,
|
|
ompi_status_public_t *status)
|
|
{
|
|
int ret = OMPI_SUCCESS;
|
|
OMPI_MPI_OFFSET_TYPE offset = 0, offsetReceived = 0;
|
|
long sendBuff = 0;
|
|
long *buff=NULL;
|
|
long offsetBuff;
|
|
long bytesRequested = 0;
|
|
int recvcnt = 1, sendcnt = 1;
|
|
size_t numofBytes;
|
|
int rank, size, i;
|
|
struct mca_sharedfp_base_data_t *sh = NULL;
|
|
|
|
if(NULL == fh->f_sharedfp_data){
|
|
opal_output(0, "sharedfp_addproc_write_ordered: shared file pointer "
|
|
"structure not initialized correctly\n");
|
|
return OMPI_ERROR;
|
|
}
|
|
|
|
/*Retrieve the shared file pointer structure*/
|
|
sh = fh->f_sharedfp_data;
|
|
|
|
/* Calculate the number of bytes to write*/
|
|
opal_datatype_type_size ( &datatype->super, &numofBytes);
|
|
sendBuff = count * numofBytes;
|
|
|
|
/* Get the ranks in the communicator */
|
|
rank = ompi_comm_rank ( sh->comm );
|
|
size = ompi_comm_size ( sh->comm );
|
|
|
|
if ( 0 == rank ) {
|
|
buff = (long*)malloc(sizeof(OMPI_MPI_OFFSET_TYPE) * size);
|
|
if ( NULL == buff )
|
|
return OMPI_ERR_OUT_OF_RESOURCE;
|
|
}
|
|
|
|
ret = sh->comm->c_coll->coll_gather ( &sendBuff, sendcnt, OMPI_OFFSET_DATATYPE, buff,
|
|
recvcnt, OMPI_OFFSET_DATATYPE, 0, sh->comm,
|
|
sh->comm->c_coll->coll_gather_module);
|
|
if( OMPI_SUCCESS != ret ){
|
|
goto exit;
|
|
}
|
|
|
|
/* All the counts are present now in the recvBuff.
|
|
The size of recvBuff is sizeof_newComm
|
|
*/
|
|
if ( 0 == rank ) {
|
|
for (i = 0; i < size ; i ++) {
|
|
bytesRequested += buff[i];
|
|
|
|
if ( mca_sharedfp_addproc_verbose ){
|
|
opal_output(ompi_sharedfp_base_framework.framework_output,
|
|
"sharedfp_addproc_write_ordered: Bytes requested are %ld\n",
|
|
bytesRequested);
|
|
}
|
|
}
|
|
|
|
/* Request the offset to write bytesRequested bytes
|
|
** only the root process needs to do the request,
|
|
** since the root process will then tell the other
|
|
** processes at what offset they should write their
|
|
** share of the data.
|
|
*/
|
|
ret = mca_sharedfp_addproc_request_position(sh,bytesRequested,&offsetReceived);
|
|
if( OMPI_SUCCESS != ret ){
|
|
goto exit;
|
|
}
|
|
if ( mca_sharedfp_addproc_verbose ){
|
|
opal_output(ompi_sharedfp_base_framework.framework_output,
|
|
"sharedfp_addproc_write_ordered: Offset received is %lld\n",
|
|
offsetReceived);
|
|
}
|
|
buff[0] += offsetReceived;
|
|
|
|
for (i = 1 ; i < size; i++) {
|
|
buff[i] += buff[i-1];
|
|
}
|
|
}
|
|
|
|
/* Scatter the results to the other processes*/
|
|
ret = sh->comm->c_coll->coll_scatter ( buff, sendcnt, OMPI_OFFSET_DATATYPE, &offsetBuff,
|
|
recvcnt, OMPI_OFFSET_DATATYPE, 0, sh->comm,
|
|
sh->comm->c_coll->coll_scatter_module );
|
|
if( OMPI_SUCCESS != ret ){
|
|
goto exit;
|
|
}
|
|
|
|
/*Each process now has its own individual offset in recvBUFF*/
|
|
offset = offsetBuff - sendBuff;
|
|
offset /= sh->sharedfh->f_etype_size;
|
|
|
|
if ( mca_sharedfp_addproc_verbose ){
|
|
opal_output(ompi_sharedfp_base_framework.framework_output,
|
|
"sharedfp_addproc_write_ordered: Offset returned is %lld\n",
|
|
offset);
|
|
}
|
|
|
|
/* write to the file */
|
|
ret = mca_common_ompio_file_write_at_all(sh->sharedfh,offset,buf,count,datatype,status);
|
|
|
|
exit:
|
|
if ( NULL != buff ) {
|
|
free ( buff );
|
|
}
|
|
return ret;
|
|
}
|