1
1
openmpi/oshmem/shmem/f77/shmem_max_to_all_f.c

126 строки
5.1 KiB
C

/*
* Copyright (c) 2013 Mellanox Technologies, Inc.
* All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "oshmem_config.h"
#include "oshmem/shmem/f77/bindings.h"
#include "oshmem/include/shmem.h"
#include "oshmem/constants.h"
#include "oshmem/mca/scoll/scoll.h"
#include "oshmem/proc/proc.h"
#include "oshmem/proc/proc_group_cache.h"
#include "oshmem/op/op.h"
OMPI_GENERATE_F77_BINDINGS (void,
SHMEM_INT4_MAX_TO_ALL,
shmem_int4_max_to_all_,
shmem_int4_max_to_all__,
shmem_int4_max_to_all_f,
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nreduce, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T *pWrk, FORTRAN_POINTER_T pSync),
(target,source,nreduce,PE_start,logPE_stride,PE_size,pWrk,pSync) )
OMPI_GENERATE_F77_BINDINGS (void,
SHMEM_INT8_MAX_TO_ALL,
shmem_int8_max_to_all_,
shmem_int8_max_to_all__,
shmem_int8_max_to_all_f,
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nreduce, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T *pWrk, FORTRAN_POINTER_T pSync),
(target,source,nreduce,PE_start,logPE_stride,PE_size,pWrk,pSync) )
OMPI_GENERATE_F77_BINDINGS (void,
SHMEM_REAL4_MAX_TO_ALL,
shmem_real4_max_to_all_,
shmem_real4_max_to_all__,
shmem_real4_max_to_all_f,
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nreduce, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T *pWrk, FORTRAN_POINTER_T pSync),
(target,source,nreduce,PE_start,logPE_stride,PE_size,pWrk,pSync) )
OMPI_GENERATE_F77_BINDINGS (void,
SHMEM_REAL8_MAX_TO_ALL,
shmem_real8_max_to_all_,
shmem_real8_max_to_all__,
shmem_real8_max_to_all_f,
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nreduce, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T *pWrk, FORTRAN_POINTER_T pSync),
(target,source,nreduce,PE_start,logPE_stride,PE_size,pWrk,pSync) )
OMPI_GENERATE_F77_BINDINGS (void,
SHMEM_REAL16_MAX_TO_ALL,
shmem_real16_max_to_all_,
shmem_real16_max_to_all__,
shmem_real16_max_to_all_f,
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nreduce, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T *pWrk, FORTRAN_POINTER_T pSync),
(target,source,nreduce,PE_start,logPE_stride,PE_size,pWrk,pSync) )
#define SHMEM_MAX_TO_ALL(F_NAME, T_NAME, OSHMEM_GROUP_CACHE_ENABLED) void F_NAME(FORTRAN_POINTER_T target, \
FORTRAN_POINTER_T source, \
MPI_Fint *nreduce,\
MPI_Fint *PE_start,\
MPI_Fint * logPE_stride,\
MPI_Fint *PE_size,\
FORTRAN_POINTER_T *pWrk,\
FORTRAN_POINTER_T pSync)\
{\
int rc = OSHMEM_SUCCESS;\
oshmem_group_t* group = NULL;\
{\
/* Create group basing PE_start, logPE_stride and PE_size */\
if (OSHMEM_GROUP_CACHE_ENABLED == 0) {\
group = oshmem_proc_group_create(OMPI_FINT_2_INT(*PE_start),\
(1 << OMPI_FINT_2_INT(*logPE_stride)),\
OMPI_FINT_2_INT(*PE_size));\
if (!group)\
rc = OSHMEM_ERROR;\
}\
else\
{\
group = find_group_in_cache(OMPI_FINT_2_INT(*PE_start),\
OMPI_FINT_2_INT(*logPE_stride),\
OMPI_FINT_2_INT(*PE_size));\
if (!group)\
{\
group = oshmem_proc_group_create(OMPI_FINT_2_INT(*PE_start),\
(1 << OMPI_FINT_2_INT(*logPE_stride)),\
OMPI_FINT_2_INT(*PE_size));\
if (!group)\
rc = OSHMEM_ERROR;\
cache_group(group,OMPI_FINT_2_INT(*PE_start),\
OMPI_FINT_2_INT(*logPE_stride),\
OMPI_FINT_2_INT(*PE_size));\
}\
}\
/* Collective operation call */\
if ( rc == OSHMEM_SUCCESS )\
{\
oshmem_op_t* op = T_NAME;\
size_t size = OMPI_FINT_2_INT(*nreduce) * op->dt_size;\
/* Call collective reduce operation */\
rc = group->g_scoll.scoll_reduce( group,\
op,\
FPTR_2_VOID_PTR(target),\
FPTR_2_VOID_PTR(source),\
size,\
FPTR_2_VOID_PTR(pSync),\
FPTR_2_VOID_PTR(*pWrk), SCOLL_DEFAULT_ALG);\
}\
if (OSHMEM_GROUP_CACHE_ENABLED == 0)\
{\
if ( rc == OSHMEM_SUCCESS )\
{\
oshmem_proc_group_destroy(group);\
}\
}\
}\
}
SHMEM_MAX_TO_ALL(shmem_int4_max_to_all_f, oshmem_op_max_fint4, OSHMEM_GROUP_CACHE_ENABLED);
SHMEM_MAX_TO_ALL(shmem_int8_max_to_all_f, oshmem_op_max_fint8, OSHMEM_GROUP_CACHE_ENABLED);
SHMEM_MAX_TO_ALL(shmem_real4_max_to_all_f, oshmem_op_max_freal4, OSHMEM_GROUP_CACHE_ENABLED);
SHMEM_MAX_TO_ALL(shmem_real8_max_to_all_f, oshmem_op_max_freal8, OSHMEM_GROUP_CACHE_ENABLED);
SHMEM_MAX_TO_ALL(shmem_real16_max_to_all_f, oshmem_op_max_freal16, OSHMEM_GROUP_CACHE_ENABLED);