b3f88c4a1d
This commit was SVN r29153.
151 строка
6.1 KiB
C
151 строка
6.1 KiB
C
/*
|
|
* Copyright (c) 2013 Mellanox Technologies, Inc.
|
|
* All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "oshmem_config.h"
|
|
#include "oshmem/shmem/f77/bindings.h"
|
|
#include "oshmem/include/shmem.h"
|
|
#include "oshmem/constants.h"
|
|
#include "oshmem/mca/scoll/scoll.h"
|
|
#include "oshmem/proc/proc.h"
|
|
#include "oshmem/proc/proc_group_cache.h"
|
|
#include "oshmem/op/op.h"
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_COLLECT4,
|
|
shmem_collect4_,
|
|
shmem_collect4__,
|
|
shmem_collect4_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_COLLECT8,
|
|
shmem_collect8_,
|
|
shmem_collect8__,
|
|
shmem_collect8_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_COLLECT32,
|
|
shmem_collect32_,
|
|
shmem_collect32__,
|
|
shmem_collect32_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_COLLECT64,
|
|
shmem_collect64_,
|
|
shmem_collect64__,
|
|
shmem_collect64_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_FCOLLECT4,
|
|
shmem_fcollect4_,
|
|
shmem_fcollect4__,
|
|
shmem_fcollect4_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_FCOLLECT8,
|
|
shmem_fcollect8_,
|
|
shmem_fcollect8__,
|
|
shmem_fcollect8_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_FCOLLECT32,
|
|
shmem_fcollect32_,
|
|
shmem_fcollect32__,
|
|
shmem_fcollect32_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
OMPI_GENERATE_F77_BINDINGS (void,
|
|
SHMEM_FCOLLECT64,
|
|
shmem_fcollect64_,
|
|
shmem_fcollect64__,
|
|
shmem_fcollect64_f,
|
|
(FORTRAN_POINTER_T target, FORTRAN_POINTER_T source, MPI_Fint *nlong, MPI_Fint *PE_start, MPI_Fint * logPE_stride, MPI_Fint *PE_size, FORTRAN_POINTER_T pSync),
|
|
(target,source,nlong,PE_start,logPE_stride,PE_size,pSync) )
|
|
|
|
/*
 * SHMEM_COLLECT(F_NAME, T_NAME, OSHMEM_GROUP_CACHE_ENABLED)
 *
 * Expands to the complete definition of a Fortran collect routine:
 *
 *   void F_NAME(target, source, nlong, PE_start, logPE_stride, PE_size, pSync)
 *
 * Macro parameters:
 *   F_NAME                      name of the function to define.
 *   T_NAME                      expression yielding an oshmem_op_t *; only
 *                               its dt_size field is read, as the per-element
 *                               byte size that *nlong is multiplied by.
 *   OSHMEM_GROUP_CACHE_ENABLED  0: build a private group for this call and
 *                               destroy it before returning.
 *                               non-zero: look the group up with
 *                               find_group_in_cache() and register a newly
 *                               created group with cache_group(); the group
 *                               is not destroyed here.
 *
 * The group is described by *PE_start, a stride of (1 << *logPE_stride)
 * and *PE_size.  The generated function returns void, so neither a failed
 * group creation nor a non-success result from scoll_collect is reported
 * to the caller; on a failed group creation the collective is skipped.
 *
 * NOTE(review): *logPE_stride is not range checked; a negative value, or
 * one not smaller than the width of int, makes the shift undefined.
 * NOTE(review): scoll_collect receives `false` as its sixth argument for
 * every generated routine, the fcollect variants included -- confirm that
 * this is intended.
 */
#define SHMEM_COLLECT(F_NAME, T_NAME, OSHMEM_GROUP_CACHE_ENABLED) \
void F_NAME(FORTRAN_POINTER_T target, \
            FORTRAN_POINTER_T source, \
            MPI_Fint *nlong, \
            MPI_Fint *PE_start, \
            MPI_Fint *logPE_stride, \
            MPI_Fint *PE_size, \
            FORTRAN_POINTER_T pSync) \
{ \
    /* Convert the Fortran integers once instead of at every use. */ \
    const int pe_start = OMPI_FINT_2_INT(*PE_start); \
    const int log_stride = OMPI_FINT_2_INT(*logPE_stride); \
    const int pe_size = OMPI_FINT_2_INT(*PE_size); \
    int rc = OSHMEM_SUCCESS; \
    oshmem_group_t *group = NULL; \
    \
    /* The cache is keyed by the log2 stride, not the expanded stride. */ \
    if (OSHMEM_GROUP_CACHE_ENABLED != 0) { \
        group = find_group_in_cache(pe_start, log_stride, pe_size); \
    } \
    \
    /* Cache disabled or cache miss: build the group from scratch. */ \
    if (NULL == group) { \
        group = oshmem_proc_group_create(pe_start, (1 << log_stride), pe_size); \
        if (NULL == group) { \
            rc = OSHMEM_ERROR; \
        } else if (OSHMEM_GROUP_CACHE_ENABLED != 0) { \
            /* Only a successfully created group may enter the cache. */ \
            cache_group(group, pe_start, log_stride, pe_size); \
        } \
    } \
    \
    /* Collective operation call */ \
    if (OSHMEM_SUCCESS == rc) { \
        oshmem_op_t *op = T_NAME; \
        rc = group->g_scoll.scoll_collect(group, \
                                          FPTR_2_VOID_PTR(target), \
                                          FPTR_2_VOID_PTR(source), \
                                          OMPI_FINT_2_INT(*nlong) * op->dt_size, \
                                          FPTR_2_VOID_PTR(pSync), \
                                          false, SCOLL_DEFAULT_ALG); \
    } \
    \
    /* An uncached group belongs to this call alone; release it even when */ \
    /* the collective failed so that it is not leaked. */ \
    if ((OSHMEM_GROUP_CACHE_ENABLED == 0) && (NULL != group)) { \
        oshmem_proc_group_destroy(group); \
    } \
}
|
|
|
|
SHMEM_COLLECT(shmem_collect4_f, oshmem_op_prod_fint4, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_collect8_f, oshmem_op_prod_fint8, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_collect32_f, oshmem_op_prod_fint4, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_collect64_f, oshmem_op_prod_fint8, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_fcollect4_f, oshmem_op_prod_freal4, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_fcollect8_f, oshmem_op_prod_freal8, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_fcollect32_f, oshmem_op_prod_freal4, OSHMEM_GROUP_CACHE_ENABLED);
|
|
SHMEM_COLLECT(shmem_fcollect64_f, oshmem_op_prod_freal8, OSHMEM_GROUP_CACHE_ENABLED);
|