1
1
openmpi/oshmem/shmem/c/shmem_collect.c
Sergey Oblomov dea9cf6b63 OSHMEM: added processing of zero-length collectives
- according spec 1.4, annex C shmem collectives should process
  calls where number of elements is zero independently from pointer
  value
- added zero-count processing - it just call barrier to
  sync ranks

Signed-off-by: Sergey Oblomov <sergeyo@mellanox.com>
(cherry picked from commit 9de128afaf)
2018-11-27 14:26:44 +02:00

90 строки
3.3 KiB
C

/*
* Copyright (c) 2013-2018 Mellanox Technologies, Inc.
* All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "oshmem_config.h"
#include "oshmem/constants.h"
#include "oshmem/include/shmem.h"
#include "orte/mca/grpcomm/grpcomm.h"
#include "oshmem/runtime/runtime.h"
#include "oshmem/mca/scoll/scoll.h"
#include "oshmem/proc/proc.h"
static void _shmem_collect(void *target,
const void *source,
size_t nbytes,
int PE_start,
int logPE_stride,
int PE_size,
long *pSync,
bool nlong_type);
#define SHMEM_TYPE_COLLECT(name, element_size, nelems_type) \
void shmem##name( void *target, \
const void *source, \
size_t nelems, \
int PE_start, \
int logPE_stride, \
int PE_size, \
long *pSync) \
{ \
RUNTIME_CHECK_INIT(); \
RUNTIME_CHECK_ADDR_SIZE(target, nelems); \
RUNTIME_CHECK_ADDR_SIZE(source, nelems); \
\
_shmem_collect( target, source, nelems * element_size, \
PE_start, logPE_stride, PE_size, \
pSync, \
nelems_type); \
}
static void _shmem_collect(void *target,
const void *source,
size_t nbytes,
int PE_start,
int logPE_stride,
int PE_size,
long *pSync,
bool array_type)
{
int rc;
oshmem_group_t *group;
/* Create group basing PE_start, logPE_stride and PE_size */
group = oshmem_proc_group_create_nofail(PE_start, 1<<logPE_stride, PE_size);
/* Call collective broadcast operation */
rc = group->g_scoll.scoll_collect(group,
target,
source,
nbytes,
pSync,
array_type,
SCOLL_DEFAULT_ALG);
oshmem_proc_group_destroy(group);
RUNTIME_CHECK_RC(rc);
}
#if OSHMEM_PROFILING
#include "oshmem/include/pshmem.h"
#pragma weak shmem_collect32 = pshmem_collect32
#pragma weak shmem_collect64 = pshmem_collect64
#pragma weak shmem_fcollect32 = pshmem_fcollect32
#pragma weak shmem_fcollect64 = pshmem_fcollect64
#include "oshmem/shmem/c/profile/defines.h"
#endif
SHMEM_TYPE_COLLECT(_collect32, sizeof(uint32_t), false)
SHMEM_TYPE_COLLECT(_collect64, sizeof(uint64_t), false)
SHMEM_TYPE_COLLECT(_fcollect32, sizeof(uint32_t), true)
SHMEM_TYPE_COLLECT(_fcollect64, sizeof(uint64_t), true)