/*
 * Source revision: f63d6da6d7
 *
 * - added signed datatypes for atomic_add calls
 * - added unsigned datatypes for atomic put/inc/get/fetch calls
 * - fixed incorrect SHMEM_CTX_DEFAULT macro, added external declaration of
 *   oshmem_ctx_default variable
 *
 * Signed-off-by: Sergey Oblomov <sergeyo@mellanox.com>
 *
 * 182 lines, 8.8 KiB, C
 */
/*
 * Copyright (c) 2013 Mellanox Technologies, Inc.
 * All rights reserved.
 * $COPYRIGHT$
 *
 * Additional copyrights may follow
 *
 * $HEADER$
 */
#include "oshmem_config.h"

#include <stddef.h>

#include "oshmem/constants.h"
#include "oshmem/include/shmem.h"

#include "oshmem/runtime/runtime.h"

#include "oshmem/mca/spml/spml.h"

/*
 * These routines copy strided data from the local PE to a strided data object on the destination PE.
 * The shmem_iput() routines read the elements of a local array (source) and write them to
 * a remote array (target) on the PE indicated by pe. These routines return when the data has
 * been copied out of the source array on the local PE but not necessarily before the data has
 * been delivered to the remote data object.
 */
/*
 * DO_SHMEM_TYPE_IPUT - body shared by the typed strided put entry points.
 *
 * Issues one SPML put of sizeof(type) bytes per element: element i is read
 * from source + i * sst and handed to the put with target + i * tst as the
 * destination address on PE pe. Strides are counted in elements of `type`.
 *
 * ctx     - communication context passed through to the SPML put
 * type    - C element type; fixes the size of each transfer
 * target  - pointer to the first destination element
 *           (validated with RUNTIME_CHECK_ADDR)
 * source  - pointer to the first local source element
 * tst/sst - target / source stride, in elements
 * nelems  - number of elements to transfer
 * pe      - destination PE (validated with RUNTIME_CHECK_PE)
 *
 * The element index is converted to ptrdiff_t before it is multiplied by a
 * stride, so a negative stride produces a negative offset rather than an
 * unsigned wrap-around. Every put is still issued after a failure; the first
 * non-success return code is the one handed to RUNTIME_CHECK_RC, so a later
 * successful put can no longer hide an earlier error.
 */
#define DO_SHMEM_TYPE_IPUT(ctx, type, target, source, tst, sst, nelems, pe) do { \
        int rc = OSHMEM_SUCCESS;                                            \
        size_t element_size = sizeof(type);                                 \
        size_t i = 0;                                                       \
                                                                            \
        RUNTIME_CHECK_INIT();                                               \
        RUNTIME_CHECK_PE(pe);                                               \
        RUNTIME_CHECK_ADDR(target);                                         \
                                                                            \
        for (i = 0; i < (nelems); i++)                                      \
        {                                                                   \
            int put_rc = MCA_SPML_CALL(put(                                 \
                (ctx),                                                      \
                (void*)((target) + (ptrdiff_t)i * (tst)),                   \
                element_size,                                               \
                (void*)((source) + (ptrdiff_t)i * (sst)),                   \
                (pe)));                                                     \
            if (OSHMEM_SUCCESS == rc)                                       \
            {                                                               \
                rc = put_rc;                                                \
            }                                                               \
        }                                                                   \
        RUNTIME_CHECK_RC(rc);                                               \
    } while (0)
/*
 * Generates the context-aware typed strided put entry point
 * shmem_ctx<type_name>_iput(): a void function that forwards its arguments,
 * together with the element type, to DO_SHMEM_TYPE_IPUT.
 *
 * type_name - suffix pasted into the function name (e.g. _int)
 * type      - C element type of the target and source arrays
 */
#define SHMEM_CTX_TYPE_IPUT(type_name, type)                                 \
    void shmem_ctx##type_name##_iput(shmem_ctx_t ctx,                        \
                                     type *target,                           \
                                     const type *source,                     \
                                     ptrdiff_t tst,                          \
                                     ptrdiff_t sst,                          \
                                     size_t nelems,                          \
                                     int pe)                                 \
    {                                                                        \
        DO_SHMEM_TYPE_IPUT(ctx, type, target, source, tst, sst, nelems, pe); \
    }
/*
 * Generates the typed strided put entry point shmem<type_name>_iput(): a void
 * function that forwards its arguments to DO_SHMEM_TYPE_IPUT, supplying
 * oshmem_ctx_default as the context.
 *
 * type_name - suffix pasted into the function name (e.g. _int)
 * type      - C element type of the target and source arrays
 */
#define SHMEM_TYPE_IPUT(type_name, type)                                     \
    void shmem##type_name##_iput(type *target,                               \
                                 const type *source,                         \
                                 ptrdiff_t tst,                              \
                                 ptrdiff_t sst,                              \
                                 size_t nelems,                              \
                                 int pe)                                     \
    {                                                                        \
        DO_SHMEM_TYPE_IPUT(oshmem_ctx_default, type, target, source,         \
                           tst, sst, nelems, pe);                            \
    }
#if OSHMEM_PROFILING
#include "oshmem/include/pshmem.h"

/*
 * Profiling build: every public strided put symbol is declared as a weak
 * alias of its pshmem_ counterpart. The aliases are listed in pairs, the
 * context-aware variant first and the default-context variant second.
 */

/* Typed variants. */
#pragma weak shmem_ctx_char_iput       = pshmem_ctx_char_iput
#pragma weak shmem_char_iput           = pshmem_char_iput
#pragma weak shmem_ctx_short_iput      = pshmem_ctx_short_iput
#pragma weak shmem_short_iput          = pshmem_short_iput
#pragma weak shmem_ctx_int_iput        = pshmem_ctx_int_iput
#pragma weak shmem_int_iput            = pshmem_int_iput
#pragma weak shmem_ctx_long_iput       = pshmem_ctx_long_iput
#pragma weak shmem_long_iput           = pshmem_long_iput
#pragma weak shmem_ctx_longlong_iput   = pshmem_ctx_longlong_iput
#pragma weak shmem_longlong_iput       = pshmem_longlong_iput
#pragma weak shmem_ctx_schar_iput      = pshmem_ctx_schar_iput
#pragma weak shmem_schar_iput          = pshmem_schar_iput
#pragma weak shmem_ctx_uchar_iput      = pshmem_ctx_uchar_iput
#pragma weak shmem_uchar_iput          = pshmem_uchar_iput
#pragma weak shmem_ctx_ushort_iput     = pshmem_ctx_ushort_iput
#pragma weak shmem_ushort_iput         = pshmem_ushort_iput
#pragma weak shmem_ctx_uint_iput       = pshmem_ctx_uint_iput
#pragma weak shmem_uint_iput           = pshmem_uint_iput
#pragma weak shmem_ctx_ulong_iput      = pshmem_ctx_ulong_iput
#pragma weak shmem_ulong_iput          = pshmem_ulong_iput
#pragma weak shmem_ctx_ulonglong_iput  = pshmem_ctx_ulonglong_iput
#pragma weak shmem_ulonglong_iput      = pshmem_ulonglong_iput
#pragma weak shmem_ctx_float_iput      = pshmem_ctx_float_iput
#pragma weak shmem_float_iput          = pshmem_float_iput
#pragma weak shmem_ctx_double_iput     = pshmem_ctx_double_iput
#pragma weak shmem_double_iput         = pshmem_double_iput
#pragma weak shmem_ctx_longdouble_iput = pshmem_ctx_longdouble_iput
#pragma weak shmem_longdouble_iput     = pshmem_longdouble_iput

/* Fixed-width variants. */
#pragma weak shmem_ctx_iput8           = pshmem_ctx_iput8
#pragma weak shmem_iput8               = pshmem_iput8
#pragma weak shmem_ctx_iput16          = pshmem_ctx_iput16
#pragma weak shmem_iput16              = pshmem_iput16
#pragma weak shmem_ctx_iput32          = pshmem_ctx_iput32
#pragma weak shmem_iput32              = pshmem_iput32
#pragma weak shmem_ctx_iput64          = pshmem_ctx_iput64
#pragma weak shmem_iput64              = pshmem_iput64
#pragma weak shmem_ctx_iput128         = pshmem_ctx_iput128
#pragma weak shmem_iput128             = pshmem_iput128

/*
 * NOTE(review): presumably this header remaps the shmem_ names used by the
 * definitions below onto their pshmem_ counterparts - confirm against the
 * header itself.
 */
#include "oshmem/shmem/c/profile/defines.h"
#endif /* OSHMEM_PROFILING */
/*
 * Typed strided put entry points. For each element type the context-aware
 * function (shmem_ctx_<type>_iput) is generated first, followed by the
 * default-context function (shmem_<type>_iput).
 */
SHMEM_CTX_TYPE_IPUT(_char, char)
SHMEM_TYPE_IPUT(_char, char)

SHMEM_CTX_TYPE_IPUT(_short, short)
SHMEM_TYPE_IPUT(_short, short)

SHMEM_CTX_TYPE_IPUT(_int, int)
SHMEM_TYPE_IPUT(_int, int)

SHMEM_CTX_TYPE_IPUT(_long, long)
SHMEM_TYPE_IPUT(_long, long)

SHMEM_CTX_TYPE_IPUT(_longlong, long long)
SHMEM_TYPE_IPUT(_longlong, long long)

SHMEM_CTX_TYPE_IPUT(_schar, signed char)
SHMEM_TYPE_IPUT(_schar, signed char)

SHMEM_CTX_TYPE_IPUT(_uchar, unsigned char)
SHMEM_TYPE_IPUT(_uchar, unsigned char)

SHMEM_CTX_TYPE_IPUT(_ushort, unsigned short)
SHMEM_TYPE_IPUT(_ushort, unsigned short)

SHMEM_CTX_TYPE_IPUT(_uint, unsigned int)
SHMEM_TYPE_IPUT(_uint, unsigned int)

SHMEM_CTX_TYPE_IPUT(_ulong, unsigned long)
SHMEM_TYPE_IPUT(_ulong, unsigned long)

SHMEM_CTX_TYPE_IPUT(_ulonglong, unsigned long long)
SHMEM_TYPE_IPUT(_ulonglong, unsigned long long)

SHMEM_CTX_TYPE_IPUT(_float, float)
SHMEM_TYPE_IPUT(_float, float)

SHMEM_CTX_TYPE_IPUT(_double, double)
SHMEM_TYPE_IPUT(_double, double)

SHMEM_CTX_TYPE_IPUT(_longdouble, long double)
SHMEM_TYPE_IPUT(_longdouble, long double)
/*
 * DO_SHMEM_IPUTMEM - body shared by the fixed-width strided put entry points.
 *
 * Issues one SPML put of element_size bytes per element. target and source
 * are addressed as bytes: element i is read from
 * source + i * sst * element_size and handed to the put with
 * target + i * tst * element_size as the destination address on PE pe.
 *
 * ctx          - communication context passed through to the SPML put
 * target       - pointer to the first destination element
 *                (validated with RUNTIME_CHECK_ADDR)
 * source       - pointer to the first local source element
 * tst/sst      - target / source stride, in elements
 * element_size - size of one element in bytes
 * nelems       - number of elements to transfer
 * pe           - destination PE (validated with RUNTIME_CHECK_PE)
 *
 * Every macro argument is parenthesized, so an expression passed as a stride
 * or element size keeps its meaning inside the offset computation. The offset
 * is computed in ptrdiff_t so a negative stride produces a negative byte
 * offset rather than an unsigned wrap-around. Every put is still issued after
 * a failure; the first non-success return code is the one handed to
 * RUNTIME_CHECK_RC.
 */
#define DO_SHMEM_IPUTMEM(ctx, target, source, tst, sst, element_size, nelems, pe) do { \
        int rc = OSHMEM_SUCCESS;                                            \
        size_t i = 0;                                                       \
                                                                            \
        RUNTIME_CHECK_INIT();                                               \
        RUNTIME_CHECK_PE(pe);                                               \
        RUNTIME_CHECK_ADDR(target);                                         \
                                                                            \
        for (i = 0; i < (nelems); i++)                                      \
        {                                                                   \
            int put_rc = MCA_SPML_CALL(put(                                 \
                (ctx),                                                      \
                (void*)((char*)(target) +                                   \
                        (ptrdiff_t)i * (tst) * (ptrdiff_t)(element_size)),  \
                (element_size),                                             \
                (void*)((char*)(source) +                                   \
                        (ptrdiff_t)i * (sst) * (ptrdiff_t)(element_size)),  \
                (pe)));                                                     \
            if (OSHMEM_SUCCESS == rc)                                       \
            {                                                               \
                rc = put_rc;                                                \
            }                                                               \
        }                                                                   \
        RUNTIME_CHECK_RC(rc);                                               \
    } while (0)
/*
 * Generates the context-aware fixed-width strided put entry point
 * <prefix>_ctx<name>(): a void function that forwards its arguments, together
 * with the element size, to DO_SHMEM_IPUTMEM.
 *
 * name         - suffix pasted into the function name (e.g. _iput32)
 * element_size - size of one element in bytes
 * prefix       - leading part of the function name (e.g. shmem)
 */
#define SHMEM_CTX_TYPE_IPUTMEM(name, element_size, prefix)                   \
    void prefix##_ctx##name(shmem_ctx_t ctx,                                 \
                            void *target,                                    \
                            const void *source,                              \
                            ptrdiff_t tst,                                   \
                            ptrdiff_t sst,                                   \
                            size_t nelems,                                   \
                            int pe)                                          \
    {                                                                        \
        DO_SHMEM_IPUTMEM(ctx, target, source, tst, sst,                      \
                         element_size, nelems, pe);                          \
    }
/*
 * Generates the fixed-width strided put entry point <prefix><name>(): a void
 * function that forwards its arguments and the element size to
 * DO_SHMEM_IPUTMEM, supplying oshmem_ctx_default as the context.
 *
 * name         - suffix pasted into the function name (e.g. _iput32)
 * element_size - size of one element in bytes
 * prefix       - leading part of the function name (e.g. shmem)
 */
#define SHMEM_TYPE_IPUTMEM(name, element_size, prefix)                       \
    void prefix##name(void *target,                                          \
                      const void *source,                                    \
                      ptrdiff_t tst,                                         \
                      ptrdiff_t sst,                                         \
                      size_t nelems,                                         \
                      int pe)                                                \
    {                                                                        \
        DO_SHMEM_IPUTMEM(oshmem_ctx_default, target, source, tst, sst,       \
                         element_size, nelems, pe);                          \
    }
/*
 * Fixed-width strided put entry points. For each element width the
 * context-aware function (shmem_ctx_iput<bits>) is generated first, followed
 * by the default-context function (shmem_iput<bits>). The second argument is
 * the element size in bytes.
 */
SHMEM_CTX_TYPE_IPUTMEM(_iput8, 1, shmem)
SHMEM_TYPE_IPUTMEM(_iput8, 1, shmem)

SHMEM_CTX_TYPE_IPUTMEM(_iput16, 2, shmem)
SHMEM_TYPE_IPUTMEM(_iput16, 2, shmem)

SHMEM_CTX_TYPE_IPUTMEM(_iput32, 4, shmem)
SHMEM_TYPE_IPUTMEM(_iput32, 4, shmem)

SHMEM_CTX_TYPE_IPUTMEM(_iput64, 8, shmem)
SHMEM_TYPE_IPUTMEM(_iput64, 8, shmem)

SHMEM_CTX_TYPE_IPUTMEM(_iput128, 16, shmem)
SHMEM_TYPE_IPUTMEM(_iput128, 16, shmem)