d4843b1651
Signed-off-by: Mikhail Brinskii <mikhailb@mellanox.com>
445 строки
16 KiB
C
445 строки
16 KiB
C
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
|
/*
|
|
* Copyright (c) 2013 Mellanox Technologies, Inc.
|
|
* All rights reserved.
|
|
* Copyright (c) 2014 Cisco Systems, Inc. All rights reserved.
|
|
* Copyright (c) 2015 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* Copyright (c) 2016 Research Organization for Information Science
|
|
* and Technology (RIST). All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#ifndef MCA_SPML_H
|
|
#define MCA_SPML_H
|
|
|
|
#include "oshmem_config.h"
|
|
#include "oshmem/types.h"
|
|
#include "oshmem/constants.h"
|
|
|
|
#include "opal_stdint.h"
|
|
#include "oshmem/mca/mca.h"
|
|
#include "opal/mca/btl/btl.h"
|
|
#include "oshmem/proc/proc.h"
|
|
|
|
#include "oshmem/mca/sshmem/sshmem.h"
|
|
|
|
BEGIN_C_DECLS
|
|
|
|
/*
|
|
* SPML component types
|
|
*/
|
|
|
|
/**
|
|
* MCA->PML Called by MCA framework to initialize the component.
|
|
*
|
|
* @param priority (OUT) Relative priority or ranking used by MCA to
|
|
* selected a component.
|
|
*
|
|
* @param enable_progress_threads (IN) Whether this component is
|
|
* allowed to run a hidden/progress thread or not.
|
|
*
|
|
* @param enable_mpi_threads (IN) Whether support for multiple MPI
|
|
* threads is enabled or not (i.e., MPI_THREAD_MULTIPLE), which
|
|
* indicates whether multiple threads may invoke this component
|
|
* simultaneously or not.
|
|
*/
|
|
typedef enum {
|
|
MCA_SPML_BASE_PUT_SYNCHRONOUS,
|
|
MCA_SPML_BASE_PUT_COMPLETE,
|
|
MCA_SPML_BASE_PUT_BUFFERED,
|
|
MCA_SPML_BASE_PUT_READY,
|
|
MCA_SPML_BASE_PUT_STANDARD,
|
|
MCA_SPML_BASE_PUT_SIZE
|
|
} mca_spml_base_put_mode_t;
|
|
|
|
typedef struct mca_spml_base_module_1_0_0_t * (*mca_spml_base_component_init_fn_t)(int *priority,
|
|
bool enable_progress_threads,
|
|
bool enable_mpi_threads);
|
|
|
|
typedef int (*mca_spml_base_component_finalize_fn_t)(void);
|
|
|
|
/**
|
|
* SPML component version and interface functions.
|
|
*/
|
|
struct mca_spml_base_component_2_0_0_t {
|
|
mca_base_component_t spmlm_version;
|
|
mca_base_component_data_t spmlm_data;
|
|
mca_spml_base_component_init_fn_t spmlm_init;
|
|
mca_spml_base_component_finalize_fn_t spmlm_finalize;
|
|
};
|
|
typedef struct mca_spml_base_component_2_0_0_t mca_spml_base_component_2_0_0_t;
|
|
typedef mca_spml_base_component_2_0_0_t mca_spml_base_component_t;
|
|
|
|
/**
|
|
* MCA management functions.
|
|
*/
|
|
|
|
static inline char *mca_spml_base_mkey2str(sshmem_mkey_t *mkey)
|
|
{
|
|
static char buf[64];
|
|
|
|
if (mkey->len == 0) {
|
|
snprintf(buf, sizeof(buf), "mkey: base=%p len=%d key=%" PRIu64, mkey->va_base, mkey->len, mkey->u.key);
|
|
} else {
|
|
snprintf(buf, sizeof(buf), "mkey: base=%p len=%d data=0x%p", mkey->va_base, mkey->len, mkey->u.data);
|
|
}
|
|
|
|
return buf;
|
|
}
|
|
|
|
/**
|
|
* Downcall from MCA layer to enable the PML/BTLs.
|
|
*
|
|
* @param enable Enable/Disable SPML forwarding
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_enable_fn_t)(bool enable);
|
|
|
|
/**
|
|
* Waits for an int variable to change on the local PE.
|
|
* Blocked until the variable is not equal to value.
|
|
*
|
|
* @param addr Address of the variable to pool on.
|
|
* @param value The value to pool on. Pool until the value held in addr is different than value.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_wait_fn_t)(void* addr,
|
|
int cmp,
|
|
void* value,
|
|
int datatype);
|
|
|
|
/**
|
|
* Test for an int variable to change on the local PE.
|
|
*
|
|
* @param addr Address of the variable to pool on.
|
|
* @param value The value to pool on. Pool until the value held in addr is different than value.
|
|
* @param out_value Return value to indicated if variable is equal to given cmp value.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_test_fn_t)(void* addr,
|
|
int cmp,
|
|
void* value,
|
|
int datatype,
|
|
int *out_value);
|
|
|
|
/**
|
|
* deserialize remote mkey
|
|
*
|
|
* @param mkey remote mkey
|
|
*/
|
|
typedef void (*mca_spml_base_module_mkey_unpack_fn_t)(shmem_ctx_t ctx, sshmem_mkey_t *, uint32_t segno, int remote_pe, int tr_id);
|
|
|
|
/**
|
|
* If possible, get a pointer to the remote memory described by the mkey
|
|
*
|
|
* @param dst_addr address of the symmetric variable
|
|
* @param mkey remote memory key
|
|
* @param pe remote PE
|
|
*
|
|
* @return pointer to remote memory or NULL
|
|
*/
|
|
typedef void * (*mca_spml_base_module_mkey_ptr_fn_t)(const void *dst_addr, sshmem_mkey_t *mkey, int pe);
|
|
|
|
/**
|
|
* free resources used by deserialized remote mkey
|
|
*
|
|
* @param mkey remote mkey
|
|
*/
|
|
typedef void (*mca_spml_base_module_mkey_free_fn_t)(sshmem_mkey_t *);
|
|
|
|
/**
|
|
* Register (Pinn) a buffer of 'size' bits starting in address addr
|
|
*
|
|
* @param addr base address of the registered buffer.
|
|
* @param size the size of the buffer to be registered.
|
|
* @param seg_id sysv segment id
|
|
* @param count number of internal transports (btls) that registered memory
|
|
* @return array of mkeys (one mkey per "btl") or NULL on failure
|
|
*
|
|
*/
|
|
typedef sshmem_mkey_t * (*mca_spml_base_module_register_fn_t)(void *addr,
|
|
size_t size,
|
|
uint64_t shmid,
|
|
int *count);
|
|
|
|
/**
|
|
* deregister memory pinned by register()
|
|
*/
|
|
typedef int (*mca_spml_base_module_deregister_fn_t)(sshmem_mkey_t *mkeys);
|
|
|
|
/**
|
|
* try to fill up mkeys that can be used to reach remote pe.
|
|
* @param pe remote pe
|
|
* @param seg 0 - symmetric heap, 1 - static data, everything else are static data in .so
|
|
* @param mkeys mkeys array
|
|
*
|
|
* @return OSHMEM_SUCCSESS if keys are found
|
|
*/
|
|
typedef int (*mca_spml_base_module_oob_get_mkeys_fn_t)(shmem_ctx_t ctx, int pe,
|
|
uint32_t seg,
|
|
sshmem_mkey_t *mkeys);
|
|
|
|
/**
|
|
* For each proc setup a datastructure that indicates the BTLs
|
|
* that can be used to reach the destination.
|
|
*
|
|
* @param procs A list of all procs participating in the parallel application.
|
|
* @param nprocs The number of procs in the parallel application.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*
|
|
*/
|
|
typedef int (*mca_spml_base_module_add_procs_fn_t)(ompi_proc_t** procs,
|
|
size_t nprocs);
|
|
typedef int (*mca_spml_base_module_del_procs_fn_t)(ompi_proc_t** procs,
|
|
size_t nprocs);
|
|
|
|
|
|
/**
|
|
* Create a communication context.
|
|
*
|
|
* @param options The set of options requested for the given context.
|
|
* @param ctx A handle to the newly created context.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_ctx_create_fn_t)(long options, shmem_ctx_t *ctx);
|
|
|
|
|
|
/**
|
|
* Destroy a communication context.
|
|
*
|
|
* @param ctx Handle to the context that will be destroyed.
|
|
*/
|
|
typedef void (*mca_spml_base_module_ctx_destroy_fn_t)(shmem_ctx_t ctx);
|
|
|
|
/**
|
|
* Transfer data to a remote pe.
|
|
*
|
|
* @param ctx The context object this routine is working on.
|
|
* @param dst_addr The address in the remote PE of the object being written.
|
|
* @param size The number of bytes to be written.
|
|
* @param src_addr An address on the local PE holdng the value to be written.
|
|
* @param dst The remote PE to be written to.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_put_fn_t)(shmem_ctx_t ctx,
|
|
void *dst_addr,
|
|
size_t size,
|
|
void *src_addr,
|
|
int dst);
|
|
|
|
/**
|
|
* These routines provide the means for copying contiguous data to another PE without
|
|
* blocking the caller. These routines return before the data has been delivered to the
|
|
* remote PE.
|
|
*
|
|
* @param ctx The context object this routine is working on.
|
|
* @param dst_addr The address in the remote PE of the object being written.
|
|
* @param size The number of bytes to be written.
|
|
* @param src_addr An address on the local PE holdng the value to be written.
|
|
* @param dst The remote PE to be written to.
|
|
* @param handle The address of a handle to be passed to shmem_wait_nb() or
|
|
* shmem_test_nb() to wait or poll for the completion of the transfer.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_put_nb_fn_t)(shmem_ctx_t ctx,
|
|
void *dst_addr,
|
|
size_t size,
|
|
void *src_addr,
|
|
int dst,
|
|
void **handle);
|
|
|
|
/**
|
|
* Blocking data transfer from remote PE.
|
|
* Read data from remote PE.
|
|
*
|
|
* @param ctx The context object this routine is working on.
|
|
* @param dst_addr The address on the local PE, to write the result of the get operation to.
|
|
* @param size The number of bytes to be read.
|
|
* @param src_addr The address on the remote PE, to read from.
|
|
* @param src The ID of the remote PE.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_get_fn_t)(shmem_ctx_t ctx,
|
|
void *dst_addr,
|
|
size_t size,
|
|
void *src_addr,
|
|
int src);
|
|
|
|
/**
|
|
* Non-blocking data transfer from remote PE.
|
|
* Read data from remote PE.
|
|
*
|
|
* @param ctx The context object this routine is working on.
|
|
* @param dst_addr The address on the local PE, to write the result of the get operation to.
|
|
* @param size The number of bytes to be read.
|
|
* @param src_addr The address on the remote PE, to read from.
|
|
* @param src The ID of the remote PE.
|
|
* @param handle The address of a handle to be passed to shmem_wait_nb() or
|
|
* shmem_test_nb() to wait or poll for the completion of the transfer.
|
|
* @return - OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_get_nb_fn_t)(shmem_ctx_t ctx,
|
|
void *dst_addr,
|
|
size_t size,
|
|
void *src_addr,
|
|
int src,
|
|
void **handle);
|
|
|
|
/**
|
|
* Post a receive and wait for completion.
|
|
*
|
|
* @param buf (IN) User buffer.
|
|
* @param count (IN) The number of bytes to be sent.
|
|
* @param src (IN) The ID of the remote PE.
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_recv_fn_t)(void *buf, size_t count, int src);
|
|
|
|
/**
|
|
* Post a send request and wait for completion.
|
|
*
|
|
* @param buf (IN) User buffer.
|
|
* @param count (IN) The number of bytes to be sent.
|
|
* @param dst (IN) The ID of the remote PE.
|
|
* @param mode (IN) Send mode (STANDARD,BUFFERED,SYNCHRONOUS,READY)
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_send_fn_t)(void *buf,
|
|
size_t count,
|
|
int dst,
|
|
mca_spml_base_put_mode_t mode);
|
|
|
|
/**
|
|
* The routine transfers the data asynchronously from the source PE to all
|
|
* PEs in the OpenSHMEM job. The routine returns immediately. The source and
|
|
* target buffers are reusable only after the completion of the routine.
|
|
* After the data is transferred to the target buffers, the counter object
|
|
* is updated atomically. The counter object can be read either using atomic
|
|
* operations such as shmem_atomic_fetch or can use point-to-point synchronization
|
|
* routines such as shmem_wait_until and shmem_test.
|
|
*
|
|
* Shmem_quiet may be used for completing the operation, but not required for
|
|
* progress or completion. In a multithreaded OpenSHMEM program, the user
|
|
* (the OpenSHMEM program) should ensure the correct ordering of
|
|
* shmemx_alltoall_global calls.
|
|
*
|
|
* @param dest A symmetric data object that is large enough to receive
|
|
* “size” bytes of data from each PE in the OpenSHMEM job.
|
|
* @param source A symmetric data object that contains “size” bytes of data
|
|
* for each PE in the OpenSHMEM job.
|
|
* @param size The number of bytes to be sent to each PE in the job.
|
|
* @param counter A symmetric data object to be atomically incremented after
|
|
* the target buffer is updated.
|
|
*
|
|
* @return OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_put_all_nb_fn_t)(void *dest,
|
|
const void *source,
|
|
size_t size,
|
|
long *counter);
|
|
|
|
/**
|
|
* Assures ordering of delivery of put() requests
|
|
*
|
|
* @param ctx - The context object this routine is working on.
|
|
* @return - OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_fence_fn_t)(shmem_ctx_t ctx);
|
|
|
|
/**
|
|
* Wait for completion of all outstanding put() requests
|
|
*
|
|
* @param ctx - The context object this routine is working on.
|
|
* @return - OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_quiet_fn_t)(shmem_ctx_t ctx);
|
|
|
|
/**
|
|
* Waits for completion of a non-blocking put or get issued by the calling PE.
|
|
*
|
|
* @return - OSHMEM_SUCCESS or failure status.
|
|
*/
|
|
typedef int (*mca_spml_base_module_wait_nb_fn_t)(void *);
|
|
|
|
/**
|
|
* Called by memheap when memory is allocated by shmalloc(),
|
|
* shcalloc(), shmemalign() or shrealloc()
|
|
*
|
|
* @param addr base address of the registered buffer.
|
|
* @param size the size of the buffer to be registered.
|
|
*/
|
|
typedef void (*mca_spml_base_module_memuse_hook_fn_t)(void *, size_t);
|
|
|
|
/**
|
|
* SPML instance.
|
|
*/
|
|
struct mca_spml_base_module_1_0_0_t {
|
|
|
|
mca_spml_base_module_add_procs_fn_t spml_add_procs;
|
|
mca_spml_base_module_del_procs_fn_t spml_del_procs;
|
|
|
|
mca_spml_base_module_enable_fn_t spml_enable;
|
|
mca_spml_base_module_register_fn_t spml_register;
|
|
mca_spml_base_module_deregister_fn_t spml_deregister;
|
|
mca_spml_base_module_oob_get_mkeys_fn_t spml_oob_get_mkeys;
|
|
|
|
mca_spml_base_module_ctx_create_fn_t spml_ctx_create;
|
|
mca_spml_base_module_ctx_destroy_fn_t spml_ctx_destroy;
|
|
|
|
mca_spml_base_module_put_fn_t spml_put;
|
|
mca_spml_base_module_put_nb_fn_t spml_put_nb;
|
|
mca_spml_base_module_get_fn_t spml_get;
|
|
mca_spml_base_module_get_nb_fn_t spml_get_nb;
|
|
|
|
mca_spml_base_module_recv_fn_t spml_recv;
|
|
mca_spml_base_module_send_fn_t spml_send;
|
|
|
|
mca_spml_base_module_wait_fn_t spml_wait;
|
|
mca_spml_base_module_wait_nb_fn_t spml_wait_nb;
|
|
mca_spml_base_module_test_fn_t spml_test;
|
|
mca_spml_base_module_fence_fn_t spml_fence;
|
|
mca_spml_base_module_quiet_fn_t spml_quiet;
|
|
|
|
mca_spml_base_module_mkey_unpack_fn_t spml_rmkey_unpack;
|
|
mca_spml_base_module_mkey_free_fn_t spml_rmkey_free;
|
|
mca_spml_base_module_mkey_ptr_fn_t spml_rmkey_ptr;
|
|
|
|
mca_spml_base_module_memuse_hook_fn_t spml_memuse_hook;
|
|
mca_spml_base_module_put_all_nb_fn_t spml_put_all_nb;
|
|
void *self;
|
|
};
|
|
|
|
typedef struct mca_spml_base_module_1_0_0_t mca_spml_base_module_1_0_0_t;
|
|
typedef mca_spml_base_module_1_0_0_t mca_spml_base_module_t;
|
|
|
|
/*
|
|
* Macro for use in components that are of type spml
|
|
*/
|
|
#define MCA_SPML_BASE_VERSION_2_0_0 \
|
|
OSHMEM_MCA_BASE_VERSION_2_1_0("spml", 2, 0, 0)
|
|
|
|
/*
|
|
* macro for doing direct call / call through struct
|
|
*/
|
|
#if MCA_oshmem_spml_DIRECT_CALL
|
|
|
|
#include MCA_oshmem_spml_DIRECT_CALL_HEADER
|
|
|
|
#define MCA_SPML_CALL_STAMP(a, b) mca_spml_ ## a ## _ ## b
|
|
#define MCA_SPML_CALL_EXPANDER(a, b) MCA_SPML_CALL_STAMP(a,b)
|
|
#define MCA_SPML_CALL(a) MCA_SPML_CALL_EXPANDER(MCA_oshmem_spml_DIRECT_CALL_COMPONENT, a)
|
|
|
|
#else
|
|
#define MCA_SPML_CALL(a) mca_spml.spml_ ## a
|
|
#endif
|
|
|
|
OSHMEM_DECLSPEC extern mca_spml_base_module_t mca_spml;
|
|
|
|
END_C_DECLS
|
|
#endif /* MCA_SPML_H */
|