311 строки
12 KiB
C
311 строки
12 KiB
C
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
|
/*
|
|
* Copyright (c) 2004-2008 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2007-2014 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* Copyright (c) 2014-2016 Intel, Inc. All rights reserved.
|
|
* Copyright (c) 2016 Research Organization for Information Science
|
|
* and Technology (RIST). All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
*
|
|
* RML Framework maintenence interface
|
|
*
|
|
* Interface for starting / stopping / controlling the RML framework,307
|
|
* as well as support for modifying RML datatypes.
|
|
*
|
|
* @note The only RML datatype exposed to the user is the RML tag.
|
|
* This will always be an integral value, so the only datatype support
|
|
* really required is the internal DSS functions for packing /
|
|
* unpacking / comparing tags. The user should never need to deal
|
|
* with these.
|
|
*/
|
|
|
|
#ifndef MCA_RML_BASE_H
|
|
#define MCA_RML_BASE_H
|
|
|
|
#include "orte_config.h"
|
|
|
|
#include "opal/dss/dss_types.h"
|
|
#include "orte/mca/mca.h"
|
|
#include "opal/util/timings.h"
|
|
#include "opal/class/opal_pointer_array.h"
|
|
|
|
#include "orte/runtime/orte_globals.h"
|
|
#include "orte/mca/routed/routed.h"
|
|
|
|
#include "orte/mca/rml/rml.h"
|
|
|
|
|
|
BEGIN_C_DECLS
|
|
|
|
OPAL_TIMING_DECLARE_EXT(ORTE_DECLSPEC, tm_rml)
|
|
|
|
/*
|
|
* MCA Framework
|
|
*/
|
|
ORTE_DECLSPEC extern mca_base_framework_t orte_rml_base_framework;
|
|
/* select a component */
|
|
ORTE_DECLSPEC int orte_rml_base_select(void);
|
|
|
|
/**
|
|
* Post receive to get updates regarding contact information
|
|
*
|
|
* Post a non-blocking receive (likely during orte_init()) to receive
|
|
* updated contact information from the HNP when it becomes available.
|
|
* This should be called in any process that needs such updates, and
|
|
* the receive will continue to get update callbacks until
|
|
* orte_rml_base_comm_stop() is called.
|
|
*/
|
|
ORTE_DECLSPEC void orte_rml_base_comm_start(void);
|
|
|
|
|
|
/**
|
|
* Stop receiving contact information updates
|
|
*
|
|
* Shut down the receive posted during orte_rml_base_comm_start(),
|
|
* likely during orte_finalize().
|
|
*/
|
|
ORTE_DECLSPEC void orte_rml_base_comm_stop(void);
|
|
|
|
|
|
/*
|
|
* globals that might be needed
|
|
*/
|
|
/* adding element to hold the active modules and components */
|
|
typedef struct {
|
|
opal_list_item_t super;
|
|
int pri;
|
|
orte_rml_component_t *component;
|
|
} orte_rml_base_active_t;
|
|
OBJ_CLASS_DECLARATION(orte_rml_base_active_t);
|
|
|
|
/* a global struct containing framework-level values */
|
|
typedef struct {
|
|
opal_list_t actives; /* list to hold the active components */
|
|
opal_pointer_array_t conduits; /* array to hold the open conduits */
|
|
opal_list_t posted_recvs;
|
|
opal_list_t unmatched_msgs;
|
|
int max_retries;
|
|
#if OPAL_ENABLE_TIMING
|
|
bool timing;
|
|
#endif
|
|
} orte_rml_base_t;
|
|
ORTE_DECLSPEC extern orte_rml_base_t orte_rml_base;
|
|
|
|
|
|
/* structure to send RML messages - used internally */
|
|
typedef struct {
|
|
opal_list_item_t super;
|
|
orte_process_name_t dst; // targeted recipient
|
|
orte_process_name_t origin;
|
|
int status; // returned status on send
|
|
orte_rml_tag_t tag; // targeted tag
|
|
int retries; // #times we have tried to send it
|
|
|
|
/* user's send callback functions and data */
|
|
union {
|
|
orte_rml_callback_fn_t iov;
|
|
orte_rml_buffer_callback_fn_t buffer;
|
|
} cbfunc;
|
|
void *cbdata;
|
|
|
|
/* pointer to the user's iovec array */
|
|
struct iovec *iov;
|
|
int count;
|
|
/* pointer to the user's buffer */
|
|
opal_buffer_t *buffer;
|
|
/* msg seq number */
|
|
uint32_t seq_num;
|
|
/* pointer to raw data for cross-transport
|
|
* transfers
|
|
*/
|
|
char *data;
|
|
/* routed module to be used */
|
|
char *routed;
|
|
} orte_rml_send_t;
|
|
OBJ_CLASS_DECLARATION(orte_rml_send_t);
|
|
|
|
/* define an object for transferring send requests to the event lib */
|
|
typedef struct {
|
|
opal_object_t super;
|
|
opal_event_t ev;
|
|
orte_rml_send_t send;
|
|
} orte_rml_send_request_t;
|
|
OBJ_CLASS_DECLARATION(orte_rml_send_request_t);
|
|
|
|
/* structure to recv RML messages - used internally */
|
|
typedef struct {
|
|
opal_list_item_t super;
|
|
opal_event_t ev;
|
|
orte_process_name_t sender; // sender
|
|
orte_rml_tag_t tag; // targeted tag
|
|
uint32_t seq_num; //sequence number
|
|
struct iovec iov; // the recvd data
|
|
} orte_rml_recv_t;
|
|
OBJ_CLASS_DECLARATION(orte_rml_recv_t);
|
|
|
|
typedef struct {
|
|
opal_list_item_t super;
|
|
bool buffer_data;
|
|
orte_process_name_t peer;
|
|
orte_rml_tag_t tag;
|
|
bool persistent;
|
|
union {
|
|
orte_rml_callback_fn_t iov;
|
|
orte_rml_buffer_callback_fn_t buffer;
|
|
} cbfunc;
|
|
void *cbdata;
|
|
} orte_rml_posted_recv_t;
|
|
OBJ_CLASS_DECLARATION(orte_rml_posted_recv_t);
|
|
|
|
/* define an object for transferring recv requests to the list of posted recvs */
|
|
typedef struct {
|
|
opal_object_t super;
|
|
opal_event_t ev;
|
|
bool cancel;
|
|
orte_rml_posted_recv_t *post;
|
|
} orte_rml_recv_request_t;
|
|
OBJ_CLASS_DECLARATION(orte_rml_recv_request_t);
|
|
|
|
/* define a structure for sending a message to myself */
|
|
typedef struct {
|
|
opal_object_t object;
|
|
opal_event_t ev;
|
|
orte_rml_tag_t tag;
|
|
struct iovec* iov;
|
|
int count;
|
|
opal_buffer_t *buffer;
|
|
union {
|
|
orte_rml_callback_fn_t iov;
|
|
orte_rml_buffer_callback_fn_t buffer;
|
|
} cbfunc;
|
|
void *cbdata;
|
|
} orte_self_send_xfer_t;
|
|
OBJ_CLASS_DECLARATION(orte_self_send_xfer_t);
|
|
|
|
#define ORTE_RML_POST_MESSAGE(p, t, s, b, l) \
|
|
do { \
|
|
orte_rml_recv_t *msg; \
|
|
opal_output_verbose(5, orte_rml_base_framework.framework_output, \
|
|
"%s Message posted at %s:%d", \
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME), \
|
|
__FILE__, __LINE__); \
|
|
msg = OBJ_NEW(orte_rml_recv_t); \
|
|
msg->sender.jobid = (p)->jobid; \
|
|
msg->sender.vpid = (p)->vpid; \
|
|
msg->tag = (t); \
|
|
msg->seq_num = (s); \
|
|
msg->iov.iov_base = (IOVBASE_TYPE*)(b); \
|
|
msg->iov.iov_len = (l); \
|
|
/* setup the event */ \
|
|
opal_event_set(orte_event_base, &msg->ev, -1, \
|
|
OPAL_EV_WRITE, \
|
|
orte_rml_base_process_msg, msg); \
|
|
opal_event_set_priority(&msg->ev, ORTE_MSG_PRI); \
|
|
opal_event_active(&msg->ev, OPAL_EV_WRITE, 1); \
|
|
} while(0);
|
|
|
|
#define ORTE_RML_ACTIVATE_MESSAGE(m) \
|
|
do { \
|
|
/* setup the event */ \
|
|
opal_event_set(orte_event_base, &(m)->ev, -1, \
|
|
OPAL_EV_WRITE, \
|
|
orte_rml_base_process_msg, (m)); \
|
|
opal_event_set_priority(&(m)->ev, ORTE_MSG_PRI); \
|
|
opal_event_active(&(m)->ev, OPAL_EV_WRITE, 1); \
|
|
} while(0);
|
|
|
|
#define ORTE_RML_SEND_COMPLETE(m) \
|
|
do { \
|
|
opal_output_verbose(5, orte_rml_base_framework.framework_output, \
|
|
"%s-%s Send message complete at %s:%d", \
|
|
ORTE_NAME_PRINT(ORTE_PROC_MY_NAME), \
|
|
ORTE_NAME_PRINT(&((m)->dst)), \
|
|
__FILE__, __LINE__); \
|
|
if (NULL != (m)->iov) { \
|
|
if (NULL != (m)->cbfunc.iov) { \
|
|
(m)->cbfunc.iov((m)->status, \
|
|
&((m)->dst), \
|
|
(m)->iov, (m)->count, \
|
|
(m)->tag, (m)->cbdata); \
|
|
} \
|
|
} else if (NULL != (m)->cbfunc.buffer) { \
|
|
/* non-blocking buffer send */ \
|
|
(m)->cbfunc.buffer((m)->status, &((m)->origin), \
|
|
(m)->buffer, \
|
|
(m)->tag, (m)->cbdata); \
|
|
} \
|
|
OBJ_RELEASE(m); \
|
|
}while(0);
|
|
|
|
#define ORTE_RML_INVALID_CHANNEL_NUM UINT32_MAX
|
|
/* common implementations */
|
|
ORTE_DECLSPEC void orte_rml_base_post_recv(int sd, short args, void *cbdata);
|
|
ORTE_DECLSPEC void orte_rml_base_process_msg(int fd, short flags, void *cbdata);
|
|
ORTE_DECLSPEC void orte_rml_base_complete_recv_msg (orte_rml_recv_t **recv_msg);
|
|
|
|
|
|
/* Stub API interfaces to cycle through active plugins */
|
|
char* orte_rml_API_get_contact_info(void);
|
|
void orte_rml_API_set_contact_info(const char *contact_info);
|
|
|
|
int orte_rml_API_ping(orte_rml_conduit_t conduit_id,
|
|
const char* contact_info,
|
|
const struct timeval* tv);
|
|
|
|
int orte_rml_API_send_nb(orte_rml_conduit_t conduit_id,
|
|
orte_process_name_t* peer, struct iovec* msg,
|
|
int count, orte_rml_tag_t tag,
|
|
orte_rml_callback_fn_t cbfunc, void* cbdata);
|
|
|
|
int orte_rml_API_send_buffer_nb(orte_rml_conduit_t conduit_id,
|
|
orte_process_name_t* peer,
|
|
struct opal_buffer_t* buffer,
|
|
orte_rml_tag_t tag,
|
|
orte_rml_buffer_callback_fn_t cbfunc,
|
|
void* cbdata);
|
|
|
|
void orte_rml_API_recv_nb(orte_process_name_t* peer,
|
|
orte_rml_tag_t tag,
|
|
bool persistent,
|
|
orte_rml_callback_fn_t cbfunc,
|
|
void* cbdata);
|
|
void orte_rml_API_recv_buffer_nb(orte_process_name_t* peer,
|
|
orte_rml_tag_t tag,
|
|
bool persistent,
|
|
orte_rml_buffer_callback_fn_t cbfunc,
|
|
void* cbdata);
|
|
|
|
void orte_rml_API_recv_cancel(orte_process_name_t* peer, orte_rml_tag_t tag);
|
|
|
|
void orte_rml_API_purge(orte_process_name_t *peer);
|
|
|
|
int orte_rml_API_query_transports(opal_list_t *providers);
|
|
|
|
orte_rml_conduit_t orte_rml_API_open_conduit(opal_list_t *attributes);
|
|
|
|
void orte_rml_API_close_conduit(orte_rml_conduit_t id);
|
|
|
|
char* orte_rml_API_get_routed(orte_rml_conduit_t id);
|
|
|
|
END_C_DECLS
|
|
|
|
#endif /* MCA_RML_BASE_H */
|