/*
* Repository-viewer page header (not part of the original source file):
* openmpi/src/mca/gpr/replica/gpr_replica.h
* 359 lines, 13 KiB, C
* Viewer links: Raw / Normal view / History
*/
/* -*- C -*-
*
* Copyright (c) 2004-2005 The Trustees of Indiana University.
* All rights reserved.
* Copyright (c) 2004-2005 The Trustees of the University of Tennessee.
* All rights reserved.
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2005 The Regents of the University of California.
* All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*
*/
/** @file
*/
#ifndef ORTE_GPR_REPLICA_H
#define ORTE_GPR_REPLICA_H
#include "orte_config.h"
#include <time.h>
#include "class/orte_bitmap.h"
#include "class/orte_pointer_array.h"
#include "class/orte_value_array.h"
#include "threads/mutex.h"
#include "threads/condition.h"
#include "mca/ns/ns_types.h"
#include "mca/gpr/base/base.h"
#if defined(c_plusplus) || defined(__cplusplus)
extern "C" {
#endif
/*
* typedefs and size constants needed in replica component
*/
/* JMS: This is only INT_MAX until bug 1345 is fixed, because this
value is used to set an MCA parameter, which can [currently] only
take an int. */
#define ORTE_GPR_REPLICA_MAX_SIZE INT_MAX
/* NOTE(review): presumably the default for the block_size member of
* orte_gpr_replica_globals_t - confirm against the component's open code. */
#define ORTE_GPR_REPLICA_BLOCK_SIZE 100
/* Integer tag ("itag") that stands in for a character string; the
* string/itag pairing is described by orte_gpr_replica_dict_t. */
typedef size_t orte_gpr_replica_itag_t;
/* Largest value an itag can take (itags are size_t). */
#define ORTE_GPR_REPLICA_ITAG_MAX SIZE_MAX
/*
 * Addressing-mode flags used inside the replica.
 *
 * Each flag is a distinct single bit of a uint8_t. Every expansion is
 * wrapped in parentheses so the macro is a single primary expression and
 * can be used as an operand anywhere, including directly after sizeof.
 */
typedef uint8_t orte_gpr_replica_addr_mode_t;
#define ORTE_GPR_REPLICA_AND  ((uint8_t)0x01)
#define ORTE_GPR_REPLICA_OR   ((uint8_t)0x02)
#define ORTE_GPR_REPLICA_XAND ((uint8_t)0x04)
#define ORTE_GPR_REPLICA_XOR  ((uint8_t)0x08)
#define ORTE_GPR_REPLICA_NOT  ((uint8_t)0x40)
/*
 * Action codes for trigger evaluation.
 *
 * The values are consecutive codes (0..5), not bit masks, so they must be
 * compared for equality rather than OR-ed together. Every expansion is
 * wrapped in parentheses so the macro is a single primary expression and
 * can be used as an operand anywhere, including directly after sizeof.
 */
typedef int8_t orte_gpr_replica_action_t;
#define ORTE_GPR_REPLICA_NO_ACTION      ((int8_t) 0)
#define ORTE_GPR_REPLICA_ENTRY_ADDED    ((int8_t) 1)
#define ORTE_GPR_REPLICA_ENTRY_DELETED  ((int8_t) 2)
#define ORTE_GPR_REPLICA_ENTRY_CHANGED  ((int8_t) 3)
#define ORTE_GPR_REPLICA_ENTRY_CHG_TO   ((int8_t) 4)
#define ORTE_GPR_REPLICA_ENTRY_CHG_FRM  ((int8_t) 5)
/* Component-wide state for the replica. One instance of this type,
* orte_gpr_replica_globals, is declared extern near the end of this header.
* NOTE(review): the field notes below are read off names and types only;
* confirm them against the component implementation.
*/
typedef struct {
int debug; /* presumably a debug-output switch - TODO confirm */
int isolate; /* purpose not visible in this header - TODO document */
size_t block_size; /* cf. ORTE_GPR_REPLICA_BLOCK_SIZE above */
size_t max_size; /* cf. ORTE_GPR_REPLICA_MAX_SIZE above */
ompi_mutex_t mutex; /* presumably guards the replica's shared state - confirm */
bool compound_cmd_mode; /* compound-command state; exact semantics not visible here */
bool exec_compound_cmd_mode; /* likewise - TODO document */
orte_buffer_t *compound_cmd; /* buffer associated with the compound command */
ompi_mutex_t wait_for_compound_mutex; /* mutex, condition and counter below look like a */
ompi_condition_t compound_cmd_condition; /* wait/notify group for compound commands - confirm */
int compound_cmd_waiting;
orte_pointer_array_t *srch_cptr; /* names suggest search scratch arrays for */
orte_pointer_array_t *srch_ival; /* containers (cptr) and itagvals (ival) - confirm */
orte_pointer_array_t *acted_upon; /* presumably holds orte_gpr_replica_action_taken_t - confirm */
orte_bitmap_t srch_itag; /* name suggests an itag search bitmap - confirm */
} orte_gpr_replica_globals_t;
/** Dictionary of string-itag pairs.
* All calls to registry functions pass character strings for programming clarity - the
* replica_dict structure is used to translate those strings into an integer itag value,
* thus allowing for faster searches of the registry.
*
* NOTE(review): this comment used to describe a linked list of pairs, but the structure
* carries no list linkage; the segment structure (orte_gpr_replica_segment_t) holds its
* dictionary as a managed array of these structs.
*/
struct orte_gpr_replica_dict_t {
char *entry; /**< Char string that defines the itag */
orte_gpr_replica_itag_t itag; /**< Numerical value assigned by registry to represent string */
};
typedef struct orte_gpr_replica_dict_t orte_gpr_replica_dict_t;
/*
* Registry "head"
* The registry "head" contains:
*
* (1) a managed array of pointers to segment objects.
*
* (2) a managed array of pointers to triggers acting on the entire registry
*
* (3) a list of callbacks to be processed
*
* One instance of this type, orte_gpr_replica, is declared extern near the
* end of this header.
*
* NOTE(review): the previous version of this comment also listed "the next
* available itag for the segment dictionary"; no such member is declared here.
*/
struct orte_gpr_replica_t {
orte_pointer_array_t *segments; /**< Managed array of pointers to segment objects */
orte_pointer_array_t *triggers; /**< Managed array of pointers to triggers */
ompi_list_t callbacks; /**< List of callbacks to be processed */
};
typedef struct orte_gpr_replica_t orte_gpr_replica_t;
/** Registry segment definition.
* The registry is subdivided into segments, each defining a unique domain. The "universe" segment
* is automatically created to allow the exchange of information supporting universe-level functions.
* Similarly, a segment is automatically created for each MPI CommWorld within the universe - the
* name for that segment is stored in each CommWorld's ompi_system_info structure so program
* elements within that CommWorld can access it. The segment structure serves as the "head" of the
* registry elements for that segment. Each segment also holds its own token-itag dictionary
* to avoid naming conflicts between tokens from CommWorlds sharing a given universe.
*
* NOTE(review): earlier wording called this the head of a "linked list"; as declared here both
* the dictionary and the containers are held in managed pointer arrays.
*/
struct orte_gpr_replica_segment_t {
ompi_object_t super; /**< Make this an object */
char *name; /**< Name of the segment */
orte_gpr_replica_itag_t itag; /**< itag of this segment */
orte_pointer_array_t *dict; /**< Managed array of dict structs */
orte_pointer_array_t *containers; /**< Managed array of pointers to containers on this segment */
};
typedef struct orte_gpr_replica_segment_t orte_gpr_replica_segment_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_segment_t);
/** The core registry structure.
* Each segment of the registry contains an array of registry containers, each composed
* of:
*
* (1) An object structure that allows the structure to be treated with the OBJ
* memory management system
*
* (2) The container's own location (index) in the segment's pointer array
*
* (3) An array of itags that define the container, together with its length - these are
* 1:1 correspondents with the character string tokens provided by caller
*
* (4) An array of pointers to itagval objects that actually hold the data.
*
* (5) A value array of the itags from all itagvals, used for rapid search
*
* NOTE(review): the previous version of this comment also listed "an array of indices into
* the trigger notifier array"; no such member is declared here.
*
* At this time, no security is provided on an object-level basis. Thus, all requests for an
* object are automatically granted. This may be changed at some future time by adding an
* "authorization" linked list of ID's and their access rights to this structure.
*/
struct orte_gpr_replica_container_t {
ompi_object_t super; /**< Make this an object */
size_t index; /**< Location in the pointer array */
orte_gpr_replica_itag_t *itags; /**< Array of itags that define this container */
size_t num_itags; /**< Number of itags in array */
orte_pointer_array_t *itagvals; /**< Array of itagval pointers */
orte_value_array_t itaglist; /**< Array of itags from all itagvals - used for rapid search */
};
typedef struct orte_gpr_replica_container_t orte_gpr_replica_container_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_container_t);
/* The itag-value pair for storing data entries in the registry.
* Containers (orte_gpr_replica_container_t) keep pointers to these objects
* in their itagvals array; the key is held as an itag rather than a string.
*/
typedef struct {
ompi_object_t super; /**< required for this to be an object */
size_t index; /**< index of this itagval on the container array */
orte_gpr_replica_itag_t itag; /**< itag for this value's key */
orte_data_type_t type; /**< the type of value stored */
orte_gpr_value_union_t value; /**< Actual stored value */
} orte_gpr_replica_itagval_t;
OMPI_DECLSPEC OBJ_CLASS_DECLARATION(orte_gpr_replica_itagval_t);
/* Counter descriptor: identifies one itagval by segment, container and
* itagval pointer, and carries a trigger level by value.
* NOTE(review): presumably the element type of the counters array in
* orte_gpr_replica_triggers_t, whose comment speaks of storing "the trigger
* level for each counter" - confirm against the trigger code.
*/
typedef struct {
ompi_object_t super; /**< Make this an object */
orte_gpr_replica_segment_t *seg; /**< Segment holding the counter */
orte_gpr_replica_container_t *cptr; /**< Container holding the counter */
orte_gpr_replica_itagval_t *iptr; /**< The itagval acting as the counter */
orte_gpr_replica_itagval_t trigger_level; /**< Level stored for this counter (embedded, not a pointer) */
} orte_gpr_replica_counter_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_counter_t);
/* One block of subscribed data: names a segment, the token/key tags that
* select entries on it, and the callback (plus user tag) that receives the
* data. Trigger objects (orte_gpr_replica_triggers_t) reference these through
* their subscribed_data array.
*/
typedef struct {
ompi_object_t super; /**< Makes this an object */
size_t index; /**< Index of this entry in original subscription */
/* the segment upon which this data is located */
orte_gpr_replica_segment_t *seg;
/* describe the data to be returned with the message -
* for triggers that are counting themselves (i.e., not monitoring a separate
* counter), this also describes the data to be included in the count
*/
orte_gpr_addr_mode_t addr_mode; /**< Tokens/keys addressing mode */
orte_value_array_t tokentags; /**< Array of tokens defining which containers are affected */
orte_value_array_t keytags; /**< Array of keys defining which key-value pairs are affected */
/* where this block of data goes */
orte_gpr_notify_cb_fn_t callback; /**< Function to be called for notification */
void *user_tag; /**< User-provided tag for callback function */
} orte_gpr_replica_subscribed_data_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_subscribed_data_t);
struct orte_gpr_replica_triggers_t {
ompi_object_t super; /**< Make this an object */
/* index of this trigger in the triggers array */
size_t index;
Fix a subtle bug in the registry callback system that was manifesting itself in the singleton case and (randomly) in the multiprocess case. Update the unit-test-status matrix to include priority. Add several new registry diagnostics that helped track down the above bug. M test/mca/gpr/gpr_triggers.c M test/Unit-Test-Status.xls M test/Unit-Test-Status.pdf M src/mpi/runtime/ompi_mpi_init.c M src/mca/oob/base/oob_base_xcast.c M src/mca/ns/base/ns_base_nds_env.c M src/mca/gpr/replica/api_layer/gpr_replica_dump_api.c M src/mca/gpr/replica/api_layer/gpr_replica_api.h M src/mca/gpr/replica/communications/gpr_replica_comm.h M src/mca/gpr/replica/communications/gpr_replica_remote_msg.c M src/mca/gpr/replica/communications/gpr_replica_cmd_processor.c M src/mca/gpr/replica/communications/gpr_replica_dump_cm.c M src/mca/gpr/replica/gpr_replica_component.c M src/mca/gpr/replica/gpr_replica.h M src/mca/gpr/replica/functional_layer/gpr_replica_dump_fn.c M src/mca/gpr/replica/functional_layer/gpr_replica_fn.h M src/mca/gpr/replica/functional_layer/gpr_replica_trig_ops_fn.c M src/mca/gpr/replica/functional_layer/gpr_replica_messaging_fn.c M src/mca/gpr/replica/functional_layer/gpr_replica_segment_fn.c M src/mca/gpr/proxy/gpr_proxy_dump.c M src/mca/gpr/proxy/gpr_proxy.h M src/mca/gpr/proxy/gpr_proxy_component.c M src/mca/gpr/gpr_types.h M src/mca/gpr/base/base.h M src/mca/gpr/base/unpack_api_response/gpr_base_dump_notify.c M src/mca/gpr/base/pack_api_cmd/gpr_base_pack_dump.c M src/mca/gpr/gpr.h This commit was SVN r5080.
2005-03-29 02:37:54 +04:00
/* flag that indicates this trigger is a one-shot, has fired and
* now should be cleaned up
*/
bool one_shot_fired;
/* the action that causes a notification message to be sent out */
orte_gpr_notify_action_t action;
/* to whom the notification messages go - set to NULL if local */
orte_process_name_t *requestor; /**< Name of requesting process */
/* remote idtag associated with this subscription -
* set to ORTE_GPR_NOTIFY_ID_MAX if local
*/
orte_gpr_notify_id_t remote_idtag; /**< Remote ID tag of subscription */
/* a pointer to the data belonging to this subscription. Each subscribed data
* object describes a set of data to be returned whenever this subscription
* fires. for subscriptions that do not involve trigger events, these objects
* describe the data being monitored
*/
size_t num_subscribed_data;
orte_pointer_array_t *subscribed_data;
/* for triggers, store a pointer to the counters being monitored. This could
* be counters we are using ourselves, or could be counters being run by someone
* else. Store the trigger level for each counter that we are monitoring until they reach
* a specified level (as opposed to comparing values in two or more counters).
*/
size_t num_counters;
orte_pointer_array_t *counters;
};
typedef struct orte_gpr_replica_triggers_t orte_gpr_replica_triggers_t;
OMPI_DECLSPEC OBJ_CLASS_DECLARATION(orte_gpr_replica_triggers_t);
/*
* Action taken object - used to track what action was taken against what
* registry object during the course of a registry request. For example, if
* a PUT modifies an existing registry entry, then we store a pointer to that
* entry and a flag indicating that it was modified. This info is required for
* processing notification subscriptions.
*/
typedef struct {
ompi_object_t super; /**< Make this an object */
orte_gpr_replica_action_t action; /**< What was done (an ORTE_GPR_REPLICA_* action code) */
orte_gpr_replica_segment_t *seg; /**< Segment of the affected entry */
orte_gpr_replica_container_t *cptr; /**< Container of the affected entry */
orte_gpr_replica_itagval_t *iptr; /**< The affected itagval entry */
} orte_gpr_replica_action_taken_t;
OMPI_DECLSPEC OBJ_CLASS_DECLARATION(orte_gpr_replica_action_taken_t);
/*
* Revision annotation carried over from the repository viewer
* (2005-03-29 02:37:54 +04:00):
*
* Fix a subtle bug in the registry callback system that was manifesting
* itself in the singleton case and (randomly) in the multiprocess case.
* Update the unit-test-status matrix to include priority. Add several new
* registry diagnostics that helped track down the above bug.
*
* M test/mca/gpr/gpr_triggers.c
* M test/Unit-Test-Status.xls
* M test/Unit-Test-Status.pdf
* M src/mpi/runtime/ompi_mpi_init.c
* M src/mca/oob/base/oob_base_xcast.c
* M src/mca/ns/base/ns_base_nds_env.c
* M src/mca/gpr/replica/api_layer/gpr_replica_dump_api.c
* M src/mca/gpr/replica/api_layer/gpr_replica_api.h
* M src/mca/gpr/replica/communications/gpr_replica_comm.h
* M src/mca/gpr/replica/communications/gpr_replica_remote_msg.c
* M src/mca/gpr/replica/communications/gpr_replica_cmd_processor.c
* M src/mca/gpr/replica/communications/gpr_replica_dump_cm.c
* M src/mca/gpr/replica/gpr_replica_component.c
* M src/mca/gpr/replica/gpr_replica.h
* M src/mca/gpr/replica/functional_layer/gpr_replica_dump_fn.c
* M src/mca/gpr/replica/functional_layer/gpr_replica_fn.h
* M src/mca/gpr/replica/functional_layer/gpr_replica_trig_ops_fn.c
* M src/mca/gpr/replica/functional_layer/gpr_replica_messaging_fn.c
* M src/mca/gpr/replica/functional_layer/gpr_replica_segment_fn.c
* M src/mca/gpr/proxy/gpr_proxy_dump.c
* M src/mca/gpr/proxy/gpr_proxy.h
* M src/mca/gpr/proxy/gpr_proxy_component.c
* M src/mca/gpr/gpr_types.h
* M src/mca/gpr/base/base.h
* M src/mca/gpr/base/unpack_api_response/gpr_base_dump_notify.c
* M src/mca/gpr/base/pack_api_cmd/gpr_base_pack_dump.c
* M src/mca/gpr/gpr.h
*
* This commit was SVN r5080.
*/
/*
* Notify message list objects - used to track individual messages going to
* the same recipient. Each object is a list item wrapping a pointer to one
* notify message.
* NOTE(review): presumably these are the items placed on the messages list of
* orte_gpr_replica_callbacks_t - confirm against the messaging code.
*/
typedef struct {
ompi_list_item_t item; /**< Allows this item to be placed on a list */
orte_gpr_notify_message_t *message; /**< The message being tracked */
} orte_gpr_replica_notify_msg_list_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_notify_msg_list_t);
/*
* Callback list objects
*/
struct orte_gpr_replica_callbacks_t {
ompi_list_item_t item;
Fix a subtle bug in the registry callback system that was manifesting itself in the singleton case and (randomly) in the multiprocess case. Update the unit-test-status matrix to include priority. Add several new registry diagnostics that helped track down the above bug. M test/mca/gpr/gpr_triggers.c M test/Unit-Test-Status.xls M test/Unit-Test-Status.pdf M src/mpi/runtime/ompi_mpi_init.c M src/mca/oob/base/oob_base_xcast.c M src/mca/ns/base/ns_base_nds_env.c M src/mca/gpr/replica/api_layer/gpr_replica_dump_api.c M src/mca/gpr/replica/api_layer/gpr_replica_api.h M src/mca/gpr/replica/communications/gpr_replica_comm.h M src/mca/gpr/replica/communications/gpr_replica_remote_msg.c M src/mca/gpr/replica/communications/gpr_replica_cmd_processor.c M src/mca/gpr/replica/communications/gpr_replica_dump_cm.c M src/mca/gpr/replica/gpr_replica_component.c M src/mca/gpr/replica/gpr_replica.h M src/mca/gpr/replica/functional_layer/gpr_replica_dump_fn.c M src/mca/gpr/replica/functional_layer/gpr_replica_fn.h M src/mca/gpr/replica/functional_layer/gpr_replica_trig_ops_fn.c M src/mca/gpr/replica/functional_layer/gpr_replica_messaging_fn.c M src/mca/gpr/replica/functional_layer/gpr_replica_segment_fn.c M src/mca/gpr/proxy/gpr_proxy_dump.c M src/mca/gpr/proxy/gpr_proxy.h M src/mca/gpr/proxy/gpr_proxy_component.c M src/mca/gpr/gpr_types.h M src/mca/gpr/base/base.h M src/mca/gpr/base/unpack_api_response/gpr_base_dump_notify.c M src/mca/gpr/base/pack_api_cmd/gpr_base_pack_dump.c M src/mca/gpr/gpr.h This commit was SVN r5080.
2005-03-29 02:37:54 +04:00
ompi_list_t messages;
orte_process_name_t *requestor;
};
typedef struct orte_gpr_replica_callbacks_t orte_gpr_replica_callbacks_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_callbacks_t);
/** List of replicas that hold a stored entry.
* Each entry can have an arbitrary number of replicas that hold a copy
* of the entry. The GPR requires that each entry be replicated in at least
* two locations. This structure is the list item from which a linked list
* of replicas for the entry is built.
*
* THIS IS NOT IMPLEMENTED YET
*/
struct orte_gpr_replica_list_t {
ompi_list_item_t item; /**< Allows this item to be placed on a list */
orte_process_name_t *replica; /**< Name of the replica */
};
typedef struct orte_gpr_replica_list_t orte_gpr_replica_list_t;
OBJ_CLASS_DECLARATION(orte_gpr_replica_list_t);
/** Write invalidate structure.
* The structure used to indicate that an entry has been updated somewhere else in the GPR.
* The structure contains a flag indicating that the locally stored copy of the entry
* is no longer valid, a time tag indicating the time of the last known modification
* of the entry within the global registry, and the replica holding the last known
* up-to-date version of the entry.
*
* Unlike most structures in this header it has no object or list-item member.
*
* THIS IS NOT IMPLEMENTED YET
*/
struct orte_gpr_replica_write_invalidate_t {
bool invalidate; /**< Flag: locally stored copy is no longer valid */
time_t last_mod; /**< Time of last known modification within the global registry */
orte_process_name_t *valid_replica; /**< Replica holding the last known up-to-date version */
};
typedef struct orte_gpr_replica_write_invalidate_t orte_gpr_replica_write_invalidate_t;
/*
* globals needed within component
*
* Both are declarations only (extern); the definitions live outside this header.
* orte_gpr_replica is the registry "head"; orte_gpr_replica_globals is the
* component-wide state structure.
*/
extern orte_gpr_replica_t orte_gpr_replica;
extern orte_gpr_replica_globals_t orte_gpr_replica_globals;
/*
* Module open / close
*
* Both take no arguments and return an int.
* NOTE(review): presumably an ORTE status code - confirm.
*/
int orte_gpr_replica_open(void);
int orte_gpr_replica_close(void);
/*
* Startup / Shutdown
*/
/* Returns a pointer to the gpr module structure and takes three out-pointers.
* NOTE(review): presumably follows the usual component-init contract - threading
* capabilities and selection priority are reported through the pointers, and
* NULL is returned when the component declines to run - confirm against
* mca/gpr/base/base.h.
*/
orte_gpr_base_module_t *orte_gpr_replica_init(bool *allow_multi_user_threads, bool *have_hidden_threads, int *priority);
/* Shutdown counterpart of orte_gpr_replica_init; returns an int. */
int orte_gpr_replica_finalize(void);
/* NOTE(review): role relative to orte_gpr_replica_init is not visible in this
* header - TODO document. */
int orte_gpr_replica_module_init(void);
#if defined(c_plusplus) || defined(__cplusplus)
}
#endif
#endif