7e2874a83d
Useful when debugging RTE-related issues. Not for inclusion in the tarball - just added to the git repo for use by developers. Signed-off-by: Ralph Castain <rhc@pmix.org>
294 строки
9.4 KiB
C
294 строки
9.4 KiB
C
/* -*- C -*-
|
|
*
|
|
* $HEADER$
|
|
*
|
|
* The most basic of MPI applications
|
|
*/
|
|
|
|
#include <stdio.h>
#include <stdlib.h>
|
|
#include <pthread.h>
|
|
|
|
#include "opal/mca/hwloc/base/base.h"
|
|
#include "mpi.h"
|
|
|
|
#include "orte/util/proc_info.h"
|
|
#include "opal/mca/pmix/base/base.h"
|
|
|
|
/* Reference of the registered model event handler; stays SIZE_MAX until
 * model_registration_callback() stores the value it is handed. */
static size_t interlibhandler_id = SIZE_MAX;
|
|
/* Lock constructed and waited on by mylib(); model_callback() wakes it. */
static opal_pmix_lock_t thread_complete;
|
|
|
|
static void model_registration_callback(int status,
|
|
size_t errhandler_ref,
|
|
void *cbdata)
|
|
{
|
|
opal_pmix_lock_t *lock = (opal_pmix_lock_t*)cbdata;
|
|
|
|
interlibhandler_id = errhandler_ref;
|
|
OPAL_PMIX_WAKEUP_THREAD(lock);
|
|
}
|
|
static void model_callback(int status,
|
|
const opal_process_name_t *source,
|
|
opal_list_t *info, opal_list_t *results,
|
|
opal_pmix_notification_complete_fn_t cbfunc,
|
|
void *cbdata)
|
|
{
|
|
opal_value_t *val;
|
|
|
|
/* we can ignore our own callback as we obviously
|
|
* know that we are OpenMP */
|
|
if (NULL != info) {
|
|
OPAL_LIST_FOREACH(val, info, opal_value_t) {
|
|
if (0 == strcmp(val->key, OPAL_PMIX_PROGRAMMING_MODEL) &&
|
|
0 == strcmp(val->data.string, "OpenMP")) {
|
|
goto cback;
|
|
}
|
|
if (OPAL_STRING == val->type) {
|
|
opal_output(0, "Thread Model Callback Key: %s Val %s", val->key, val->data.string);
|
|
}
|
|
}
|
|
}
|
|
/* otherwise, do something clever here */
|
|
|
|
cback:
|
|
/* we must NOT tell the event handler state machine that we
|
|
* are the last step as that will prevent it from notifying
|
|
* anyone else that might be listening for declarations */
|
|
if (NULL != cbfunc) {
|
|
cbfunc(OPAL_SUCCESS, NULL, NULL, NULL, cbdata);
|
|
}
|
|
OPAL_PMIX_WAKEUP_THREAD(&thread_complete);
|
|
}
|
|
|
|
static void opcbfunc(int status, void *cbdata)
|
|
{
|
|
opal_pmix_lock_t *lock = (opal_pmix_lock_t*)cbdata;
|
|
OPAL_PMIX_WAKEUP_THREAD(lock);
|
|
}
|
|
|
|
static void infocb(int status,
|
|
opal_list_t *info,
|
|
void *cbdata,
|
|
opal_pmix_release_cbfunc_t release_fn,
|
|
void *release_cbdata)
|
|
{
|
|
opal_pmix_lock_t *lock = (opal_pmix_lock_t*)cbdata;
|
|
opal_value_t *kv;
|
|
|
|
OPAL_LIST_FOREACH(kv, info, opal_value_t) {
|
|
opal_output(0, "QUERY DATA KEY: %s VALUE %s", kv->key, kv->data.string);
|
|
}
|
|
if (NULL != release_fn) {
|
|
release_fn(release_cbdata);
|
|
}
|
|
OPAL_PMIX_WAKEUP_THREAD(lock);
|
|
}
|
|
|
|
static void *mylib(void *ptr)
|
|
{
|
|
opal_list_t info, directives;
|
|
opal_value_t *kv;
|
|
int ret;
|
|
opal_pmix_lock_t lock;
|
|
bool init = false;
|
|
opal_pmix_query_t *query;
|
|
opal_pmix_pdata_t *pdata;
|
|
|
|
OPAL_PMIX_CONSTRUCT_LOCK(&thread_complete);
|
|
|
|
/* declare that we are present and active */
|
|
OBJ_CONSTRUCT(&info, opal_list_t);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_PROGRAMMING_MODEL);
|
|
kv->type = OPAL_STRING;
|
|
kv->data.string = strdup("OpenMP");
|
|
opal_list_append(&info, &kv->super);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_MODEL_LIBRARY_NAME);
|
|
kv->type = OPAL_STRING;
|
|
kv->data.string = strdup("foobar");
|
|
opal_list_append(&info, &kv->super);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_MODEL_LIBRARY_VERSION);
|
|
kv->type = OPAL_STRING;
|
|
kv->data.string = strdup("1.2.3.4");
|
|
opal_list_append(&info, &kv->super);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_THREADING_MODEL);
|
|
kv->type = OPAL_STRING;
|
|
kv->data.string = strdup("PTHREAD");
|
|
opal_list_append(&info, &kv->super);
|
|
|
|
/* see if pmix is already initialized */
|
|
if (opal_pmix.initialized()) {
|
|
/* mark that this isn't to go to any default event handler - pmix_init
|
|
* takes care of that for us, but we have to explicitly do it here */
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_EVENT_NON_DEFAULT);
|
|
kv->type = OPAL_BOOL;
|
|
kv->data.flag = true;
|
|
opal_list_append(&info, &kv->super);
|
|
/* it is, so let's just use the event notification
|
|
* API to let everyone know we are here */
|
|
OPAL_PMIX_CONSTRUCT_LOCK(&lock);
|
|
ret = opal_pmix.notify_event(OPAL_ERR_MODEL_DECLARED,
|
|
&orte_process_info.my_name,
|
|
OPAL_PMIX_RANGE_PROC_LOCAL, &info,
|
|
opcbfunc, &lock);
|
|
OPAL_PMIX_WAIT_THREAD(&lock);
|
|
OPAL_PMIX_DESTRUCT_LOCK(&lock);
|
|
OPAL_LIST_DESTRUCT(&info);
|
|
} else {
|
|
/* call pmix to initialize these values */
|
|
ret = opal_pmix.init(&info);
|
|
OPAL_LIST_DESTRUCT(&info);
|
|
init = true;
|
|
}
|
|
|
|
/* register to receive model callbacks */
|
|
|
|
/* give it a name so we can distinguish it */
|
|
OBJ_CONSTRUCT(&directives, opal_list_t);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_EVENT_HDLR_NAME);
|
|
kv->type = OPAL_STRING;
|
|
kv->data.string = strdup("My-Declarations");
|
|
opal_list_append(&directives, &kv->super);
|
|
/* specify the event code */
|
|
OBJ_CONSTRUCT(&info, opal_list_t);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup("status"); // the key here is irrelevant
|
|
kv->type = OPAL_INT;
|
|
kv->data.integer = OPAL_ERR_MODEL_DECLARED;
|
|
opal_list_append(&info, &kv->super);
|
|
/* we could constrain the range to proc_local - technically, this
|
|
* isn't required so long as the code that generates
|
|
* the event stipulates its range as proc_local. We rely
|
|
* on that here */
|
|
OPAL_PMIX_CONSTRUCT_LOCK(&lock);
|
|
opal_pmix.register_evhandler(&info, &directives, model_callback,
|
|
model_registration_callback,
|
|
(void*)&lock);
|
|
OPAL_PMIX_WAIT_THREAD(&lock);
|
|
OPAL_PMIX_DESTRUCT_LOCK(&lock);
|
|
OPAL_LIST_DESTRUCT(&info);
|
|
OPAL_LIST_DESTRUCT(&directives);
|
|
|
|
/* wait for the model callback */
|
|
OPAL_PMIX_WAIT_THREAD(&thread_complete);
|
|
|
|
/* let's do a couple of operations just to verify we can,
|
|
* starting with a query */
|
|
OBJ_CONSTRUCT(&info, opal_list_t);
|
|
query = OBJ_NEW(opal_pmix_query_t);
|
|
opal_argv_append_nosize(&query->keys, OPAL_PMIX_QUERY_NAMESPACES);
|
|
opal_list_append(&info, &query->super);
|
|
OPAL_PMIX_CONSTRUCT_LOCK(&lock);
|
|
opal_pmix.query(&info, infocb, &lock);
|
|
OPAL_PMIX_WAIT_THREAD(&lock);
|
|
OPAL_PMIX_DESTRUCT_LOCK(&lock);
|
|
OPAL_LIST_DESTRUCT(&info);
|
|
|
|
/* Get something */
|
|
opal_pmix.get(&orte_process_info.my_name,
|
|
"WASSUP", NULL, &kv);
|
|
if (NULL == kv) {
|
|
fprintf(stderr, "ERROR GETTING WASSUP\n");
|
|
} else {
|
|
fprintf(stderr, "THREAD WASSUP: %s\n", kv->data.string);
|
|
OBJ_RELEASE(kv);
|
|
}
|
|
|
|
/* lookup something published by the main thread */
|
|
OBJ_CONSTRUCT(&info, opal_list_t);
|
|
pdata = OBJ_NEW(opal_pmix_pdata_t);
|
|
pdata->proc = orte_process_info.my_name;
|
|
pdata->value.key = strdup("SOMETHING");
|
|
opal_list_append(&info, &pdata->super);
|
|
/* tell the call to wait for the data to be published */
|
|
OBJ_CONSTRUCT(&directives, opal_list_t);
|
|
kv = OBJ_NEW(opal_value_t);
|
|
kv->key = strdup(OPAL_PMIX_WAIT);
|
|
kv->type = OPAL_INT;
|
|
kv->data.integer = 0; // wait for all
|
|
opal_list_append(&directives, &kv->super);
|
|
|
|
if (OPAL_SUCCESS != opal_pmix.lookup(&info, &directives)) {
|
|
fprintf(stderr, "LOOKUP FAILED\n");
|
|
} else {
|
|
pdata = (opal_pmix_pdata_t*)opal_list_get_first(&info);
|
|
fprintf(stderr, "LOOKUP RETURNED %s\n", pdata->value.data.string);
|
|
}
|
|
OPAL_LIST_DESTRUCT(&info);
|
|
OPAL_LIST_DESTRUCT(&directives);
|
|
|
|
if (init) {
|
|
/* need to finalize to maintain refcount */
|
|
opal_pmix.finalize();
|
|
}
|
|
|
|
/* done */
|
|
return NULL;
|
|
}
|
|
|
|
int main(int argc, char* argv[])
|
|
{
|
|
int rank, size, rc;
|
|
hwloc_cpuset_t cpus;
|
|
char *bindings = NULL;
|
|
pid_t pid;
|
|
pthread_t mythread;
|
|
opal_value_t kv, *kptr;
|
|
opal_list_t list;
|
|
|
|
MPI_Init(&argc, &argv);
|
|
MPI_Comm_rank(MPI_COMM_WORLD, &rank);
|
|
MPI_Comm_size(MPI_COMM_WORLD, &size);
|
|
pid = getpid();
|
|
|
|
/* push something the thread can recognize */
|
|
OBJ_CONSTRUCT(&kv, opal_value_t);
|
|
kv.key = strdup("WASSUP");
|
|
kv.type = OPAL_STRING;
|
|
kv.data.string = strdup("nothing");
|
|
opal_pmix.put(OPAL_PMIX_LOCAL, &kv);
|
|
OBJ_DESTRUCT(&kv);
|
|
/* no need to commit it as this is strictly within ourselves */
|
|
|
|
/* spin up a thread */
|
|
if (pthread_create(&mythread, NULL, mylib, NULL)) {
|
|
fprintf(stderr, "Error creating thread\n");
|
|
goto done;
|
|
}
|
|
|
|
printf("[%lu] Rank %d: getting topology\n", (unsigned long)pid, rank);
|
|
fflush(stdout);
|
|
if (OPAL_SUCCESS == opal_hwloc_base_get_topology()) {
|
|
cpus = hwloc_bitmap_alloc();
|
|
rc = hwloc_get_cpubind(opal_hwloc_topology, cpus, HWLOC_CPUBIND_PROCESS);
|
|
hwloc_bitmap_list_asprintf(&bindings, cpus);
|
|
}
|
|
|
|
printf("Hello, World, I am %d of %d [%d local peers]: get_cpubind: %d bitmap %s\n",
|
|
rank, size, orte_process_info.num_local_peers, rc,
|
|
(NULL == bindings) ? "NULL" : bindings);
|
|
|
|
/* publish something */
|
|
OBJ_CONSTRUCT(&list, opal_list_t);
|
|
kptr = OBJ_NEW(opal_value_t);
|
|
kptr->key = strdup("SOMETHING");
|
|
kptr->type = OPAL_STRING;
|
|
kptr->data.string = strdup("SILLY-THING");
|
|
opal_list_append(&list, &kptr->super);
|
|
opal_pmix.publish(&list);
|
|
OPAL_LIST_DESTRUCT(&list);
|
|
|
|
/* wait for the thread to finish */
|
|
if (pthread_join(mythread, NULL)) {
|
|
fprintf(stderr, "Error joining thread\n");
|
|
}
|
|
|
|
done:
|
|
MPI_Finalize();
|
|
return 0;
|
|
}
|