
Add a framework to support different types of threading models including user space thread packages such as Qthreads and Argobots: https://github.com/pmodels/argobots https://github.com/Qthreads/qthreads The default threading model is pthreads. Alternate thread models are specified at configure time using the --with-threads=X option. The framework is static. The threading model to use is selected at Open MPI configure/build time. mca/threads: implement Argobots threading layer config: fix thread configury - Add double quotations - Change Argobot to Argobots config: implement Argobots check If the poll time is too long, MPI hangs. This quick fix just sets it to 0, but it is not good for the Pthreads version. Need to find a good way to abstract it. Note that even 1 (= 1 millisecond) causes disastrous performance degradation. rework threads MCA framework configury It now works more like the ompi/mca/rte configury, modulo some edge items that are special for threading package linking, etc. qthreads module some argobots cleanup Signed-off-by: Noah Evans <noah.evans@gmail.com> Signed-off-by: Shintaro Iwasaki <siwasaki@anl.gov> Signed-off-by: Howard Pritchard <howardp@lanl.gov>
117 строки
3.9 KiB
C
117 строки
3.9 KiB
C
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
|
/*
|
|
* Copyright (c) 2014-2016 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2016 Los Alamos National Security, LLC. All rights
|
|
* reserved.
|
|
* Copyright (c) 2017 IBM Corporation. All rights reserved.
|
|
* Copyright (c) 2019 Sandia National Laboratories. All rights reserved.
|
|
*
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "opal/mca/threads/argobots/threads_argobots.h"
|
|
#include "opal/mca/threads/wait_sync.h"
|
|
|
|
/* Mutex taken around every insertion into and removal from wait_sync_list. */
static opal_mutex_t wait_sync_lock = OPAL_MUTEX_STATIC_INIT;
|
|
/* Head of the circular, doubly linked list of syncs that are still being
 * waited on (NULL when empty).  A waiter whose sync is the head does not
 * block on its condition variable; it drives opal_progress() instead. */
static ompi_wait_sync_t *wait_sync_list = NULL;
|
|
|
|
/* Count of threads currently inside the progress loop of
 * ompi_sync_wait_mt(); compared against opal_max_thread_in_progress to
 * decide whether a waiter that is not the list head should block. */
static opal_atomic_int32_t num_thread_in_progress = 0;
|
|
|
|
/*
 * Wake the waiter that owns `who` so it can take over the progress duties:
 * its condition variable is signaled while its mutex is held, which pairs
 * with the ABT_cond_wait() performed under the same mutex in
 * ompi_sync_wait_mt().
 *
 * `who` is evaluated exactly once, so an argument with side effects is safe
 * to pass.
 */
#define WAIT_SYNC_PASS_OWNERSHIP(who)                          \
    do {                                                       \
        ompi_wait_sync_t *pass_to_ = (who);                    \
        ABT_mutex_lock(pass_to_->lock);                        \
        ABT_cond_signal(pass_to_->condition);                  \
        ABT_mutex_unlock(pass_to_->lock);                      \
    } while (0)
|
|
|
|
/**
 * Wait until the given synchronization object has completed.
 *
 * The sync is appended to the global list of pending syncs.  The caller
 * then either blocks on the sync's condition variable or, when it is the
 * head of that list (or fewer than opal_max_thread_in_progress threads are
 * progressing), drives opal_progress() itself until sync->count drops to
 * zero or below.  On the way out the sync is unlinked and, if it was the
 * list head, the next pending waiter is signaled.
 *
 * @param sync  synchronization object to wait on
 *
 * @return OPAL_SUCCESS if sync->status is 0 once the wait is over,
 *         OPAL_ERROR otherwise
 */
int ompi_sync_wait_mt(ompi_wait_sync_t *sync)
{
    /* Set when completion was observed right after a condition wakeup, in
     * which case the progress loop below is skipped. */
    int completed_while_blocked = 0;

    /* Fast path: the sync is already complete, nothing to register. */
    if (sync->count <= 0) {
        return (0 == sync->status) ? OPAL_SUCCESS : OPAL_ERROR;
    }

    /* Hold our own lock so that nobody can signal us while the list is
     * being updated. */
    ABT_mutex_lock(sync->lock);

    /* Re-check under the lock: the sync may have completed in between. */
    if (sync->count <= 0) {
        ABT_mutex_unlock(sync->lock);
        return (0 == sync->status) ? OPAL_SUCCESS : OPAL_ERROR;
    }

    /* Append ourselves at the tail of the circular list of pending syncs. */
    OPAL_THREAD_LOCK(&wait_sync_lock);
    if (NULL != wait_sync_list) {
        sync->prev = wait_sync_list->prev;
        sync->prev->next = sync;
        sync->next = wait_sync_list;
        wait_sync_list->prev = sync;
    } else {
        sync->prev = sync;
        sync->next = sync;
        wait_sync_list = sync;
    }
    OPAL_THREAD_UNLOCK(&wait_sync_lock);

    /*
     * As long as we are not the list head and enough threads are already
     * progressing, stay blocked until something worth noticing happens:
     *  - our sync has been triggered, or
     *  - this thread has been promoted to take care of the progress.
     * Any other wakeup (e.g. a spurious one) re-evaluates the condition.
     */
    while (sync != wait_sync_list &&
           num_thread_in_progress >= opal_max_thread_in_progress) {
        ABT_cond_wait(sync->condition, sync->lock);

        if (sync->count <= 0) { /* completed while we were blocked */
            completed_while_blocked = 1;
            break;
        }
    }
    ABT_mutex_unlock(sync->lock);

    if (!completed_while_blocked) {
        /* Progress until completion.  The sync lock has been released
         * above: progressing with it held would deadlock. */
        OPAL_THREAD_ADD_FETCH32(&num_thread_in_progress, 1);
        while (sync->count > 0) {
            opal_progress();
            ABT_thread_yield();
        }
        OPAL_THREAD_ADD_FETCH32(&num_thread_in_progress, -1);
    }

    /* The sync is complete: unlink it from the pending list. */
    OPAL_THREAD_LOCK(&wait_sync_lock);
    sync->prev->next = sync->next;
    sync->next->prev = sync->prev;

    /* If we were the list head, hand the duties to the next waiter. */
    if (wait_sync_list == sync) {
        if (sync->next == sync) {
            /* We were the only entry; the list is now empty. */
            wait_sync_list = NULL;
        } else {
            wait_sync_list = sync->next;
            WAIT_SYNC_PASS_OWNERSHIP(wait_sync_list);
        }
    }
    OPAL_THREAD_UNLOCK(&wait_sync_lock);

    return (0 == sync->status) ? OPAL_SUCCESS : OPAL_ERROR;
}
|