Merge pull request #2590 from jjhursey/topic/osc-pt2pt-1-thread-fixes
Topic/osc pt2pt 1 thread fixes
Этот коммит содержится в:
Коммит
ced245d093
@ -10,7 +10,7 @@
|
||||
* All rights reserved.
|
||||
* Copyright (c) 2007-2016 Los Alamos National Security, LLC. All rights
|
||||
* reserved.
|
||||
* Copyright (c) 2010 IBM Corporation. All rights reserved.
|
||||
* Copyright (c) 2010-2016 IBM Corporation. All rights reserved.
|
||||
* Copyright (c) 2012-2013 Sandia National Laboratories. All rights reserved.
|
||||
* Copyright (c) 2015 Research Organization for Information Science
|
||||
* and Technology (RIST). All rights reserved.
|
||||
@ -227,6 +227,12 @@ int ompi_osc_pt2pt_start (ompi_group_t *group, int assert, ompi_win_t *win)
|
||||
/* haven't processed any post messages yet */
|
||||
sync->sync_expected = sync->num_peers;
|
||||
|
||||
/* If the previous epoch was from Fence, then eager_send_active is still
|
||||
* set to true at this time, but it shoulnd't be true until we get our
|
||||
* incoming Posts. So reset to 'false' for this new epoch.
|
||||
*/
|
||||
sync->eager_send_active = false;
|
||||
|
||||
OPAL_OUTPUT_VERBOSE((50, ompi_osc_base_framework.framework_output,
|
||||
"ompi_osc_pt2pt_start entering with group size %d...",
|
||||
sync->num_peers));
|
||||
|
@ -15,6 +15,7 @@
|
||||
* Copyright (c) 2015 Research Organization for Information Science
|
||||
* and Technology (RIST). All rights reserved.
|
||||
* Copyright (c) 2016 FUJITSU LIMITED. All rights reserved.
|
||||
* Copyright (c) 2016 IBM Corporation. All rights reserved.
|
||||
* $COPYRIGHT$
|
||||
*
|
||||
* Additional copyrights may follow
|
||||
@ -336,7 +337,16 @@ static inline int ompi_osc_pt2pt_put_w_req (const void *origin_addr, int origin_
|
||||
|
||||
if (is_long_msg) {
|
||||
/* wait for eager sends to be active before starting a long put */
|
||||
ompi_osc_pt2pt_sync_wait_expected (pt2pt_sync);
|
||||
if (pt2pt_sync->type == OMPI_OSC_PT2PT_SYNC_TYPE_LOCK) {
|
||||
OPAL_THREAD_LOCK(&pt2pt_sync->lock);
|
||||
ompi_osc_pt2pt_peer_t *peer = ompi_osc_pt2pt_peer_lookup (module, target);
|
||||
while (!(peer->flags & OMPI_OSC_PT2PT_PEER_FLAG_EAGER)) {
|
||||
opal_condition_wait(&pt2pt_sync->cond, &pt2pt_sync->lock);
|
||||
}
|
||||
OPAL_THREAD_UNLOCK(&pt2pt_sync->lock);
|
||||
} else {
|
||||
ompi_osc_pt2pt_sync_wait_expected (pt2pt_sync);
|
||||
}
|
||||
}
|
||||
|
||||
OPAL_OUTPUT_VERBOSE((50, ompi_osc_base_framework.framework_output,
|
||||
@ -495,7 +505,16 @@ ompi_osc_pt2pt_accumulate_w_req (const void *origin_addr, int origin_count,
|
||||
|
||||
if (is_long_msg) {
|
||||
/* wait for synchronization before posting a long message */
|
||||
ompi_osc_pt2pt_sync_wait_expected (pt2pt_sync);
|
||||
if (pt2pt_sync->type == OMPI_OSC_PT2PT_SYNC_TYPE_LOCK) {
|
||||
OPAL_THREAD_LOCK(&pt2pt_sync->lock);
|
||||
ompi_osc_pt2pt_peer_t *peer = ompi_osc_pt2pt_peer_lookup (module, target);
|
||||
while (!(peer->flags & OMPI_OSC_PT2PT_PEER_FLAG_EAGER)) {
|
||||
opal_condition_wait(&pt2pt_sync->cond, &pt2pt_sync->lock);
|
||||
}
|
||||
OPAL_THREAD_UNLOCK(&pt2pt_sync->lock);
|
||||
} else {
|
||||
ompi_osc_pt2pt_sync_wait_expected (pt2pt_sync);
|
||||
}
|
||||
}
|
||||
|
||||
header = (ompi_osc_pt2pt_header_acc_t*) ptr;
|
||||
|
@ -10,7 +10,7 @@
|
||||
* All rights reserved.
|
||||
* Copyright (c) 2007-2016 Los Alamos National Security, LLC. All rights
|
||||
* reserved.
|
||||
* Copyright (c) 2010 IBM Corporation. All rights reserved.
|
||||
* Copyright (c) 2010-2016 IBM Corporation. All rights reserved.
|
||||
* Copyright (c) 2012-2013 Sandia National Laboratories. All rights reserved.
|
||||
* Copyright (c) 2015 Intel, Inc. All rights reserved.
|
||||
* Copyright (c) 2015-2016 Research Organization for Information Science
|
||||
@ -421,6 +421,16 @@ static int ompi_osc_pt2pt_unlock_internal (int target, ompi_win_t *win)
|
||||
/* wait for unlock acks. this signals remote completion of fragments */
|
||||
ompi_osc_pt2pt_sync_wait_expected (lock);
|
||||
|
||||
/* It is possible for the unlock to finish too early before the data
|
||||
* is actually present in the recv buffer (for non-contiguous datatypes)
|
||||
* So make sure to wait for all of the fragments to arrive.
|
||||
*/
|
||||
OPAL_THREAD_LOCK(&module->lock);
|
||||
while (module->outgoing_frag_count < module->outgoing_frag_signal_count) {
|
||||
opal_condition_wait(&module->cond, &module->lock);
|
||||
}
|
||||
OPAL_THREAD_UNLOCK(&module->lock);
|
||||
|
||||
OPAL_OUTPUT_VERBOSE((25, ompi_osc_base_framework.framework_output,
|
||||
"ompi_osc_pt2pt_unlock: unlock of %d complete", target));
|
||||
} else {
|
||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user