Fix for fix of fix for handling misalignment when sending
onesided multifrag. This fixes trac:2532. This commit was SVN r23760. The following Trac tickets were found above: Ticket 2532 --> https://svn.open-mpi.org/trac/ompi/ticket/2532
Этот коммит содержится в:
родитель
8052c9dd46
Коммит
91c1ee86d7
@ -921,10 +921,13 @@ component_fragment_cb(struct mca_btl_base_module_t *btl,
|
||||
}
|
||||
|
||||
if ((base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI) != 0) {
|
||||
|
||||
/* The next header starts at the next aligned address in the
|
||||
* buffer. Therefore, bump pointer forward if necessary. */
|
||||
payload = (char *)payload + OPAL_ALIGN_PAD_AMOUNT(payload, sizeof(void*));
|
||||
/* The next header starts at the next aligned address in
|
||||
* the buffer. Therefore, check the hdr_flags to see if
|
||||
* any extra alignment is necessary, and if so, pull value
|
||||
* from the flags. */
|
||||
if (base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK) {
|
||||
payload = (char *)payload + (base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK);
|
||||
}
|
||||
base_header = (ompi_osc_rdma_base_header_t*) payload;
|
||||
} else {
|
||||
done = true;
|
||||
|
@ -362,16 +362,15 @@ ompi_osc_rdma_sendreq_send_cb(struct mca_btl_base_module_t* btl,
|
||||
if (0 == (header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI)) {
|
||||
done = true;
|
||||
} else {
|
||||
/* Find starting point for next header. Note that the last part
|
||||
* added in to compute the starting point for the next header is
|
||||
* extra padding that may have been inserted. */
|
||||
header = (ompi_osc_rdma_send_header_t*)
|
||||
(((char*) header) +
|
||||
sizeof(ompi_osc_rdma_send_header_t) +
|
||||
ompi_datatype_pack_description_length(sendreq->req_target_datatype) +
|
||||
header->hdr_msg_length);
|
||||
|
||||
/* The next header starts at the next aligned address in the
|
||||
* buffer. Therefore, bump pointer forward if necessary. */
|
||||
header = (ompi_osc_rdma_send_header_t*)((char*)header +
|
||||
OPAL_ALIGN_PAD_AMOUNT(header, sizeof(void*)));
|
||||
header->hdr_msg_length +
|
||||
(header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK));
|
||||
|
||||
if (header->hdr_base.hdr_type == OMPI_OSC_RDMA_HDR_MULTI_END) {
|
||||
done = true;
|
||||
@ -574,14 +573,21 @@ ompi_osc_rdma_sendreq_send(ompi_osc_rdma_module_t *module,
|
||||
* pointer addresses. Therefore, the pointer, amount written
|
||||
* and space remaining are adjusted forward so that the
|
||||
* starting position for the next message is aligned properly.
|
||||
* This strict alignment is required by certain platforms like
|
||||
* SPARC. Without it, bus errors can occur. Keeping things
|
||||
* aligned also may offer some performance improvements on
|
||||
* other platforms. */
|
||||
* The amount of this alignment is embedded in the hdr_flags
|
||||
* field so the callback completion and receiving side can
|
||||
* also know how much to move the pointer to find the starting
|
||||
* point of the next header. This strict alignment is
|
||||
* required by certain platforms like SPARC. Without it,
|
||||
* bus errors can occur. Keeping things aligned also may
|
||||
* offer some performance improvements on other platforms.
|
||||
*/
|
||||
offset = OPAL_ALIGN_PAD_AMOUNT(descriptor->des_src[0].seg_len, sizeof(void*));
|
||||
if (0 != offset) {
|
||||
header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK & offset;
|
||||
descriptor->des_src[0].seg_len += offset;
|
||||
written_data += offset;
|
||||
module->m_pending_buffers[sendreq->req_target_rank].remain_len -= offset;
|
||||
}
|
||||
|
||||
#ifdef WORDS_BIGENDIAN
|
||||
header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_NBO;
|
||||
|
@ -10,6 +10,7 @@
|
||||
* Copyright (c) 2007 Los Alamos National Security, LLC. All rights
|
||||
* reserved.
|
||||
* Copyright (c) 2010 Cisco Systems, Inc. All rights reserved.
|
||||
* Copyright (c) 2010 Oracle and/or its affiliates. All rights reserved.
|
||||
* $COPYRIGHT$
|
||||
*
|
||||
* Additional copyrights may follow
|
||||
@ -40,8 +41,9 @@
|
||||
#define OMPI_OSC_RDMA_HDR_MULTI_END 0x0B
|
||||
#define OMPI_OSC_RDMA_HDR_RDMA_INFO 0x0C
|
||||
|
||||
#define OMPI_OSC_RDMA_HDR_FLAG_NBO 0x01
|
||||
#define OMPI_OSC_RDMA_HDR_FLAG_MULTI 0x02
|
||||
#define OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK 0x0F
|
||||
#define OMPI_OSC_RDMA_HDR_FLAG_NBO 0x10
|
||||
#define OMPI_OSC_RDMA_HDR_FLAG_MULTI 0x20
|
||||
|
||||
struct ompi_osc_rdma_base_header_t {
|
||||
uint8_t hdr_type;
|
||||
|
Загрузка…
Ссылка в новой задаче
Block a user