Fix for fix of fix for handling misalignment when sending
onesided multifrag. This fixes trac:2532. This commit was SVN r23760. The following Trac tickets were found above: Ticket 2532 --> https://svn.open-mpi.org/trac/ompi/ticket/2532
Этот коммит содержится в:
родитель
8052c9dd46
Коммит
91c1ee86d7
@ -921,10 +921,13 @@ component_fragment_cb(struct mca_btl_base_module_t *btl,
|
|||||||
}
|
}
|
||||||
|
|
||||||
if ((base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI) != 0) {
|
if ((base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI) != 0) {
|
||||||
|
/* The next header starts at the next aligned address in
|
||||||
/* The next header starts at the next aligned address in the
|
* the buffer. Therefore, check the hdr_flags to see if
|
||||||
* buffer. Therefore, bump pointer forward if necessary. */
|
* any extra alignment is necessary, and if so, pull value
|
||||||
payload = (char *)payload + OPAL_ALIGN_PAD_AMOUNT(payload, sizeof(void*));
|
* from the flags. */
|
||||||
|
if (base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK) {
|
||||||
|
payload = (char *)payload + (base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK);
|
||||||
|
}
|
||||||
base_header = (ompi_osc_rdma_base_header_t*) payload;
|
base_header = (ompi_osc_rdma_base_header_t*) payload;
|
||||||
} else {
|
} else {
|
||||||
done = true;
|
done = true;
|
||||||
|
@ -362,16 +362,15 @@ ompi_osc_rdma_sendreq_send_cb(struct mca_btl_base_module_t* btl,
|
|||||||
if (0 == (header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI)) {
|
if (0 == (header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI)) {
|
||||||
done = true;
|
done = true;
|
||||||
} else {
|
} else {
|
||||||
|
/* Find starting point for next header. Note that the last part
|
||||||
|
* added in to compute the starting point for the next header is
|
||||||
|
* extra padding that may have been inserted. */
|
||||||
header = (ompi_osc_rdma_send_header_t*)
|
header = (ompi_osc_rdma_send_header_t*)
|
||||||
(((char*) header) +
|
(((char*) header) +
|
||||||
sizeof(ompi_osc_rdma_send_header_t) +
|
sizeof(ompi_osc_rdma_send_header_t) +
|
||||||
ompi_datatype_pack_description_length(sendreq->req_target_datatype) +
|
ompi_datatype_pack_description_length(sendreq->req_target_datatype) +
|
||||||
header->hdr_msg_length);
|
header->hdr_msg_length +
|
||||||
|
(header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK));
|
||||||
/* The next header starts at the next aligned address in the
|
|
||||||
* buffer. Therefore, bump pointer forward if necessary. */
|
|
||||||
header = (ompi_osc_rdma_send_header_t*)((char*)header +
|
|
||||||
OPAL_ALIGN_PAD_AMOUNT(header, sizeof(void*)));
|
|
||||||
|
|
||||||
if (header->hdr_base.hdr_type == OMPI_OSC_RDMA_HDR_MULTI_END) {
|
if (header->hdr_base.hdr_type == OMPI_OSC_RDMA_HDR_MULTI_END) {
|
||||||
done = true;
|
done = true;
|
||||||
@ -574,14 +573,21 @@ ompi_osc_rdma_sendreq_send(ompi_osc_rdma_module_t *module,
|
|||||||
* pointer addresses. Therefore, the pointer, amount written
|
* pointer addresses. Therefore, the pointer, amount written
|
||||||
* and space remaining are adjusted forward so that the
|
* and space remaining are adjusted forward so that the
|
||||||
* starting position for the next message is aligned properly.
|
* starting position for the next message is aligned properly.
|
||||||
* This strict alignment is required by certain platforms like
|
* The amount of this alignment is embedded in the hdr_flags
|
||||||
* SPARC. Without it, bus errors can occur. Keeping things
|
* field so the callback completion and receiving side can
|
||||||
* aligned also may offer some performance improvements on
|
* also know how much to move the pointer to find the starting
|
||||||
* other platforms. */
|
* point of the next header. This strict alignment is
|
||||||
|
* required by certain platforms like SPARC. Without it,
|
||||||
|
* bus errors can occur. Keeping things aligned also may
|
||||||
|
* offer some performance improvements on other platforms.
|
||||||
|
*/
|
||||||
offset = OPAL_ALIGN_PAD_AMOUNT(descriptor->des_src[0].seg_len, sizeof(void*));
|
offset = OPAL_ALIGN_PAD_AMOUNT(descriptor->des_src[0].seg_len, sizeof(void*));
|
||||||
descriptor->des_src[0].seg_len += offset;
|
if (0 != offset) {
|
||||||
written_data += offset;
|
header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK & offset;
|
||||||
module->m_pending_buffers[sendreq->req_target_rank].remain_len -= offset;
|
descriptor->des_src[0].seg_len += offset;
|
||||||
|
written_data += offset;
|
||||||
|
module->m_pending_buffers[sendreq->req_target_rank].remain_len -= offset;
|
||||||
|
}
|
||||||
|
|
||||||
#ifdef WORDS_BIGENDIAN
|
#ifdef WORDS_BIGENDIAN
|
||||||
header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_NBO;
|
header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_NBO;
|
||||||
|
@ -10,6 +10,7 @@
|
|||||||
* Copyright (c) 2007 Los Alamos National Security, LLC. All rights
|
* Copyright (c) 2007 Los Alamos National Security, LLC. All rights
|
||||||
* reserved.
|
* reserved.
|
||||||
* Copyright (c) 2010 Cisco Systems, Inc. All rights reserved.
|
* Copyright (c) 2010 Cisco Systems, Inc. All rights reserved.
|
||||||
|
* Copyright (c) 2010 Oracle and/or its affiliates. All rights reserved.
|
||||||
* $COPYRIGHT$
|
* $COPYRIGHT$
|
||||||
*
|
*
|
||||||
* Additional copyrights may follow
|
* Additional copyrights may follow
|
||||||
@ -40,8 +41,9 @@
|
|||||||
#define OMPI_OSC_RDMA_HDR_MULTI_END 0x0B
|
#define OMPI_OSC_RDMA_HDR_MULTI_END 0x0B
|
||||||
#define OMPI_OSC_RDMA_HDR_RDMA_INFO 0x0C
|
#define OMPI_OSC_RDMA_HDR_RDMA_INFO 0x0C
|
||||||
|
|
||||||
#define OMPI_OSC_RDMA_HDR_FLAG_NBO 0x01
|
#define OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK 0x0F
|
||||||
#define OMPI_OSC_RDMA_HDR_FLAG_MULTI 0x02
|
#define OMPI_OSC_RDMA_HDR_FLAG_NBO 0x10
|
||||||
|
#define OMPI_OSC_RDMA_HDR_FLAG_MULTI 0x20
|
||||||
|
|
||||||
struct ompi_osc_rdma_base_header_t {
|
struct ompi_osc_rdma_base_header_t {
|
||||||
uint8_t hdr_type;
|
uint8_t hdr_type;
|
||||||
|
Загрузка…
x
Ссылка в новой задаче
Block a user