1
1

Fix for fix of fix for handling misalignment when sending

onesided multifrag.

This fixes trac:2532.

This commit was SVN r23760.

The following Trac tickets were found above:
  Ticket 2532 --> https://svn.open-mpi.org/trac/ompi/ticket/2532
Этот коммит содержится в:
Rolf vandeVaart 2010-09-16 18:58:11 +00:00
родитель 8052c9dd46
Коммит 91c1ee86d7
3 изменённых файлов: 30 добавлений и 19 удалений

Просмотреть файл

@ -921,10 +921,13 @@ component_fragment_cb(struct mca_btl_base_module_t *btl,
} }
if ((base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI) != 0) { if ((base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI) != 0) {
/* The next header starts at the next aligned address in
/* The next header starts at the next aligned address in the * the buffer. Therefore, check the hdr_flags to see if
* buffer. Therefore, bump pointer forward if necessary. */ * any extra alignment is necessary, and if so, pull value
payload = (char *)payload + OPAL_ALIGN_PAD_AMOUNT(payload, sizeof(void*)); * from the flags. */
if (base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK) {
payload = (char *)payload + (base_header->hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK);
}
base_header = (ompi_osc_rdma_base_header_t*) payload; base_header = (ompi_osc_rdma_base_header_t*) payload;
} else { } else {
done = true; done = true;

Просмотреть файл

@ -362,16 +362,15 @@ ompi_osc_rdma_sendreq_send_cb(struct mca_btl_base_module_t* btl,
if (0 == (header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI)) { if (0 == (header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_MULTI)) {
done = true; done = true;
} else { } else {
/* Find starting point for next header. Note that the last part
* added in to compute the starting point for the next header is
* extra padding that may have been inserted. */
header = (ompi_osc_rdma_send_header_t*) header = (ompi_osc_rdma_send_header_t*)
(((char*) header) + (((char*) header) +
sizeof(ompi_osc_rdma_send_header_t) + sizeof(ompi_osc_rdma_send_header_t) +
ompi_datatype_pack_description_length(sendreq->req_target_datatype) + ompi_datatype_pack_description_length(sendreq->req_target_datatype) +
header->hdr_msg_length); header->hdr_msg_length +
(header->hdr_base.hdr_flags & OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK));
/* The next header starts at the next aligned address in the
* buffer. Therefore, bump pointer forward if necessary. */
header = (ompi_osc_rdma_send_header_t*)((char*)header +
OPAL_ALIGN_PAD_AMOUNT(header, sizeof(void*)));
if (header->hdr_base.hdr_type == OMPI_OSC_RDMA_HDR_MULTI_END) { if (header->hdr_base.hdr_type == OMPI_OSC_RDMA_HDR_MULTI_END) {
done = true; done = true;
@ -574,14 +573,21 @@ ompi_osc_rdma_sendreq_send(ompi_osc_rdma_module_t *module,
* pointer addresses. Therefore, the pointer, amount written * pointer addresses. Therefore, the pointer, amount written
* and space remaining are adjusted forward so that the * and space remaining are adjusted forward so that the
* starting position for the next message is aligned properly. * starting position for the next message is aligned properly.
* This strict alignment is required by certain platforms like * The amount of this alignment is embedded in the hdr_flags
* SPARC. Without it, bus errors can occur. Keeping things * field so the callback completion and receiving side can
* aligned also may offer some performance improvements on * also know how much to move the pointer to find the starting
* other platforms. */ * point of the next header. This strict alignment is
* required by certain platforms like SPARC. Without it,
* bus errors can occur. Keeping things aligned also may
* offer some performance improvements on other platforms.
*/
offset = OPAL_ALIGN_PAD_AMOUNT(descriptor->des_src[0].seg_len, sizeof(void*)); offset = OPAL_ALIGN_PAD_AMOUNT(descriptor->des_src[0].seg_len, sizeof(void*));
descriptor->des_src[0].seg_len += offset; if (0 != offset) {
written_data += offset; header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK & offset;
module->m_pending_buffers[sendreq->req_target_rank].remain_len -= offset; descriptor->des_src[0].seg_len += offset;
written_data += offset;
module->m_pending_buffers[sendreq->req_target_rank].remain_len -= offset;
}
#ifdef WORDS_BIGENDIAN #ifdef WORDS_BIGENDIAN
header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_NBO; header->hdr_base.hdr_flags |= OMPI_OSC_RDMA_HDR_FLAG_NBO;

Просмотреть файл

@ -10,6 +10,7 @@
* Copyright (c) 2007 Los Alamos National Security, LLC. All rights * Copyright (c) 2007 Los Alamos National Security, LLC. All rights
* reserved. * reserved.
* Copyright (c) 2010 Cisco Systems, Inc. All rights reserved. * Copyright (c) 2010 Cisco Systems, Inc. All rights reserved.
* Copyright (c) 2010 Oracle and/or its affiliates. All rights reserved.
* $COPYRIGHT$ * $COPYRIGHT$
* *
* Additional copyrights may follow * Additional copyrights may follow
@ -40,8 +41,9 @@
#define OMPI_OSC_RDMA_HDR_MULTI_END 0x0B #define OMPI_OSC_RDMA_HDR_MULTI_END 0x0B
#define OMPI_OSC_RDMA_HDR_RDMA_INFO 0x0C #define OMPI_OSC_RDMA_HDR_RDMA_INFO 0x0C
#define OMPI_OSC_RDMA_HDR_FLAG_NBO 0x01 #define OMPI_OSC_RDMA_HDR_FLAG_ALIGN_MASK 0x0F
#define OMPI_OSC_RDMA_HDR_FLAG_MULTI 0x02 #define OMPI_OSC_RDMA_HDR_FLAG_NBO 0x10
#define OMPI_OSC_RDMA_HDR_FLAG_MULTI 0x20
struct ompi_osc_rdma_base_header_t { struct ompi_osc_rdma_base_header_t {
uint8_t hdr_type; uint8_t hdr_type;