539 строки
20 KiB
C
539 строки
20 KiB
C
|
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
|
||
|
/*
|
||
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
||
|
* University Research and Technology
|
||
|
* Corporation. All rights reserved.
|
||
|
* Copyright (c) 2004-2005 The University of Tennessee and The University
|
||
|
* of Tennessee Research Foundation. All rights
|
||
|
* reserved.
|
||
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
||
|
* University of Stuttgart. All rights reserved.
|
||
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
||
|
* All rights reserved.
|
||
|
* Copyright (c) 2009 IBM Corporation. All rights reserved.
|
||
|
* Copyright (c) 2012-2015 Los Alamos National Security, LLC. All rights
|
||
|
* reserved.
|
||
|
* $COPYRIGHT$
|
||
|
*
|
||
|
* Additional copyrights may follow
|
||
|
*
|
||
|
* $HEADER$
|
||
|
*/
|
||
|
/**
|
||
|
* @file
|
||
|
*/
|
||
|
#ifndef MCA_PML_OB1_HEADER_H
|
||
|
#define MCA_PML_OB1_HEADER_H
|
||
|
|
||
|
#include "ompi_config.h"
|
||
|
#ifdef HAVE_SYS_TYPES_H
|
||
|
#include <sys/types.h>
|
||
|
#endif
|
||
|
#ifdef HAVE_NETINET_IN_H
|
||
|
#include <netinet/in.h>
|
||
|
#endif
|
||
|
|
||
|
#include "opal/types.h"
|
||
|
#include "opal/util/arch.h"
|
||
|
#include "opal/mca/btl/btl.h"
|
||
|
#include "ompi/proc/proc.h"
|
||
|
|
||
|
#define MCA_PML_OB1_HDR_TYPE_MATCH (MCA_BTL_TAG_PML + 1)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_RNDV (MCA_BTL_TAG_PML + 2)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_RGET (MCA_BTL_TAG_PML + 3)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_ACK (MCA_BTL_TAG_PML + 4)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_NACK (MCA_BTL_TAG_PML + 5)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_FRAG (MCA_BTL_TAG_PML + 6)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_GET (MCA_BTL_TAG_PML + 7)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_PUT (MCA_BTL_TAG_PML + 8)
|
||
|
#define MCA_PML_OB1_HDR_TYPE_FIN (MCA_BTL_TAG_PML + 9)
|
||
|
|
||
|
#define MCA_PML_OB1_HDR_FLAGS_ACK 1 /* is an ack required */
|
||
|
#define MCA_PML_OB1_HDR_FLAGS_NBO 2 /* is the hdr in network byte order */
|
||
|
#define MCA_PML_OB1_HDR_FLAGS_PIN 4 /* is user buffer pinned */
|
||
|
#define MCA_PML_OB1_HDR_FLAGS_CONTIG 8 /* is user buffer contiguous */
|
||
|
#define MCA_PML_OB1_HDR_FLAGS_NORDMA 16 /* rest will be send by copy-in-out */
|
||
|
#define MCA_PML_OB1_HDR_FLAGS_SIGNAL 32 /* message can be optionally signalling */
|
||
|
|
||
|
/**
|
||
|
* Common hdr attributes - must be first element in each hdr type
|
||
|
*/
|
||
|
struct mca_pml_ob1_common_hdr_t {
|
||
|
uint8_t hdr_type; /**< type of envelope */
|
||
|
uint8_t hdr_flags; /**< flags indicating how fragment should be processed */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_common_hdr_t mca_pml_ob1_common_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_common_hdr_prepare (mca_pml_ob1_common_hdr_t *hdr, uint8_t hdr_type,
|
||
|
uint8_t hdr_flags)
|
||
|
{
|
||
|
hdr->hdr_type = hdr_type;
|
||
|
hdr->hdr_flags = hdr_flags;
|
||
|
}
|
||
|
|
||
|
#define MCA_PML_OB1_COMMON_HDR_NTOH(h)
|
||
|
#define MCA_PML_OB1_COMMON_HDR_HTON(h)
|
||
|
|
||
|
/**
|
||
|
* Header definition for the first fragment, contains the
|
||
|
* attributes required to match the corresponding posted receive.
|
||
|
*/
|
||
|
struct mca_pml_ob1_match_hdr_t {
|
||
|
mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */
|
||
|
uint16_t hdr_ctx; /**< communicator index */
|
||
|
int32_t hdr_src; /**< source rank */
|
||
|
int32_t hdr_tag; /**< user tag */
|
||
|
uint16_t hdr_seq; /**< message sequence number */
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
uint8_t hdr_padding[2]; /**< explicitly pad to 16 bytes. Compilers seem to already prefer to do this, but make it explicit just in case */
|
||
|
#endif
|
||
|
};
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
#define OMPI_PML_OB1_MATCH_HDR_LEN 16
|
||
|
#else
|
||
|
#define OMPI_PML_OB1_MATCH_HDR_LEN 14
|
||
|
#endif
|
||
|
|
||
|
typedef struct mca_pml_ob1_match_hdr_t mca_pml_ob1_match_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_match_hdr_prepare (mca_pml_ob1_match_hdr_t *hdr, uint8_t hdr_type, uint8_t hdr_flags,
|
||
|
uint16_t hdr_ctx, int32_t hdr_src, int32_t hdr_tag, uint16_t hdr_seq)
|
||
|
{
|
||
|
mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, hdr_type, hdr_flags);
|
||
|
hdr->hdr_ctx = hdr_ctx;
|
||
|
hdr->hdr_src = hdr_src;
|
||
|
hdr->hdr_tag = hdr_tag;
|
||
|
hdr->hdr_seq = hdr_seq;
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT && OPAL_ENABLE_DEBUG
|
||
|
hdr->hdr_padding[0] = 0;
|
||
|
hdr->hdr_padding[1] = 0;
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
#define MCA_PML_OB1_MATCH_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \
|
||
|
(h).hdr_ctx = ntohs((h).hdr_ctx); \
|
||
|
(h).hdr_src = ntohl((h).hdr_src); \
|
||
|
(h).hdr_tag = ntohl((h).hdr_tag); \
|
||
|
(h).hdr_seq = ntohs((h).hdr_seq); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_MATCH_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \
|
||
|
(h).hdr_ctx = htons((h).hdr_ctx); \
|
||
|
(h).hdr_src = htonl((h).hdr_src); \
|
||
|
(h).hdr_tag = htonl((h).hdr_tag); \
|
||
|
(h).hdr_seq = htons((h).hdr_seq); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Header definition for the first fragment when an acknowledgment
|
||
|
* is required. This could be the first fragment of a large message
|
||
|
* or a short message that requires an ack (synchronous).
|
||
|
*/
|
||
|
struct mca_pml_ob1_rendezvous_hdr_t {
|
||
|
mca_pml_ob1_match_hdr_t hdr_match;
|
||
|
uint64_t hdr_msg_length; /**< message length */
|
||
|
opal_ptr_t hdr_src_req; /**< pointer to source request - returned in ack */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_rendezvous_hdr_t mca_pml_ob1_rendezvous_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_rendezvous_hdr_prepare (mca_pml_ob1_rendezvous_hdr_t *hdr, uint8_t hdr_type, uint8_t hdr_flags,
|
||
|
uint16_t hdr_ctx, int32_t hdr_src, int32_t hdr_tag, uint16_t hdr_seq,
|
||
|
uint64_t hdr_msg_length, void *hdr_src_req)
|
||
|
{
|
||
|
mca_pml_ob1_match_hdr_prepare (&hdr->hdr_match, hdr_type, hdr_flags, hdr_ctx, hdr_src, hdr_tag, hdr_seq);
|
||
|
hdr->hdr_msg_length = hdr_msg_length;
|
||
|
hdr->hdr_src_req.pval = hdr_src_req;
|
||
|
}
|
||
|
|
||
|
/* Note that hdr_src_req is not put in network byte order because it
|
||
|
is never processed by the receiver, other than being copied into
|
||
|
the ack header */
|
||
|
#define MCA_PML_OB1_RNDV_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_MATCH_HDR_NTOH((h).hdr_match); \
|
||
|
(h).hdr_msg_length = ntoh64((h).hdr_msg_length); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_RNDV_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_MATCH_HDR_HTON((h).hdr_match); \
|
||
|
(h).hdr_msg_length = hton64((h).hdr_msg_length); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Header definition for a combined rdma rendezvous/get
|
||
|
*/
|
||
|
struct mca_pml_ob1_rget_hdr_t {
|
||
|
mca_pml_ob1_rendezvous_hdr_t hdr_rndv;
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
uint8_t hdr_padding[4];
|
||
|
#endif
|
||
|
opal_ptr_t hdr_frag; /**< source fragment (for fin) */
|
||
|
uint64_t hdr_src_ptr; /**< source pointer */
|
||
|
/* btl registration handle data follows */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_rget_hdr_t mca_pml_ob1_rget_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_rget_hdr_prepare (mca_pml_ob1_rget_hdr_t *hdr, uint8_t hdr_flags,
|
||
|
uint16_t hdr_ctx, int32_t hdr_src, int32_t hdr_tag, uint16_t hdr_seq,
|
||
|
uint64_t hdr_msg_length, void *hdr_src_req, void *hdr_frag,
|
||
|
void *hdr_src_ptr, void *local_handle, size_t local_handle_size)
|
||
|
{
|
||
|
mca_pml_ob1_rendezvous_hdr_prepare (&hdr->hdr_rndv, MCA_PML_OB1_HDR_TYPE_RGET, hdr_flags,
|
||
|
hdr_ctx, hdr_src, hdr_tag, hdr_seq, hdr_msg_length, hdr_src_req);
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT && OPAL_ENABLE_DEBUG
|
||
|
hdr->hdr_padding[0] = 0;
|
||
|
hdr->hdr_padding[1] = 0;
|
||
|
hdr->hdr_padding[2] = 0;
|
||
|
hdr->hdr_padding[3] = 0;
|
||
|
#endif
|
||
|
hdr->hdr_frag.pval = hdr_frag;
|
||
|
hdr->hdr_src_ptr = (uint64_t)(intptr_t) hdr_src_ptr;
|
||
|
|
||
|
/* copy registration handle */
|
||
|
memcpy (hdr + 1, local_handle, local_handle_size);
|
||
|
}
|
||
|
|
||
|
#define MCA_PML_OB1_RGET_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_RNDV_HDR_NTOH((h).hdr_rndv); \
|
||
|
(h).hdr_src_ptr = ntoh64((h).hdr_src_ptr); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_RGET_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_RNDV_HDR_HTON((h).hdr_rndv); \
|
||
|
(h).hdr_src_ptr = hton64((h).hdr_src_ptr); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Header for subsequent fragments.
|
||
|
*/
|
||
|
struct mca_pml_ob1_frag_hdr_t {
|
||
|
mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
uint8_t hdr_padding[6];
|
||
|
#endif
|
||
|
uint64_t hdr_frag_offset; /**< offset into message */
|
||
|
opal_ptr_t hdr_src_req; /**< pointer to source request */
|
||
|
opal_ptr_t hdr_dst_req; /**< pointer to matched receive */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_frag_hdr_t mca_pml_ob1_frag_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_frag_hdr_prepare (mca_pml_ob1_frag_hdr_t *hdr, uint8_t hdr_flags,
|
||
|
uint64_t hdr_frag_offset, void *hdr_src_req,
|
||
|
uint64_t hdr_dst_req)
|
||
|
{
|
||
|
mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_FRAG, hdr_flags);
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT && OPAL_ENABLE_DEBUG
|
||
|
hdr->hdr_padding[0] = 0;
|
||
|
hdr->hdr_padding[1] = 0;
|
||
|
hdr->hdr_padding[2] = 0;
|
||
|
hdr->hdr_padding[3] = 0;
|
||
|
hdr->hdr_padding[4] = 0;
|
||
|
hdr->hdr_padding[5] = 0;
|
||
|
#endif
|
||
|
hdr->hdr_frag_offset = hdr_frag_offset;
|
||
|
hdr->hdr_src_req.pval = hdr_src_req;
|
||
|
hdr->hdr_dst_req.lval = hdr_dst_req;
|
||
|
}
|
||
|
|
||
|
#define MCA_PML_OB1_FRAG_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \
|
||
|
(h).hdr_frag_offset = ntoh64((h).hdr_frag_offset); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_FRAG_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \
|
||
|
(h).hdr_frag_offset = hton64((h).hdr_frag_offset); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Header used to acknowledgment outstanding fragment(s).
|
||
|
*/
|
||
|
|
||
|
struct mca_pml_ob1_ack_hdr_t {
|
||
|
mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
uint8_t hdr_padding[6];
|
||
|
#endif
|
||
|
opal_ptr_t hdr_src_req; /**< source request */
|
||
|
opal_ptr_t hdr_dst_req; /**< matched receive request */
|
||
|
uint64_t hdr_send_offset; /**< starting point of copy in/out */
|
||
|
uint64_t hdr_send_size; /**< number of bytes requested (0: all remaining) */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_ack_hdr_t mca_pml_ob1_ack_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_ack_hdr_prepare (mca_pml_ob1_ack_hdr_t *hdr, uint8_t hdr_flags,
|
||
|
uint64_t hdr_src_req, void *hdr_dst_req,
|
||
|
uint64_t hdr_send_offset, uint64_t hdr_send_size)
|
||
|
{
|
||
|
mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_ACK, hdr_flags);
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT && OPAL_ENABLE_DEBUG
|
||
|
hdr->hdr_padding[0] = 0;
|
||
|
hdr->hdr_padding[1] = 0;
|
||
|
hdr->hdr_padding[2] = 0;
|
||
|
hdr->hdr_padding[3] = 0;
|
||
|
hdr->hdr_padding[4] = 0;
|
||
|
hdr->hdr_padding[5] = 0;
|
||
|
#endif
|
||
|
hdr->hdr_src_req.lval = hdr_src_req;
|
||
|
hdr->hdr_dst_req.pval = hdr_dst_req;
|
||
|
hdr->hdr_send_offset = hdr_send_offset;
|
||
|
hdr->hdr_send_size = hdr_send_size;
|
||
|
}
|
||
|
|
||
|
/* Note that the request headers are not put in NBO because the
|
||
|
src_req is already in receiver's byte order and the dst_req is not
|
||
|
used by the receiver for anything other than backpointers in return
|
||
|
headers */
|
||
|
#define MCA_PML_OB1_ACK_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \
|
||
|
(h).hdr_send_offset = ntoh64((h).hdr_send_offset); \
|
||
|
(h).hdr_send_size = ntoh64((h).hdr_send_size); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_ACK_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \
|
||
|
(h).hdr_send_offset = hton64((h).hdr_send_offset); \
|
||
|
(h).hdr_send_size = hton64((h).hdr_send_size); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Header used to initiate an RDMA operation.
|
||
|
*/
|
||
|
|
||
|
struct mca_pml_ob1_rdma_hdr_t {
|
||
|
mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
uint8_t hdr_padding[2]; /** two to pad out the hdr to a 4 byte alignment. hdr_req will then be 8 byte aligned after 4 for hdr_seg_cnt */
|
||
|
#endif
|
||
|
/* TODO: add real support for multiple destination segments */
|
||
|
opal_ptr_t hdr_req; /**< destination request */
|
||
|
opal_ptr_t hdr_frag; /**< receiver fragment */
|
||
|
opal_ptr_t hdr_recv_req; /**< receive request (NTH: needed for put fallback on send) */
|
||
|
uint64_t hdr_rdma_offset; /**< current offset into user buffer */
|
||
|
uint64_t hdr_dst_ptr; /**< destination address */
|
||
|
uint64_t hdr_dst_size; /**< destination size */
|
||
|
/* registration data follows */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_rdma_hdr_t mca_pml_ob1_rdma_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_rdma_hdr_prepare (mca_pml_ob1_rdma_hdr_t *hdr, uint8_t hdr_flags,
|
||
|
uint64_t hdr_req, void *hdr_frag, void *hdr_recv_req,
|
||
|
uint64_t hdr_rdma_offset, void *hdr_dst_ptr,
|
||
|
uint64_t hdr_dst_size, void *local_handle,
|
||
|
size_t local_handle_size)
|
||
|
{
|
||
|
mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_PUT, hdr_flags);
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT && OPAL_ENABLE_DEBUG
|
||
|
hdr->hdr_padding[0] = 0;
|
||
|
hdr->hdr_padding[1] = 0;
|
||
|
#endif
|
||
|
hdr->hdr_req.lval = hdr_req;
|
||
|
hdr->hdr_frag.pval = hdr_frag;
|
||
|
hdr->hdr_recv_req.pval = hdr_recv_req;
|
||
|
hdr->hdr_rdma_offset = hdr_rdma_offset;
|
||
|
hdr->hdr_dst_ptr = (uint64_t)(intptr_t) hdr_dst_ptr;
|
||
|
hdr->hdr_dst_size = hdr_dst_size;
|
||
|
|
||
|
/* copy segments */
|
||
|
memcpy (hdr + 1, local_handle, local_handle_size);
|
||
|
}
|
||
|
|
||
|
#define MCA_PML_OB1_RDMA_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \
|
||
|
(h).hdr_rdma_offset = ntoh64((h).hdr_rdma_offset); \
|
||
|
(h).hdr_dst_ptr = ntoh64((h).hdr_dst_ptr); \
|
||
|
(h).hdr_dst_size = ntoh64((h).hdr_dst_size); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_RDMA_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \
|
||
|
(h).hdr_rdma_offset = hton64((h).hdr_rdma_offset); \
|
||
|
(h).hdr_dst_ptr = hton64((h).hdr_dst_ptr); \
|
||
|
(h).hdr_dst_size = hton64((h).hdr_dst_size); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Header used to complete an RDMA operation.
|
||
|
*/
|
||
|
|
||
|
struct mca_pml_ob1_fin_hdr_t {
|
||
|
mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
uint8_t hdr_padding[2];
|
||
|
#endif
|
||
|
int64_t hdr_size; /**< number of bytes completed (positive), error code (negative) */
|
||
|
opal_ptr_t hdr_frag; /**< completed RDMA fragment */
|
||
|
};
|
||
|
typedef struct mca_pml_ob1_fin_hdr_t mca_pml_ob1_fin_hdr_t;
|
||
|
|
||
|
static inline void mca_pml_ob1_fin_hdr_prepare (mca_pml_ob1_fin_hdr_t *hdr, uint8_t hdr_flags,
|
||
|
uint64_t hdr_frag, int64_t hdr_size)
|
||
|
{
|
||
|
mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_FIN, hdr_flags);
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT && OPAL_ENABLE_DEBUG
|
||
|
hdr->hdr_padding[0] = 0;
|
||
|
hdr->hdr_padding[1] = 0;
|
||
|
#endif
|
||
|
hdr->hdr_frag.lval = hdr_frag;
|
||
|
hdr->hdr_size = hdr_size;
|
||
|
}
|
||
|
|
||
|
#define MCA_PML_OB1_FIN_HDR_NTOH(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \
|
||
|
(h).hdr_size = ntoh64((h).hdr_size); \
|
||
|
} while (0)
|
||
|
|
||
|
#define MCA_PML_OB1_FIN_HDR_HTON(h) \
|
||
|
do { \
|
||
|
MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \
|
||
|
(h).hdr_size = hton64((h).hdr_size); \
|
||
|
} while (0)
|
||
|
|
||
|
/**
|
||
|
* Union of defined hdr types.
|
||
|
*/
|
||
|
union mca_pml_ob1_hdr_t {
|
||
|
mca_pml_ob1_common_hdr_t hdr_common;
|
||
|
mca_pml_ob1_match_hdr_t hdr_match;
|
||
|
mca_pml_ob1_rendezvous_hdr_t hdr_rndv;
|
||
|
mca_pml_ob1_rget_hdr_t hdr_rget;
|
||
|
mca_pml_ob1_frag_hdr_t hdr_frag;
|
||
|
mca_pml_ob1_ack_hdr_t hdr_ack;
|
||
|
mca_pml_ob1_rdma_hdr_t hdr_rdma;
|
||
|
mca_pml_ob1_fin_hdr_t hdr_fin;
|
||
|
};
|
||
|
typedef union mca_pml_ob1_hdr_t mca_pml_ob1_hdr_t;
|
||
|
|
||
|
#if !defined(WORDS_BIGENDIAN) && OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
static inline __opal_attribute_always_inline__ void
|
||
|
ob1_hdr_ntoh(mca_pml_ob1_hdr_t *hdr, const uint8_t hdr_type)
|
||
|
{
|
||
|
if(!(hdr->hdr_common.hdr_flags & MCA_PML_OB1_HDR_FLAGS_NBO))
|
||
|
return;
|
||
|
|
||
|
switch(hdr_type) {
|
||
|
case MCA_PML_OB1_HDR_TYPE_MATCH:
|
||
|
MCA_PML_OB1_MATCH_HDR_NTOH(hdr->hdr_match);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_RNDV:
|
||
|
MCA_PML_OB1_RNDV_HDR_NTOH(hdr->hdr_rndv);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_RGET:
|
||
|
MCA_PML_OB1_RGET_HDR_NTOH(hdr->hdr_rget);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_ACK:
|
||
|
MCA_PML_OB1_ACK_HDR_NTOH(hdr->hdr_ack);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_FRAG:
|
||
|
MCA_PML_OB1_FRAG_HDR_NTOH(hdr->hdr_frag);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_PUT:
|
||
|
MCA_PML_OB1_RDMA_HDR_NTOH(hdr->hdr_rdma);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_FIN:
|
||
|
MCA_PML_OB1_FIN_HDR_NTOH(hdr->hdr_fin);
|
||
|
break;
|
||
|
default:
|
||
|
assert(0);
|
||
|
break;
|
||
|
}
|
||
|
}
|
||
|
#else
|
||
|
#define ob1_hdr_ntoh(h, t) do{}while(0)
|
||
|
#endif
|
||
|
|
||
|
#if OPAL_ENABLE_HETEROGENEOUS_SUPPORT
|
||
|
#define ob1_hdr_hton(h, t, p) \
|
||
|
ob1_hdr_hton_intr((mca_pml_ob1_hdr_t*)h, t, p)
|
||
|
static inline __opal_attribute_always_inline__ void
|
||
|
ob1_hdr_hton_intr(mca_pml_ob1_hdr_t *hdr, const uint8_t hdr_type,
|
||
|
const ompi_proc_t *proc)
|
||
|
{
|
||
|
#ifdef WORDS_BIGENDIAN
|
||
|
hdr->hdr_common.hdr_flags |= MCA_PML_OB1_HDR_FLAGS_NBO;
|
||
|
#else
|
||
|
|
||
|
if(!(proc->super.proc_arch & OPAL_ARCH_ISBIGENDIAN))
|
||
|
return;
|
||
|
|
||
|
hdr->hdr_common.hdr_flags |= MCA_PML_OB1_HDR_FLAGS_NBO;
|
||
|
switch(hdr_type) {
|
||
|
case MCA_PML_OB1_HDR_TYPE_MATCH:
|
||
|
MCA_PML_OB1_MATCH_HDR_HTON(hdr->hdr_match);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_RNDV:
|
||
|
MCA_PML_OB1_RNDV_HDR_HTON(hdr->hdr_rndv);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_RGET:
|
||
|
MCA_PML_OB1_RGET_HDR_HTON(hdr->hdr_rget);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_ACK:
|
||
|
MCA_PML_OB1_ACK_HDR_HTON(hdr->hdr_ack);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_FRAG:
|
||
|
MCA_PML_OB1_FRAG_HDR_HTON(hdr->hdr_frag);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_PUT:
|
||
|
MCA_PML_OB1_RDMA_HDR_HTON(hdr->hdr_rdma);
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_FIN:
|
||
|
MCA_PML_OB1_FIN_HDR_HTON(hdr->hdr_fin);
|
||
|
break;
|
||
|
default:
|
||
|
assert(0);
|
||
|
break;
|
||
|
}
|
||
|
#endif
|
||
|
}
|
||
|
#else
|
||
|
#define ob1_hdr_hton(h, t, p) do{}while(0)
|
||
|
#endif
|
||
|
|
||
|
static inline __opal_attribute_always_inline__ void
|
||
|
ob1_hdr_copy(mca_pml_ob1_hdr_t *src, mca_pml_ob1_hdr_t *dst)
|
||
|
{
|
||
|
switch(src->hdr_common.hdr_type) {
|
||
|
case MCA_PML_OB1_HDR_TYPE_MATCH:
|
||
|
memcpy( &(dst->hdr_match), &(src->hdr_match), sizeof(mca_pml_ob1_match_hdr_t) );
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_RNDV:
|
||
|
memcpy( &(dst->hdr_rndv), &(src->hdr_rndv), sizeof(mca_pml_ob1_rendezvous_hdr_t) );
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_RGET:
|
||
|
memcpy( &(dst->hdr_rget), &(src->hdr_rget), sizeof(mca_pml_ob1_rget_hdr_t) );
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_ACK:
|
||
|
memcpy( &(dst->hdr_ack), &(src->hdr_ack), sizeof(mca_pml_ob1_ack_hdr_t) );
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_FRAG:
|
||
|
memcpy( &(dst->hdr_frag), &(src->hdr_frag), sizeof(mca_pml_ob1_frag_hdr_t) );
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_PUT:
|
||
|
memcpy( &(dst->hdr_rdma), &(src->hdr_rdma), sizeof(mca_pml_ob1_rdma_hdr_t) );
|
||
|
break;
|
||
|
case MCA_PML_OB1_HDR_TYPE_FIN:
|
||
|
memcpy( &(dst->hdr_fin), &(src->hdr_fin), sizeof(mca_pml_ob1_fin_hdr_t) );
|
||
|
break;
|
||
|
default:
|
||
|
memcpy( &(dst->hdr_common), &(src->hdr_common), sizeof(mca_pml_ob1_common_hdr_t) );
|
||
|
break;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
#endif /* MCA_PML_OB1_HEADER_H */
|
||
|
|