1
1
openmpi/ompi/mca/osc/rdma/osc_rdma_request.h
Nathan Hjelm 45da311473 osc/rdma: fix hang when performing large unaligned gets
This commit adds code to handle large unaligned gets. There are two
possible code paths for these transactions:

 1) The remote region and local region have the same alignment. In
 this case the get will be broken down into at most three get
 transactions: 1 transaction to get the unaligned start of the region
 (buffered), 1 transaction to get the aligned portion of the region,
 and 1 transaction to get the end of the region.

 2) The remote and local regions do not have the same alignment. This
 should be an uncommon case and is not optimized. In this case a
 buffer is allocated and registered locally to hold the aligned data
 from the remote region. There may be cases where this fails (low
 memory, can't register memory). Those conditions are unlikely and
 will be handled later.

Signed-off-by: Nathan Hjelm <hjelmn@lanl.gov>
2016-01-22 21:06:46 -07:00

112 строки
3.9 KiB
C

/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
/*
* Copyright (c) 2012 Sandia National Laboratories. All rights reserved.
* Copyright (c) 2014-2015 Los Alamos National Security, LLC. All rights
* reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#ifndef OMPI_OSC_RDMA_REQUEST_H
#define OMPI_OSC_RDMA_REQUEST_H
#include "osc_rdma.h"
enum ompi_osc_rdma_request_type_t {
OMPI_OSC_RDMA_TYPE_GET,
OMPI_OSC_RDMA_TYPE_PUT,
OMPI_OSC_RDMA_TYPE_RDMA,
OMPI_OSC_RDMA_TYPE_ACC,
OMPI_OSC_RDMA_TYPE_GET_ACC,
OMPI_OSC_RDMA_TYPE_CSWAP,
};
typedef enum ompi_osc_rdma_request_type_t ompi_osc_rdma_request_type_t;
struct ompi_osc_rdma_request_t {
ompi_request_t super;
ompi_osc_rdma_peer_t *peer;
ompi_osc_rdma_request_type_t type;
void *origin_addr;
int origin_count;
struct ompi_datatype_t *origin_dt;
void *result_addr;
int result_count;
struct ompi_datatype_t *result_dt;
const void *compare_addr;
ompi_op_t *op;
ompi_osc_rdma_module_t *module;
int32_t outstanding_requests;
bool internal;
ptrdiff_t offset;
size_t len;
void *ctx;
void *frag;
uint64_t target_address;
struct ompi_osc_rdma_request_t *parent_request;
/* used for non-contiguous get accumulate operations */
opal_convertor_t convertor;
/** synchronization object */
struct ompi_osc_rdma_sync_t *sync;
void *buffer;
};
typedef struct ompi_osc_rdma_request_t ompi_osc_rdma_request_t;
OBJ_CLASS_DECLARATION(ompi_osc_rdma_request_t);
/* REQUEST_ALLOC is only called from "top-level" functions (rdma_rput,
rdma_rget, etc.), so it's ok to spin here... */
#define OMPI_OSC_RDMA_REQUEST_ALLOC(rmodule, rpeer, req) \
do { \
opal_free_list_item_t *item; \
do { \
item = opal_free_list_get (&mca_osc_rdma_component.requests); \
if (NULL == item) { \
ompi_osc_rdma_progress (rmodule); \
} \
} while (NULL == item); \
req = (ompi_osc_rdma_request_t*) item; \
OMPI_REQUEST_INIT(&req->super, false); \
req->super.req_mpi_object.win = module->win; \
req->super.req_state = OMPI_REQUEST_ACTIVE; \
req->module = rmodule; \
req->peer = (rpeer); \
} while (0)
#define OMPI_OSC_RDMA_REQUEST_RETURN(req) \
do { \
OMPI_REQUEST_FINI(&(req)->super); \
free ((req)->buffer); \
(req)->buffer = NULL; \
(req)->parent_request = NULL; \
(req)->internal = false; \
(req)->outstanding_requests = 0; \
opal_free_list_return (&mca_osc_rdma_component.requests, \
(opal_free_list_item_t *) (req)); \
} while (0)
static inline void ompi_osc_rdma_request_complete (ompi_osc_rdma_request_t *request, int mpi_error)
{
if (!request->internal) {
request->super.req_status.MPI_ERROR = mpi_error;
/* mark the request complete at the mpi level */
ompi_request_complete (&request->super, true);
} else {
OMPI_OSC_RDMA_REQUEST_RETURN (request);
}
}
#endif /* OMPI_OSC_RDMA_REQUEST_H */