1
1
openmpi/ompi/request/grequest.c
bosilca b90c83840f Refactor the request completion (#1422)
* Remodel the request.
Added the wait sync primitive and integrate it into the PML and MTL
infrastructure. The multi-threaded requests are now significantly
less heavy and less noisy (only the threads associated with completed
requests are signaled).

* Fix the condition to release the request.
2016-05-24 18:20:51 -05:00

228 строки
7.8 KiB
C

/*
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
* University Research and Technology
* Corporation. All rights reserved.
* Copyright (c) 2004-2016 The University of Tennessee and The University
* of Tennessee Research Foundation. All rights
* reserved.
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2005 The Regents of the University of California.
* All rights reserved.
* Copyright (c) 2006-2012 Cisco Systems, Inc. All rights reserved.
* Copyright (c) 2009 Sun Microsystems, Inc. All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "ompi_config.h"
#include "ompi/communicator/communicator.h"
#include "ompi/request/grequest.h"
#include "ompi/mpi/fortran/base/fint_2_int.h"
/*
 * req_free hook for generalized requests.
 *
 * The semantics are unusual; the long comment in front of
 * ompi_grequest_destruct() has the full story.  In short: this
 * function gives up one reference on the request.  If
 * MPI_GREQUEST_COMPLETE has already given up the other one, the
 * object is really released here.  Otherwise the request is merely
 * "freed" from the caller's point of view, and a later call to
 * MPI_GREQUEST_COMPLETE will release it (!).
 *
 * Note that TEST* and WAIT* will call this function when a request
 * has been completed.
 *
 * On return the caller's handle is MPI_REQUEST_NULL.  Always returns
 * OMPI_SUCCESS.
 */
static int ompi_grequest_free(ompi_request_t **req)
{
    ompi_request_t *victim = *req;

    /* Give up our reference first, then invalidate the caller's handle. */
    OBJ_RELEASE(victim);
    *req = MPI_REQUEST_NULL;

    return OMPI_SUCCESS;
}
/*
 * req_cancel hook for generalized requests.
 *
 * Forwards the cancel to the user-supplied callback, handing it the
 * user state and the current value of REQUEST_COMPLETE() for this
 * request.  The incoming "flag" argument is not consulted.
 *
 * Returns OMPI_SUCCESS when no cancel callback was registered,
 * otherwise the callback's return code (C) or its ierr output
 * converted with OMPI_FINT_2_INT (Fortran).
 */
static int ompi_grequest_cancel(ompi_request_t* req, int flag)
{
    ompi_grequest_t *g = (ompi_grequest_t *) req;
    ompi_fortran_logical_t f_complete;
    MPI_Fint f_err;

    /* The presence test goes through the c_cancel member for both
       languages, exactly as the callback was stored. */
    if (NULL == g->greq_cancel.c_cancel) {
        return OMPI_SUCCESS;
    }

    if (g->greq_funcs_are_c) {
        return g->greq_cancel.c_cancel(g->greq_state,
                                       REQUEST_COMPLETE(&g->greq_base));
    }

    /* Fortran callback: every argument is passed by reference. */
    f_complete = (ompi_fortran_logical_t) REQUEST_COMPLETE(&g->greq_base);
    g->greq_cancel.f_cancel((MPI_Aint *) g->greq_state, &f_complete, &f_err);
    return OMPI_FINT_2_INT(f_err);
}
/*
 * Class constructor: wires the generalized-request hooks into the
 * embedded base request and tags it as a generalized request
 * attached to MPI_COMM_WORLD.
 */
static void ompi_grequest_construct(ompi_grequest_t* greq)
{
    ompi_request_t *base = &greq->greq_base;

    /* Assume C callbacks by default; the F77 MPI API will override
       this value if the gen request was created from Fortran. */
    greq->greq_funcs_are_c = true;

    base->req_type            = OMPI_REQUEST_GEN;
    base->req_mpi_object.comm = &(ompi_mpi_comm_world.comm);
    base->req_free            = ompi_grequest_free;
    base->req_cancel          = ompi_grequest_cancel;
}
/*
* MPI has some weird semantics with respect to generalized requests
* -- different than all other MPI object types. So we move some
* cleanup stuff here to the destructor rather than in
* ompi_grequest_free -- mainly because the cleanup may be required
* in two different places.
*
* Specifically, generalized requests can be completed (and therefore
* released) the following ways:
*
* 1. Call to MPI_GREQUEST_COMPLETE and then a corresponding call to
* some flavor of MPI_TEST* or MPI_WAIT*. This will both complete the
* requests and destroy the corresponding MPI generalized request
* object.
*
* 2. Call MPI_REQUEST_FREE and then (!) -- with some other
* still-valid copy of the handler -- call MPI_GREQUEST_COMPLETE.
*
* 3. Reverse the order of #2 -- call MPI_GREQUEST_COMPLETE and then
* MPI_REQUEST_FREE.
*
* So any one of these functions may actually be the one that
* de-allocates the back-end request object. Hence, this is perfect
* for our reference counting system -- so the call to the gen request
* free_fn() is back here in the destructor, whenever the object is
* actually freed.
*
* Hence, the following must occur before a grequest is freed:
*
* - ompi_grequest_complete() (i.e., GREQUEST_COMPLETE) is invoked
* - ompi_grequest_free() is invoked
*
* Remember that ompi_grequest_free() is invoked by MPI_TEST* and
* MPI_WAIT* when the request was previously marked as complete and
* TEST* / WAIT* notified the user as such (and this function is also
* invoked by REQUEST_FREE). Hence, these two functions will *always*
* be invoked, but the order in which they are invoked is up to the
* user. So this is a perfect opportunity for the OBJ_* reference
* count system. When we create an ompi_grequest_t in
* ompi_grequest_start(), we both OBJ_NEW and OBJ_RETAIN it so that
* its reference count goes to 2. Then in ompi_grequest_complete()
* and ompi_grequest_free(), we OBJ_RELEASE it. Hence, when both of
* them have RELEASEd -- regardless of the order in which the
* functions were invoked -- the destructor is invoked and
* everything is cleaned up (and we invoke the grequest free_fn).
*/
static void ompi_grequest_destruct(ompi_grequest_t* greq)
{
    /* Run the user's free callback, if one was registered.  Its
       result (return value in C, ierr in Fortran) is not examined. */
    if (NULL != greq->greq_free.c_free) {
        if (!greq->greq_funcs_are_c) {
            MPI_Fint unused_ierr;

            greq->greq_free.f_free((MPI_Aint *) greq->greq_state,
                                   &unused_ierr);
        } else {
            greq->greq_free.c_free(greq->greq_state);
        }
    }

    /* Finalize the embedded base request last. */
    OMPI_REQUEST_FINI(&greq->greq_base);
}
/*
 * Class instance for ompi_grequest_t.  Arguments, in order: the class
 * being declared, its parent class (ompi_request_t), and the
 * constructor / destructor defined above in this file.
 */
OBJ_CLASS_INSTANCE(
ompi_grequest_t,
ompi_request_t,
ompi_grequest_construct,
ompi_grequest_destruct);
/*
 * Create a new, active generalized request.
 *
 * gquery_fn / gfree_fn / gcancel_fn are stored as the C flavor of
 * the user callbacks and gstate as the opaque user state handed back
 * to them.  On success *request points at the embedded base request
 * and OMPI_SUCCESS is returned; if the object cannot be allocated,
 * OMPI_ERR_OUT_OF_RESOURCE is returned and *request is left
 * untouched.
 */
int ompi_grequest_start(
    MPI_Grequest_query_function *gquery_fn,
    MPI_Grequest_free_function *gfree_fn,
    MPI_Grequest_cancel_function *gcancel_fn,
    void* gstate,
    ompi_request_t** request)
{
    ompi_request_t *base;
    ompi_grequest_t *g = OBJ_NEW(ompi_grequest_t);

    if (NULL == g) {
        return OMPI_ERR_OUT_OF_RESOURCE;
    }

    /* Take a second reference on purpose: one is dropped by
       ompi_grequest_complete() and one by ompi_grequest_free().  See
       the comment before the destructor for an explanation. */
    OBJ_RETAIN(g);

    /* User callbacks and their state. */
    g->greq_state = gstate;
    g->greq_query.c_query = gquery_fn;
    g->greq_free.c_free = gfree_fn;
    g->greq_cancel.c_cancel = gcancel_fn;

    /* Base request starts out active with an empty status. */
    base = &g->greq_base;
    base->req_state = OMPI_REQUEST_ACTIVE;
    base->req_status = ompi_status_empty;

    *request = base;
    return OMPI_SUCCESS;
}
/*
 * Beware the odd semantics listed in MPI-2:8.2; the comment in front
 * of the grequest destructor explains them.
 *
 * Step one is the ordinary completion path, i.e. a call to
 * ompi_request_complete().  Step two drops the reference this
 * function owns; if the request was already freed via
 * MPI_REQUEST_FREE, that is the last reference and the object is
 * released here.
 *
 * Returns whatever ompi_request_complete() returned.
 */
int ompi_grequest_complete(ompi_request_t *req)
{
    const int status_code = ompi_request_complete(req, true);

    OBJ_RELEASE(req);

    return status_code;
}
/*
 * Grequest queries are invoked in two places:
 *
 * 1. MPI_TEST* / MPI_WAIT*, when requests have completed.
 *
 * 2. MPI_REQUEST_GET_STATUS, when requests may or may not have
 *    completed.
 *
 * Runs the user-supplied query callback (if any) so that it can fill
 * in *status.
 *
 * request: the generalized request whose callback is to be run.
 * status:  status object handed to the callback; it is both read and
 *          written in the Fortran path.
 *
 * Returns OMPI_SUCCESS when no query callback was registered,
 * otherwise the callback's return code (C) or its ierr output
 * converted with OMPI_FINT_2_INT (Fortran).
 */
int ompi_grequest_invoke_query(ompi_request_t *request,
                               ompi_status_public_t *status)
{
    int rc = OMPI_SUCCESS;
    ompi_grequest_t *g = (ompi_grequest_t*) request;

    /* MPI-2:8.2 does not say what to do with the return value from
       the query function (i.e., the int return value from the C
       function or the ierr argument from the Fortran function).
       This function does not act on it: the value is not written
       into the status here, it is only handed back to our caller.
       If the handler wants to pass an error back, it should set it
       in the MPI_ERROR field in the status (which is always kept,
       regardless if the top-level function was invoked with
       MPI_STATUS[ES]_IGNORE or not). */
    if (NULL != g->greq_query.c_query) {
        if (g->greq_funcs_are_c) {
            rc = g->greq_query.c_query(g->greq_state, status);
        } else {
            MPI_Fint ierr;
            MPI_Fint fstatus[sizeof(MPI_Status) / sizeof(int)];

            /* Seed the Fortran status from the current C status.
               Without this, fstatus is uninitialized stack memory,
               and every field the callback does not assign
               (MPI_ERROR in particular) would be copied back into
               *status as garbage by the f2c conversion below. */
            MPI_Status_c2f(status, fstatus);
            g->greq_query.f_query((MPI_Aint*)g->greq_state, fstatus, &ierr);
            MPI_Status_f2c(fstatus, status);
            rc = OMPI_FINT_2_INT(ierr);
        }
    }

    return rc;
}