433f8a7694
receive queues are shared among all PMLs; they are declared in the base PML, and the selected PML is in charge of initializing and releasing them. The CM PML is slightly different compared with OB1 or DR. Internally it uses two different types of requests: light and heavy. However, with this patch both types of requests are now stored in the same queue, and cast appropriately in the allocation macro. This means we might use less memory than we allocate, but in exchange we get full support for most of the parallel debuggers. Another change in this patch is that now, for all PMLs (CM included), the basic PML requests start with the same fields, and they are declared in the same order in the request structure. Moreover, the fields have been moved in such a way that only one volatile/atomic will exist per cache line (hopefully). This commit was SVN r15346.
141 строка
5.3 KiB
C
141 строка
5.3 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2007 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2006 Cisco Systems, Inc. All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "ompi_config.h"
|
|
|
|
#include "pml_ob1.h"
|
|
#include "pml_ob1_recvreq.h"
|
|
#include "pml_ob1_sendreq.h"
|
|
|
|
|
|
/**
 * Start (or restart) a batch of persistent PML requests.
 *
 * Entries that are NULL or whose req_type is not OMPI_REQUEST_PML are
 * skipped.  For every other entry:
 *   - if the PML layer has already completed the request, the existing
 *     request object is reused;
 *   - otherwise the old request is flagged req_free_called and a new
 *     request is created with mca_pml_ob1_isend_init() /
 *     mca_pml_ob1_irecv_init() using the old request's parameters; the
 *     new request replaces requests[i].
 * The resulting request is then started.
 *
 * @param count     number of entries in requests
 * @param requests  array of request pointers; entries may be overwritten
 *                  with newly allocated requests
 *
 * @return OMPI_SUCCESS when every eligible request was started,
 *         OMPI_ERR_REQUEST for an unexpected request state or type, or
 *         the error code reported by the init / send-start step.  On error
 *         the function returns immediately; entries after the failing one
 *         are not processed.
 */
int mca_pml_ob1_start(size_t count, ompi_request_t** requests)
{
    int rc;
    size_t i;

    for(i=0; i<count; i++) {
        mca_pml_base_request_t *pml_request = (mca_pml_base_request_t*)requests[i];
        /* Must be tracked per request: a fresh allocation for an earlier
         * entry must not prevent the convertor reset of a later entry
         * that reuses its original request. */
        bool reuse_old_request = true;

        if(NULL == pml_request) {
            continue;
        }
        if (OMPI_REQUEST_PML != requests[i]->req_type) {
            continue;
        }

        /* If the persistent request is currently active - obtain the
         * request lock and verify the status is incomplete. If the
         * pml layer has not completed the request - mark the request
         * as free called - so that it will be freed when the request
         * completes - and create a new request.
         */

        switch(pml_request->req_ompi.req_state) {
            case OMPI_REQUEST_INACTIVE:
                if(pml_request->req_pml_complete == true)
                    break;
                /* otherwise fall through */
            case OMPI_REQUEST_ACTIVE: {

                ompi_request_t *request;
                OPAL_THREAD_LOCK(&ompi_request_lock);
                if (pml_request->req_pml_complete == false) {
                    /* free request after it completes */
                    pml_request->req_free_called = true;
                } else {
                    /* can reuse the existing request */
                    OPAL_THREAD_UNLOCK(&ompi_request_lock);
                    break;
                }

                reuse_old_request = false;
                /* allocate a new request */
                switch(pml_request->req_type) {
                    case MCA_PML_REQUEST_SEND: {
                         mca_pml_base_send_mode_t sendmode =
                             ((mca_pml_base_send_request_t*)pml_request)->req_send_mode;
                         rc = mca_pml_ob1_isend_init(
                              pml_request->req_addr,
                              pml_request->req_count,
                              pml_request->req_datatype,
                              pml_request->req_peer,
                              pml_request->req_tag,
                              sendmode,
                              pml_request->req_comm,
                              &request);
                         break;
                    }
                    case MCA_PML_REQUEST_RECV:
                         rc = mca_pml_ob1_irecv_init(
                              pml_request->req_addr,
                              pml_request->req_count,
                              pml_request->req_datatype,
                              pml_request->req_peer,
                              pml_request->req_tag,
                              pml_request->req_comm,
                              &request);
                         break;
                    default:
                         rc = OMPI_ERR_REQUEST;
                         break;
                }
                OPAL_THREAD_UNLOCK(&ompi_request_lock);
                if(OMPI_SUCCESS != rc)
                    return rc;
                /* from here on operate on (and hand back) the new request */
                pml_request = (mca_pml_base_request_t*)request;
                requests[i] = request;
                break;
            }
            default:
                return OMPI_ERR_REQUEST;
        }

        /* start the request */
        switch(pml_request->req_type) {
            case MCA_PML_REQUEST_SEND:
            {
                mca_pml_ob1_send_request_t* sendreq = (mca_pml_ob1_send_request_t*)pml_request;
                if( reuse_old_request && (sendreq->req_send.req_bytes_packed != 0) ) {
                    size_t offset = 0;
                    /**
                     * Reset the convertor in case we're dealing with the original
                     * request, which when completed does not reset the convertor.
                     */
                    ompi_convertor_set_position( &sendreq->req_send.req_base.req_convertor,
                                                 &offset );
                }
                MCA_PML_OB1_SEND_REQUEST_START(sendreq, rc);
                if(rc != OMPI_SUCCESS)
                    return rc;
                break;
            }
            case MCA_PML_REQUEST_RECV:
            {
                mca_pml_ob1_recv_request_t* recvreq = (mca_pml_ob1_recv_request_t*)pml_request;
                MCA_PML_OB1_RECV_REQUEST_START(recvreq);
                break;
            }
            default:
                return OMPI_ERR_REQUEST;
        }
    }
    return OMPI_SUCCESS;
}
|
|
|