17f51a0389
Add two new configure options that specify: 1. when to add padding to the openib control header - this *only* happens when the configure option is specified 2. when to use the dr-like checksum as opposed to the memcpy checksum. Not selectable at runtime - to eliminate performance impacts, this is a configure-only option Also removed an unused checksum version from opal/util/crc.h. The new component still needs a little cleanup and some sync with recent ob1 bug fixes. It was created as a separate module to avoid performance hits in ob1 itself, though most of the code is duplicative. The component is only selectable by either specifying it directly, or configuring with the dr-like checksum -and- setting -mca pml_csum_enable_checksum 1. Modify the LANL platform files to take advantage of the new module. This commit was SVN r20846.
143 строки
5.4 KiB
C
143 строки
5.4 KiB
C
/*
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
* University Research and Technology
|
|
* Corporation. All rights reserved.
|
|
* Copyright (c) 2004-2007 The University of Tennessee and The University
|
|
* of Tennessee Research Foundation. All rights
|
|
* reserved.
|
|
* Copyright (c) 2004-2008 High Performance Computing Center Stuttgart,
|
|
* University of Stuttgart. All rights reserved.
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
* All rights reserved.
|
|
* Copyright (c) 2006 Cisco Systems, Inc. All rights reserved.
|
|
* $COPYRIGHT$
|
|
*
|
|
* Additional copyrights may follow
|
|
*
|
|
* $HEADER$
|
|
*/
|
|
|
|
#include "ompi_config.h"
|
|
|
|
#include "pml_csum.h"
|
|
#include "pml_csum_recvreq.h"
|
|
#include "pml_csum_sendreq.h"
|
|
#include "ompi/memchecker.h"
|
|
|
|
|
|
int mca_pml_csum_start(size_t count, ompi_request_t** requests)
|
|
{
|
|
int rc;
|
|
size_t i;
|
|
bool reuse_old_request = true;
|
|
|
|
for(i=0; i<count; i++) {
|
|
mca_pml_base_request_t *pml_request = (mca_pml_base_request_t*)requests[i];
|
|
if(NULL == pml_request) {
|
|
continue;
|
|
}
|
|
if (OMPI_REQUEST_PML != requests[i]->req_type) {
|
|
continue;
|
|
}
|
|
|
|
/* If the persistent request is currently active - obtain the
|
|
* request lock and verify the status is incomplete. if the
|
|
* pml layer has not completed the request - mark the request
|
|
* as free called - so that it will be freed when the request
|
|
* completes - and create a new request.
|
|
*/
|
|
|
|
reuse_old_request = true;
|
|
switch(pml_request->req_ompi.req_state) {
|
|
case OMPI_REQUEST_INACTIVE:
|
|
if(pml_request->req_pml_complete == true)
|
|
break;
|
|
/* otherwise fall through */
|
|
case OMPI_REQUEST_ACTIVE: {
|
|
|
|
ompi_request_t *request;
|
|
OPAL_THREAD_LOCK(&ompi_request_lock);
|
|
if (pml_request->req_pml_complete == false) {
|
|
/* free request after it completes */
|
|
pml_request->req_free_called = true;
|
|
} else {
|
|
/* can reuse the existing request */
|
|
OPAL_THREAD_UNLOCK(&ompi_request_lock);
|
|
break;
|
|
}
|
|
|
|
reuse_old_request = false;
|
|
/* allocate a new request */
|
|
switch(pml_request->req_type) {
|
|
case MCA_PML_REQUEST_SEND: {
|
|
mca_pml_base_send_mode_t sendmode =
|
|
((mca_pml_base_send_request_t*)pml_request)->req_send_mode;
|
|
rc = mca_pml_csum_isend_init(
|
|
pml_request->req_addr,
|
|
pml_request->req_count,
|
|
pml_request->req_datatype,
|
|
pml_request->req_peer,
|
|
pml_request->req_tag,
|
|
sendmode,
|
|
pml_request->req_comm,
|
|
&request);
|
|
break;
|
|
}
|
|
case MCA_PML_REQUEST_RECV:
|
|
rc = mca_pml_csum_irecv_init(
|
|
pml_request->req_addr,
|
|
pml_request->req_count,
|
|
pml_request->req_datatype,
|
|
pml_request->req_peer,
|
|
pml_request->req_tag,
|
|
pml_request->req_comm,
|
|
&request);
|
|
break;
|
|
default:
|
|
rc = OMPI_ERR_REQUEST;
|
|
break;
|
|
}
|
|
OPAL_THREAD_UNLOCK(&ompi_request_lock);
|
|
if(OMPI_SUCCESS != rc)
|
|
return rc;
|
|
pml_request = (mca_pml_base_request_t*)request;
|
|
requests[i] = request;
|
|
break;
|
|
}
|
|
default:
|
|
return OMPI_ERR_REQUEST;
|
|
}
|
|
|
|
/* start the request */
|
|
switch(pml_request->req_type) {
|
|
case MCA_PML_REQUEST_SEND:
|
|
{
|
|
mca_pml_csum_send_request_t* sendreq = (mca_pml_csum_send_request_t*)pml_request;
|
|
if( reuse_old_request && (sendreq->req_send.req_bytes_packed != 0) ) {
|
|
size_t offset = 0;
|
|
/**
|
|
* Reset the convertor in case we're dealing with the original
|
|
* request, which when completed do not reset the convertor.
|
|
*/
|
|
ompi_convertor_set_position( &sendreq->req_send.req_base.req_convertor,
|
|
&offset );
|
|
}
|
|
MCA_PML_CSUM_SEND_REQUEST_START(sendreq, rc);
|
|
if(rc != OMPI_SUCCESS)
|
|
return rc;
|
|
break;
|
|
}
|
|
case MCA_PML_REQUEST_RECV:
|
|
{
|
|
mca_pml_csum_recv_request_t* recvreq = (mca_pml_csum_recv_request_t*)pml_request;
|
|
MCA_PML_CSUM_RECV_REQUEST_START(recvreq);
|
|
break;
|
|
}
|
|
default:
|
|
return OMPI_ERR_REQUEST;
|
|
}
|
|
}
|
|
return OMPI_SUCCESS;
|
|
}
|
|
|