2007-07-25 22:28:04 +00:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2004-2007 The Trustees of the University of Tennessee.
|
|
|
|
* All rights reserved.
|
|
|
|
* $COPYRIGHT$
|
|
|
|
*
|
|
|
|
* Additional copyrights may follow
|
|
|
|
*
|
|
|
|
* $HEADER$
|
|
|
|
*/
|
|
|
|
|
2007-07-20 21:36:11 +00:00
|
|
|
#ifndef __VPROTOCOL_PESSIMIST_SENDERBASED_H__
|
|
|
|
#define __VPROTOCOL_PESSIMIST_SENDERBASED_H__
|
|
|
|
|
2008-03-27 21:05:44 +00:00
|
|
|
#include "ompi_config.h"
|
2007-08-16 05:52:30 +00:00
|
|
|
#include "ompi/mca/pml/base/pml_base_sendreq.h"
|
2008-06-09 20:38:44 +00:00
|
|
|
#include "ompi/mca/pml/v/pml_v_output.h"
|
2008-03-27 21:05:44 +00:00
|
|
|
#include "vprotocol_pessimist_sender_based_types.h"
|
|
|
|
#include "vprotocol_pessimist_request.h"
|
2007-08-16 05:52:30 +00:00
|
|
|
#include "vprotocol_pessimist.h"
|
|
|
|
|
2008-03-27 21:05:44 +00:00
|
|
|
BEGIN_C_DECLS
|
2007-07-20 21:36:11 +00:00
|
|
|
|
2008-03-27 21:05:44 +00:00
|
|
|
/** Prepare for using the sender based storage
|
|
|
|
*/
|
2007-07-20 21:36:11 +00:00
|
|
|
int vprotocol_pessimist_sender_based_init(const char *mmapfile, size_t size);
|
|
|
|
|
2008-03-27 21:05:44 +00:00
|
|
|
/** Cleanup mmap etc
|
|
|
|
*/
|
2007-07-20 21:36:11 +00:00
|
|
|
void vprotocol_pessimist_sender_based_finalize(void);
|
|
|
|
|
|
|
|
/** Manage mmap floating window, allocating enough memory for the message to be
|
|
|
|
* asynchronously copied to disk.
|
|
|
|
*/
|
|
|
|
void vprotocol_pessimist_sender_based_alloc(size_t len);
|
|
|
|
|
2007-09-19 03:42:56 +00:00
|
|
|
|
2007-09-21 03:24:08 +00:00
|
|
|
/*******************************************************************************
|
|
|
|
* Convertor pack (blocking) method (good latency, bad bandwidth)
|
|
|
|
*/
|
2007-09-19 03:42:56 +00:00
|
|
|
#if defined(SB_USE_PACK_METHOD)
|
2008-03-27 21:05:44 +00:00
|
|
|
static inline void __SENDER_BASED_METHOD_COPY(mca_pml_base_send_request_t *pmlreq)
|
|
|
|
{
|
|
|
|
if(0 != pmlreq->req_bytes_packed)
|
|
|
|
{
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_t conv;
|
2008-03-27 21:05:44 +00:00
|
|
|
size_t max_data;
|
|
|
|
size_t zero = 0;
|
|
|
|
unsigned int iov_count = 1;
|
|
|
|
struct iovec iov;
|
|
|
|
|
|
|
|
max_data = iov.iov_len = pmlreq->req_bytes_packed;
|
|
|
|
iov.iov_base = (IOVBASE_TYPE *) VPESSIMIST_SEND_FTREQ(pmlreq)->sb.cursor;
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_clone_with_position( &pmlreq->req_base.req_convertor,
|
2008-03-27 21:05:44 +00:00
|
|
|
&conv, 0, &zero );
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_pack(&conv, &iov, &iov_count, &max_data);
|
2008-03-27 21:05:44 +00:00
|
|
|
}
|
|
|
|
}
|
2007-07-20 21:36:11 +00:00
|
|
|
|
2007-09-19 03:42:56 +00:00
|
|
|
#define __SENDER_BASED_METHOD_FLUSH(REQ)
|
2007-08-16 05:52:30 +00:00
|
|
|
|
2007-09-21 03:24:08 +00:00
|
|
|
|
|
|
|
/*******************************************************************************
|
|
|
|
* Convertor replacement (non blocking) method (under testing)
|
|
|
|
*/
|
|
|
|
#elif defined(SB_USE_CONVERTOR_METHOD)
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
int32_t vprotocol_pessimist_sender_based_convertor_advance(opal_convertor_t*,
|
2007-09-21 03:24:08 +00:00
|
|
|
struct iovec*,
|
|
|
|
uint32_t*,
|
|
|
|
size_t*);
|
|
|
|
|
|
|
|
#define __SENDER_BASED_METHOD_COPY(REQ) do { \
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_t *pConv; \
|
2008-03-27 21:05:44 +00:00
|
|
|
mca_vprotocol_pessimist_send_request_t *ftreq; \
|
2007-09-21 03:24:08 +00:00
|
|
|
\
|
|
|
|
pConv = & (REQ)->req_base.req_convertor; \
|
2008-03-27 21:05:44 +00:00
|
|
|
ftreq = VPESSIMIST_SEND_FTREQ(REQ); \
|
|
|
|
ftreq->sb.conv_flags = pConv->flags; \
|
|
|
|
ftreq->sb.conv_advance = pConv->fAdvance; \
|
2007-09-21 03:24:08 +00:00
|
|
|
\
|
|
|
|
pConv->flags &= ~CONVERTOR_NO_OP; \
|
|
|
|
pConv->fAdvance = vprotocol_pessimist_sender_based_convertor_advance; \
|
|
|
|
} while(0)
|
|
|
|
|
|
|
|
#define __SENDER_BASED_METHOD_FLUSH(REQ)
|
|
|
|
|
|
|
|
#define VPESSIMIST_CONV_REQ(CONV) ((mca_vprotocol_pessimist_send_request_t *) \
|
|
|
|
(mca_vprotocol_pessimist.sender_based.sb_conv_to_pessimist_offset + \
|
2008-01-07 23:35:44 +00:00
|
|
|
(uintptr_t) ((CONV)->clone_of)))
|
2007-09-21 03:24:08 +00:00
|
|
|
|
|
|
|
|
|
|
|
/*******************************************************************************
|
2008-03-27 21:05:44 +00:00
|
|
|
* progress method
|
2007-09-21 03:24:08 +00:00
|
|
|
*/
|
2008-03-27 21:05:44 +00:00
|
|
|
#elif defined(SB_USE_PROGRESS_METHOD)
|
|
|
|
static inline void __SENDER_BASED_METHOD_COPY(mca_pml_base_send_request_t *req)
|
|
|
|
{
|
|
|
|
if(req->req_bytes_packed)
|
|
|
|
{
|
|
|
|
mca_vprotocol_pessimist_send_request_t *ftreq = VPESSIMIST_SEND_FTREQ(req);
|
|
|
|
ftreq->sb.bytes_progressed = 0;
|
|
|
|
opal_list_append(&mca_vprotocol_pessimist.sender_based.sb_sendreq,
|
|
|
|
&ftreq->list_item);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int vprotocol_pessimist_sb_progress_req(mca_pml_base_send_request_t *req)
|
|
|
|
{
|
|
|
|
mca_vprotocol_pessimist_request_t *ftreq = VPESSIMIST_SEND_FTREQ(req);
|
|
|
|
size_t max_data = 0;
|
|
|
|
|
|
|
|
if(ftreq->sb.bytes_progressed < req->req_bytes_packed)
|
|
|
|
{
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_t conv;
|
2008-03-27 21:05:44 +00:00
|
|
|
unsigned int iov_count = 1;
|
|
|
|
struct iovec iov;
|
|
|
|
uintptr_t position = ftreq->sb.bytes_progressed;
|
|
|
|
max_data = req->req_bytes_packed - ftreq->sb.bytes_progressed;
|
|
|
|
iov.iov_len = max_data;
|
|
|
|
iov.iov_base = (IOVBASE_TYPE *) (ftreq->sb.cursor + position);
|
|
|
|
|
|
|
|
V_OUTPUT_VERBOSE(80, "pessimist:\tsb\tprgress\t%"PRIpclock"\tsize %lu from position %lu", ftreq->reqid, max_data, position);
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_clone_with_position(&req->req_base.req_convertor,
|
2008-03-27 21:05:44 +00:00
|
|
|
&conv, 0, &position );
|
- Split the datatype engine into two parts: an MPI specific part in
OMPI
and a language agnostic part in OPAL. The convertor is completely
moved into OPAL. This offers several benefits as described in RFC
http://www.open-mpi.org/community/lists/devel/2009/07/6387.php
namely:
- Fewer basic types (int* and float* types, boolean and wchar
- Fixing naming scheme to ompi-nomenclature.
- Usability outside of the ompi-layer.
- Due to the fixed nature of simple opal types, their information is
completely
known at compile time and therefore constified
- With fewer datatypes (22), the actual sizes of bit-field types may be
reduced
from 64 to 32 bits, allowing reorganizing the opal_datatype
structure, eliminating holes and keeping data required in convertor
(upon send/recv) in one cacheline...
This has implications to the convertor-datastructure and other parts
of the code.
- Several performance tests have been run, the netpipe latency does not
change with
this patch on Linux/x86-64 on the smoky cluster.
- Extensive tests have been done to verify correctness (no new
regressions) using:
1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and
ompi-ddt:
a. running both trunk and ompi-ddt resulted in no differences
(except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run
correctly).
b. with --enable-memchecker and running under valgrind (one buglet
when run with static found in test-suite, commited)
2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt:
all passed (except for the dynamic/ tests failed!! as trunk/MTT)
3. compilation and usage of HDF5 tests on Jaguar using PGI and
PathScale compilers.
4. compilation and usage on Scicortex.
- Please note, that for the heterogeneous case, (-m32 compiled
binaries/ompi), neither
ompi-trunk, nor ompi-ddt branch would successfully launch.
This commit was SVN r21641.
2009-07-13 04:56:31 +00:00
|
|
|
opal_convertor_pack(&conv, &iov, &iov_count, &max_data);
|
2008-03-27 21:05:44 +00:00
|
|
|
ftreq->sb.bytes_progressed += max_data;
|
|
|
|
}
|
|
|
|
return max_data;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int vprotocol_pessimist_sb_progress_all_reqs(void)
|
|
|
|
{
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
/* progress any waiting Sender Based copy */
|
|
|
|
if(!opal_list_is_empty(&mca_vprotocol_pessimist.sender_based.sb_sendreq))
|
|
|
|
{
|
|
|
|
mca_vprotocol_pessimist_request_t *ftreq = (mca_vprotocol_pessimist_request_t *)
|
|
|
|
opal_list_remove_first(&mca_vprotocol_pessimist.sender_based.sb_sendreq);
|
|
|
|
if(vprotocol_pessimist_sb_progress_req(VPROTOCOL_SEND_REQ(ftreq)))
|
|
|
|
ret = 1;
|
|
|
|
opal_list_append(&mca_vprotocol_pessimist.sender_based.sb_sendreq,
|
|
|
|
&ftreq->list_item);
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __SENDER_BASED_METHOD_FLUSH(ompi_request_t *req)
|
|
|
|
{
|
|
|
|
mca_pml_base_send_request_t *pmlreq = (mca_pml_base_send_request_t *) req;
|
|
|
|
|
|
|
|
if((pmlreq->req_base.req_type == MCA_PML_REQUEST_SEND) &&
|
|
|
|
pmlreq->req_bytes_packed)
|
|
|
|
{
|
|
|
|
mca_vprotocol_pessimist_request_t *ftreq = VPESSIMIST_SEND_FTREQ(req);
|
|
|
|
assert(!opal_list_is_empty(&mca_vprotocol_pessimist.sender_based.sb_sendreq));
|
|
|
|
opal_list_remove_item(&mca_vprotocol_pessimist.sender_based.sb_sendreq,
|
|
|
|
(opal_list_item_t *) ftreq);
|
|
|
|
vprotocol_pessimist_sb_progress_req(pmlreq);
|
|
|
|
assert(pmlreq->req_bytes_packed == ftreq->sb.bytes_progressed);
|
|
|
|
}
|
|
|
|
}
|
2007-07-20 21:36:11 +00:00
|
|
|
|
2007-09-19 03:42:56 +00:00
|
|
|
#endif /* SB_USE_*_METHOD */
|
|
|
|
|
2008-03-27 21:05:44 +00:00
|
|
|
|
|
|
|
/** Copy data associated to a pml_base_send_request_t to the sender based
|
|
|
|
* message payload buffer
|
|
|
|
*/
|
|
|
|
static inline void vprotocol_pessimist_sender_based_copy_start(ompi_request_t *req)
|
|
|
|
{
|
|
|
|
vprotocol_pessimist_sender_based_header_t *sbhdr;
|
|
|
|
mca_vprotocol_pessimist_request_t *ftreq = VPESSIMIST_SEND_FTREQ(req);
|
|
|
|
mca_pml_base_send_request_t *pmlreq = (mca_pml_base_send_request_t *) req;
|
|
|
|
|
|
|
|
/* Allocate enough sender-based space to hold the message */
|
|
|
|
if(mca_vprotocol_pessimist.sender_based.sb_available <
|
|
|
|
pmlreq->req_bytes_packed +
|
|
|
|
sizeof(vprotocol_pessimist_sender_based_header_t))
|
|
|
|
{
|
|
|
|
vprotocol_pessimist_sender_based_alloc(pmlreq->req_bytes_packed);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Copy message header to the sender-based space */
|
|
|
|
/* /!\ This is NOT thread safe */
|
|
|
|
ftreq->sb.cursor = mca_vprotocol_pessimist.sender_based.sb_cursor;
|
2009-03-18 13:42:48 +00:00
|
|
|
#if 1
|
2008-03-27 21:05:44 +00:00
|
|
|
mca_vprotocol_pessimist.sender_based.sb_cursor +=
|
|
|
|
sizeof(vprotocol_pessimist_sender_based_header_t) +
|
|
|
|
pmlreq->req_bytes_packed;
|
|
|
|
mca_vprotocol_pessimist.sender_based.sb_available -=
|
|
|
|
sizeof(vprotocol_pessimist_sender_based_header_t) +
|
|
|
|
pmlreq->req_bytes_packed;
|
|
|
|
#endif
|
|
|
|
sbhdr = (vprotocol_pessimist_sender_based_header_t *) ftreq->sb.cursor;
|
|
|
|
sbhdr->size = pmlreq->req_bytes_packed;
|
|
|
|
sbhdr->dst = pmlreq->req_base.req_peer;
|
|
|
|
sbhdr->tag = pmlreq->req_base.req_tag;
|
|
|
|
sbhdr->contextid = pmlreq->req_base.req_comm->c_contextid;
|
|
|
|
sbhdr->sequence = pmlreq->req_base.req_sequence;
|
|
|
|
ftreq->sb.cursor += sizeof(vprotocol_pessimist_sender_based_header_t);
|
2008-04-17 12:25:05 +00:00
|
|
|
V_OUTPUT_VERBOSE(70, "pessimist:\tsb\tsend\t%"PRIpclock"\tsize %lu (+%lu header)", VPESSIMIST_FTREQ(req)->reqid, (long unsigned)pmlreq->req_bytes_packed, (long unsigned)sizeof(vprotocol_pessimist_sender_based_header_t));
|
2008-03-27 21:05:44 +00:00
|
|
|
|
|
|
|
/* Use one of the previous data copy method */
|
|
|
|
__SENDER_BASED_METHOD_COPY(pmlreq);
|
|
|
|
}
|
|
|
|
|
|
|
|
/** Ensure sender based is finished before allowing user to touch send buffer
|
|
|
|
*/
|
|
|
|
#define vprotocol_pessimist_sender_based_flush(REQ) __SENDER_BASED_METHOD_FLUSH(REQ)
|
|
|
|
|
2008-01-07 23:35:44 +00:00
|
|
|
END_C_DECLS
|
|
|
|
|
2007-07-20 21:36:11 +00:00
|
|
|
#endif
|
2008-03-30 19:05:56 +00:00
|
|
|
|