openmpi/ompi/mca/mtl/psm/mtl_psm_send.c

/*
 * Copyright (c) 2004-2006 The Trustees of Indiana University and Indiana
 *                         University Research and Technology
 *                         Corporation.  All rights reserved.
 * Copyright (c) 2004-2005 The University of Tennessee and The University
 *                         of Tennessee Research Foundation.  All rights
 *                         reserved.
 * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
 *                         University of Stuttgart.  All rights reserved.
 * Copyright (c) 2004-2006 The Regents of the University of California.
 *                         All rights reserved.
 * Copyright (c) 2006      QLogic Corporation. All rights reserved.
 * $COPYRIGHT$
 *
 * Additional copyrights may follow
 *
 * $HEADER$
 */

#include "ompi_config.h"
#include "ompi/mca/pml/pml.h"
#include "ompi/communicator/communicator.h"
#include "opal/datatype/opal_convertor.h"

#include "mtl_psm.h"
#include "mtl_psm_types.h"
#include "mtl_psm_request.h"
#include "ompi/mca/mtl/base/mtl_base_datatype.h"

/**
 * Blocking send of one message to a peer through the PSM matched queue.
 *
 * The data described by the convertor is packed with
 * ompi_mtl_datatype_pack(), handed to psm_mq_send(), and any temporary
 * pack buffer is released before the function returns.
 *
 * @param mtl        MTL module; asserted to be the PSM module instance.
 * @param comm       Communicator whose context id and local rank are
 *                   folded into the match tag.
 * @param dest       Rank of the destination process within comm.
 * @param tag        Message tag folded into the match tag.
 * @param convertor  Convertor describing the data to send.
 * @param mode       Send mode; MCA_PML_BASE_SEND_SYNCHRONOUS adds
 *                   PSM_MQ_FLAG_SENDSYNC to the PSM flags.
 *
 * @return OMPI_SUCCESS when psm_mq_send() reports PSM_OK; the error code
 *         of ompi_mtl_datatype_pack() when packing fails; OMPI_ERROR when
 *         the packed payload does not fit in a 32-bit length or when
 *         psm_mq_send() fails.
 */
int
ompi_mtl_psm_send(struct mca_mtl_base_module_t* mtl,
                 struct ompi_communicator_t* comm,
                 int dest,
                 int tag,
                 struct opal_convertor_t *convertor,
                 mca_pml_base_send_mode_t mode)
{
    psm_error_t err;
    mca_mtl_psm_request_t mtl_psm_request;
    uint64_t mqtag;
    uint32_t flags = 0;
    int ret;
    size_t length;
    ompi_proc_t* ompi_proc = ompi_comm_peer_lookup( comm, dest );
    mca_mtl_psm_endpoint_t* psm_endpoint = (mca_mtl_psm_endpoint_t*) ompi_proc->proc_endpoints[OMPI_PROC_ENDPOINT_TAG_MTL];

    assert(mtl == &ompi_mtl_psm.super);

    mqtag = PSM_MAKE_MQTAG(comm->c_contextid, comm->c_my_rank, tag);

    /* The request is a stack local used only to receive the packed buffer
     * pointer and its ownership flag; it is never handed to PSM. */
    ret = ompi_mtl_datatype_pack(convertor,
                                 &mtl_psm_request.buf,
                                 &length,
                                 &mtl_psm_request.free_after);

    /* Check the result before consuming any of the out-parameters. */
    if (OMPI_SUCCESS != ret) {
        return ret;
    }

    /* psm_mq_send() takes a 32-bit length: refuse larger payloads instead
     * of letting the conversion silently truncate the message. */
    if ((uint64_t) length > UINT32_MAX) {
        if (mtl_psm_request.free_after) {
            free(mtl_psm_request.buf);
        }
        return OMPI_ERROR;
    }

    if (MCA_PML_BASE_SEND_SYNCHRONOUS == mode) {
        flags |= PSM_MQ_FLAG_SENDSYNC;
    }

    err = psm_mq_send(ompi_mtl_psm.mq,
                      psm_endpoint->peer_addr,
                      flags,
                      mqtag,
                      mtl_psm_request.buf,
                      (uint32_t) length);

    /* The call is blocking, so a temporary pack buffer can go right away. */
    if (mtl_psm_request.free_after) {
        free(mtl_psm_request.buf);
    }

    return PSM_OK == err ? OMPI_SUCCESS : OMPI_ERROR;
}

/**
 * Non-blocking send of one message to a peer through the PSM matched queue.
 *
 * The data described by the convertor is packed with
 * ompi_mtl_datatype_pack(); the resulting buffer, its length and its
 * ownership flag are recorded in the request, which is then posted with
 * psm_mq_isend() using the request itself as the PSM context pointer.
 *
 * @param mtl          MTL module; asserted to be the PSM module instance.
 * @param comm         Communicator whose context id and local rank are
 *                     folded into the match tag.
 * @param dest         Rank of the destination process within comm.
 * @param tag          Message tag folded into the match tag.
 * @param convertor    Convertor describing the data to send.
 * @param mode         Send mode; MCA_PML_BASE_SEND_SYNCHRONOUS adds
 *                     PSM_MQ_FLAG_SENDSYNC to the PSM flags.
 * @param blocking     Not consulted by this implementation.
 * @param mtl_request  Caller-provided request, used as a
 *                     mca_mtl_psm_request_t.
 *
 * @return OMPI_SUCCESS when psm_mq_isend() reports PSM_OK; the error code
 *         of ompi_mtl_datatype_pack() when packing fails; OMPI_ERROR when
 *         the packed payload does not fit in a 32-bit length or when
 *         psm_mq_isend() fails.
 */
int
ompi_mtl_psm_isend(struct mca_mtl_base_module_t* mtl,
                  struct ompi_communicator_t* comm,
                  int dest,
                  int tag,
                  struct opal_convertor_t *convertor,
                  mca_pml_base_send_mode_t mode,
                  bool blocking,
                  mca_mtl_request_t * mtl_request)
{
    psm_error_t psm_error;
    uint64_t mqtag;
    uint32_t flags = 0;
    int ret;
    mca_mtl_psm_request_t * mtl_psm_request = (mca_mtl_psm_request_t*) mtl_request;
    size_t length;
    ompi_proc_t* ompi_proc = ompi_comm_peer_lookup( comm, dest );
    mca_mtl_psm_endpoint_t* psm_endpoint = (mca_mtl_psm_endpoint_t*)ompi_proc->proc_endpoints[OMPI_PROC_ENDPOINT_TAG_MTL];

    assert(mtl == &ompi_mtl_psm.super);

    mqtag = PSM_MAKE_MQTAG(comm->c_contextid, comm->c_my_rank, tag);

    /* These two fields do not depend on the pack result, so they are
     * recorded up front and are set even when packing fails. */
    mtl_psm_request->convertor = convertor;
    mtl_psm_request->type = OMPI_MTL_PSM_ISEND;

    ret = ompi_mtl_datatype_pack(convertor,
                                 &mtl_psm_request->buf,
                                 &length,
                                 &mtl_psm_request->free_after);

    /* Check the result before consuming any of the out-parameters. */
    if (OMPI_SUCCESS != ret) {
        return ret;
    }

    mtl_psm_request->length = length;

    /* psm_mq_isend() takes a 32-bit length: refuse larger payloads instead
     * of letting the conversion silently truncate the message. */
    if ((uint64_t) length > UINT32_MAX) {
        psm_error = PSM_OK;
        ret = OMPI_ERROR;
    } else {
        if (MCA_PML_BASE_SEND_SYNCHRONOUS == mode) {
            flags |= PSM_MQ_FLAG_SENDSYNC;
        }

        psm_error = psm_mq_isend(ompi_mtl_psm.mq,
                                 psm_endpoint->peer_addr,
                                 flags,
                                 mqtag,
                                 mtl_psm_request->buf,
                                 (uint32_t) length,
                                 mtl_psm_request,
                                 &mtl_psm_request->psm_request);
        ret = (PSM_OK == psm_error) ? OMPI_SUCCESS : OMPI_ERROR;
    }

    /* The send was not posted, so release a temporary pack buffer here and
     * clear the ownership fields so nobody frees it a second time.
     * NOTE(review): assumes completion handling is the only other place
     * that frees buf for a posted request -- confirm against the progress
     * code. */
    if (OMPI_SUCCESS != ret && mtl_psm_request->free_after) {
        free(mtl_psm_request->buf);
        mtl_psm_request->buf = NULL;
        mtl_psm_request->free_after = false;
    }

    return ret;
}
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00			`/*`
			`* Copyright (c) 2004-2006 The Trustees of Indiana University and Indiana`
			`* University Research and Technology`
			`* Corporation. All rights reserved.`
			`* Copyright (c) 2004-2005 The University of Tennessee and The University`
			`* of Tennessee Research Foundation. All rights`
			`* reserved.`
			`* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,`
			`* University of Stuttgart. All rights reserved.`
			`* Copyright (c) 2004-2006 The Regents of the University of California.`
			`* All rights reserved.`
			`* Copyright (c) 2006 QLogic Corporation. All rights reserved.`
			`* $COPYRIGHT$`
			`*`
			`* Additional copyrights may follow`
			`*`
			`* $HEADER$`
			`*/`

			`#include "ompi_config.h"`
- Last of intrusive commits (promised)... err for now. Anyway, this is blocking the move: do not include pml.h if not really needed, aka none of the following used: mca_pml MCA_PML_CALL OMPI_ANY_TAG OMPI_ANY_SOURCE OMPI_PROC_NULL - Notable exceptions (deleting in one header->adding): - ompi/mca/mtl/psm/ - ompi/mca/osc/rdma/ - ompi/mca/btl/openib/btl_openib_endpoint.c depended on pml_base_sendreq.h - Tested on Linux/x86-64, this time including make check (thanks Jeff and Ralph) This commit was SVN r20725. 2009-03-04 20:06:51 +03:00			`#include "ompi/mca/pml/pml.h"`
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00			`#include "ompi/communicator/communicator.h"`
- Split the datatype engine into two parts: an MPI specific part in OMPI and a language agnostic part in OPAL. The convertor is completely moved into OPAL. This offers several benefits as described in RFC http://www.open-mpi.org/community/lists/devel/2009/07/6387.php namely: - Fewer basic types (int* and float* types, boolean and wchar - Fixing naming scheme to ompi-nomenclature. - Usability outside of the ompi-layer. - Due to the fixed nature of simple opal types, their information is completely known at compile time and therefore constified - With fewer datatypes (22), the actual sizes of bit-field types may be reduced from 64 to 32 bits, allowing reorganizing the opal_datatype structure, eliminating holes and keeping data required in convertor (upon send/recv) in one cacheline... This has implications to the convertor-datastructure and other parts of the code. - Several performance tests have been run, the netpipe latency does not change with this patch on Linux/x86-64 on the smoky cluster. - Extensive tests have been done to verify correctness (no new regressions) using: 1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and ompi-ddt: a. running both trunk and ompi-ddt resulted in no differences (except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run correctly). b. with --enable-memchecker and running under valgrind (one buglet when run with static found in test-suite, commited) 2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt: all passed (except for the dynamic/ tests failed!! as trunk/MTT) 3. compilation and usage of HDF5 tests on Jaguar using PGI and PathScale compilers. 4. compilation and usage on Scicortex. - Please note, that for the heterogeneous case, (-m32 compiled binaries/ompi), neither ompi-trunk, nor ompi-ddt branch would successfully launch. This commit was SVN r21641. 2009-07-13 08:56:31 +04:00			`#include "opal/datatype/opal_convertor.h"`
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00
			`#include "mtl_psm.h"`
			`#include "mtl_psm_types.h"`
			`#include "mtl_psm_request.h"`
			`#include "ompi/mca/mtl/base/mtl_base_datatype.h"`

			`int`
			`ompi_mtl_psm_send(struct mca_mtl_base_module_t* mtl,`
			`struct ompi_communicator_t* comm,`
			`int dest,`
			`int tag,`
- Split the datatype engine into two parts: an MPI specific part in OMPI and a language agnostic part in OPAL. The convertor is completely moved into OPAL. This offers several benefits as described in RFC http://www.open-mpi.org/community/lists/devel/2009/07/6387.php namely: - Fewer basic types (int* and float* types, boolean and wchar - Fixing naming scheme to ompi-nomenclature. - Usability outside of the ompi-layer. - Due to the fixed nature of simple opal types, their information is completely known at compile time and therefore constified - With fewer datatypes (22), the actual sizes of bit-field types may be reduced from 64 to 32 bits, allowing reorganizing the opal_datatype structure, eliminating holes and keeping data required in convertor (upon send/recv) in one cacheline... This has implications to the convertor-datastructure and other parts of the code. - Several performance tests have been run, the netpipe latency does not change with this patch on Linux/x86-64 on the smoky cluster. - Extensive tests have been done to verify correctness (no new regressions) using: 1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and ompi-ddt: a. running both trunk and ompi-ddt resulted in no differences (except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run correctly). b. with --enable-memchecker and running under valgrind (one buglet when run with static found in test-suite, commited) 2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt: all passed (except for the dynamic/ tests failed!! as trunk/MTT) 3. compilation and usage of HDF5 tests on Jaguar using PGI and PathScale compilers. 4. compilation and usage on Scicortex. - Please note, that for the heterogeneous case, (-m32 compiled binaries/ompi), neither ompi-trunk, nor ompi-ddt branch would successfully launch. This commit was SVN r21641. 2009-07-13 08:56:31 +04:00			`struct opal_convertor_t *convertor,`
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00			`mca_pml_base_send_mode_t mode)`
			`{`
			`psm_error_t err;`
			`mca_mtl_psm_request_t mtl_psm_request;`
			`uint64_t mqtag;`
			`uint32_t flags = 0;`
			`int ret;`
			`size_t length;`
A long time waiting patch. Get rid of the comm->c_pml_procs. It was (and that was long ago) supposed to be used as a cache for accessing the PML procs. But in all of the PMLs the PML proc contain only one field i.e. a pointer to the ompi_proc. This pointer can be accessed using the c_remote_group easily. Therefore, there is no meaning of keeping the PML procs around. Slim fast commit ... This commit was SVN r11730. 2006-09-21 02:14:46 +04:00			`ompi_proc_t* ompi_proc = ompi_comm_peer_lookup( comm, dest );`
Remove the proc_pml and proc_bml fields from ompi_proc_t and replace with a configure-time dynamic allocation of flags. The net result for platforms which only support BTL-based communication is a reduction of 8*nprocs bytes per process. Platforms which support both MTLs and BTLs will not see a space reduction, but will now be able to safely run both the MTL and BTL side-by-side, which will prove useful. This commit was SVN r29100. 2013-08-30 20:54:55 +04:00			`mca_mtl_psm_endpoint_t* psm_endpoint = (mca_mtl_psm_endpoint_t*) ompi_proc->proc_endpoints[OMPI_PROC_ENDPOINT_TAG_MTL];`
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00
			`assert(mtl == &ompi_mtl_psm.super);`

			`mqtag = PSM_MAKE_MQTAG(comm->c_contextid, comm->c_my_rank, tag);`

			`ret = ompi_mtl_datatype_pack(convertor,`
			`&mtl_psm_request.buf,`
			`&length,`
			`&mtl_psm_request.free_after);`


			`mtl_psm_request.length = length;`
			`mtl_psm_request.convertor = convertor;`
			`mtl_psm_request.type = OMPI_MTL_PSM_ISEND;`

			`if (OMPI_SUCCESS != ret) return ret;`

			`if (mode == MCA_PML_BASE_SEND_SYNCHRONOUS)`
			`flags \|= PSM_MQ_FLAG_SENDSYNC;`

			`err = psm_mq_send(ompi_mtl_psm.mq,`
			`psm_endpoint->peer_addr,`
			`flags,`
			`mqtag,`
			`mtl_psm_request.buf,`
			`length);`

Convert a few opal_output() calls to instead use orte_show_help() as well as do some minor cosmetic changes dealing with tab spacing and c-blocks being enclosed with \{\}. There was also a long standing bug with the PSM mtl if the number of hardware contexts on adapter were less than the number of cores on a node (The default case is they are the same hence no issues were reported). For completeness we take care of this case as well but it requires us to tell PSM how many local processes are running on a node and the local rank of the process on a node so it can allocate the available hardware contexts appropriately. This commit was SVN r21745. 2009-07-30 06:55:20 +04:00			`if (mtl_psm_request.free_after) {`
Fixes to psm mtl following a more comprehensive testing of intel tests. This commit was SVN r13471. 2007-02-03 00:55:04 +03:00			`free(mtl_psm_request.buf);`
Convert a few opal_output() calls to instead use orte_show_help() as well as do some minor cosmetic changes dealing with tab spacing and c-blocks being enclosed with \{\}. There was also a long standing bug with the PSM mtl if the number of hardware contexts on adapter were less than the number of cores on a node (The default case is they are the same hence no issues were reported). For completeness we take care of this case as well but it requires us to tell PSM how many local processes are running on a node and the local rank of the process on a node so it can allocate the available hardware contexts appropriately. This commit was SVN r21745. 2009-07-30 06:55:20 +04:00			`}`
Fixes to psm mtl following a more comprehensive testing of intel tests. This commit was SVN r13471. 2007-02-03 00:55:04 +03:00
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00			`return err == PSM_OK ? OMPI_SUCCESS : OMPI_ERROR;`
			`}`

			`int`
			`ompi_mtl_psm_isend(struct mca_mtl_base_module_t* mtl,`
			`struct ompi_communicator_t* comm,`
			`int dest,`
			`int tag,`
- Split the datatype engine into two parts: an MPI specific part in OMPI and a language agnostic part in OPAL. The convertor is completely moved into OPAL. This offers several benefits as described in RFC http://www.open-mpi.org/community/lists/devel/2009/07/6387.php namely: - Fewer basic types (int* and float* types, boolean and wchar - Fixing naming scheme to ompi-nomenclature. - Usability outside of the ompi-layer. - Due to the fixed nature of simple opal types, their information is completely known at compile time and therefore constified - With fewer datatypes (22), the actual sizes of bit-field types may be reduced from 64 to 32 bits, allowing reorganizing the opal_datatype structure, eliminating holes and keeping data required in convertor (upon send/recv) in one cacheline... This has implications to the convertor-datastructure and other parts of the code. - Several performance tests have been run, the netpipe latency does not change with this patch on Linux/x86-64 on the smoky cluster. - Extensive tests have been done to verify correctness (no new regressions) using: 1. mpi_test_suite on linux/x86-64 using clean ompi-trunk and ompi-ddt: a. running both trunk and ompi-ddt resulted in no differences (except for MPI_SHORT_INT and MPI_TYPE_MIX_LB_UB do now run correctly). b. with --enable-memchecker and running under valgrind (one buglet when run with static found in test-suite, commited) 2. ibm testsuite on linux/x86-64 using clean ompi-trunk and ompi-ddt: all passed (except for the dynamic/ tests failed!! as trunk/MTT) 3. compilation and usage of HDF5 tests on Jaguar using PGI and PathScale compilers. 4. compilation and usage on Scicortex. - Please note, that for the heterogeneous case, (-m32 compiled binaries/ompi), neither ompi-trunk, nor ompi-ddt branch would successfully launch. This commit was SVN r21641. 2009-07-13 08:56:31 +04:00			`struct opal_convertor_t *convertor,`
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00			`mca_pml_base_send_mode_t mode,`
			`bool blocking,`
			`mca_mtl_request_t * mtl_request)`
			`{`
			`psm_error_t psm_error;`
			`uint64_t mqtag;`
			`uint32_t flags = 0;`
			`int ret;`
			`mca_mtl_psm_request_t * mtl_psm_request = (mca_mtl_psm_request_t*) mtl_request;`
			`size_t length;`
Correct a type that breaks the PSM build. This commit was SVN r12069. 2006-10-10 03:14:22 +04:00			`ompi_proc_t* ompi_proc = ompi_comm_peer_lookup( comm, dest );`
Remove the proc_pml and proc_bml fields from ompi_proc_t and replace with a configure-time dynamic allocation of flags. The net result for platforms which only support BTL-based communication is a reduction of 8*nprocs bytes per process. Platforms which support both MTLs and BTLs will not see a space reduction, but will now be able to safely run both the MTL and BTL side-by-side, which will prove useful. This commit was SVN r29100. 2013-08-30 20:54:55 +04:00			`mca_mtl_psm_endpoint_t* psm_endpoint = (mca_mtl_psm_endpoint_t*)ompi_proc->proc_endpoints[OMPI_PROC_ENDPOINT_TAG_MTL];`
Initial commit of QLogic PSM MTL. This provides support for the Infinipath interconnect using the PSM API. Of note: This version has a "hackaround" we always return 1 or greater from the MTL PSM progress function, this should be examined further. This commit was SVN r11655. 2006-09-14 20:44:02 +04:00
			`assert(mtl == &ompi_mtl_psm.super);`

			`mqtag = PSM_MAKE_MQTAG(comm->c_contextid, comm->c_my_rank, tag);`


			`ret = ompi_mtl_datatype_pack(convertor,`
			`&mtl_psm_request->buf,`
			`&length,`
			`&mtl_psm_request->free_after);`

			`mtl_psm_request->length= length;`
			`mtl_psm_request->convertor = convertor;`
			`mtl_psm_request->type = OMPI_MTL_PSM_ISEND;`

			`if (OMPI_SUCCESS != ret) return ret;`

			`if (mode == MCA_PML_BASE_SEND_SYNCHRONOUS)`
			`flags \|= PSM_MQ_FLAG_SENDSYNC;`

			`psm_error = psm_mq_isend(ompi_mtl_psm.mq,`
			`psm_endpoint->peer_addr,`
			`flags,`
			`mqtag,`
			`mtl_psm_request->buf,`
			`length,`
			`mtl_psm_request,`
			`&mtl_psm_request->psm_request);`

			`return psm_error == PSM_OK ? OMPI_SUCCESS : OMPI_ERROR;`
			`}`