2004-01-15 06:08:25 +00:00
|
|
|
/*
|
|
|
|
* $HEADER$
|
|
|
|
*/
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
#include "ompi_config.h"
|
2004-01-15 06:08:25 +00:00
|
|
|
|
2004-03-18 21:35:28 +00:00
|
|
|
#include "include/constants.h"
|
2004-08-14 01:56:05 +00:00
|
|
|
#include "mpi/runtime/mpiruntime.h"
|
|
|
|
#include "mpi/runtime/params.h"
|
2004-03-17 18:45:16 +00:00
|
|
|
#include "runtime/runtime.h"
|
2004-06-17 17:29:47 +00:00
|
|
|
#include "util/sys_info.h"
|
2004-07-01 14:49:54 +00:00
|
|
|
#include "util/proc_info.h"
|
2004-09-10 03:21:03 +00:00
|
|
|
#include "util/session_dir.h"
|
2004-01-15 06:08:25 +00:00
|
|
|
#include "mpi.h"
|
2004-03-17 18:45:16 +00:00
|
|
|
#include "communicator/communicator.h"
|
|
|
|
#include "group/group.h"
|
2004-08-12 16:56:24 +00:00
|
|
|
#include "info/info.h"
|
2004-09-05 16:05:37 +00:00
|
|
|
#include "util/show_help.h"
|
2004-07-27 00:49:41 +00:00
|
|
|
#include "errhandler/errcode.h"
|
|
|
|
#include "errhandler/errclass.h"
|
2004-10-08 17:12:36 +00:00
|
|
|
#include "request/request.h"
|
2004-04-20 22:38:22 +00:00
|
|
|
#include "op/op.h"
|
2004-08-14 01:56:05 +00:00
|
|
|
#include "file/file.h"
|
2004-11-05 07:52:30 +00:00
|
|
|
#include "attribute/attribute.h"
|
2004-08-14 01:56:05 +00:00
|
|
|
|
2004-03-17 18:45:16 +00:00
|
|
|
#include "mca/base/base.h"
|
|
|
|
#include "mca/base/base.h"
|
2004-06-17 16:23:34 +00:00
|
|
|
#include "mca/allocator/base/base.h"
|
|
|
|
#include "mca/allocator/allocator.h"
|
|
|
|
#include "mca/mpool/base/base.h"
|
|
|
|
#include "mca/mpool/mpool.h"
|
2004-03-17 18:45:16 +00:00
|
|
|
#include "mca/ptl/ptl.h"
|
|
|
|
#include "mca/ptl/base/base.h"
|
|
|
|
#include "mca/pml/pml.h"
|
|
|
|
#include "mca/pml/base/base.h"
|
|
|
|
#include "mca/coll/coll.h"
|
|
|
|
#include "mca/coll/base/base.h"
|
2004-07-20 22:21:47 +00:00
|
|
|
#include "mca/topo/topo.h"
|
|
|
|
#include "mca/topo/base/base.h"
|
2004-08-14 01:56:05 +00:00
|
|
|
#include "mca/io/io.h"
|
|
|
|
#include "mca/io/base/base.h"
|
Not as bad as this all may look. Tim and I made a significant change to the way we handle the startup of the oob, the seed, etc. We have made it backwards-compatible so that mpirun2 and singleton operations remain working. We had to adjust the name server and gpr as well, plus the process_info structure.
This also includes a checkpoint update to openmpi.c and ompid.c. I have re-enabled the ompid compile.
This latter raises an important point. The trunk compiles the programs like ompid just fine under Linux. It also does just fine for OSX under the dynamic libraries. However, we are seeing errors when compiling under OSX for the static case - the linker seems to have trouble resolving some variable names, even though linker diagnostics show the variables as being defined. Thus, a warning to Mac users that you may have to locally turn things off if you are trying to do static compiles. We ask, however, that you don't commit those changes that turn things off for everyone else - instead, let's try to figure out why the static compile is having a problem, and let everyone else continue to work.
Thanks
Ralph
This commit was SVN r2534.
2004-09-08 03:59:06 +00:00
|
|
|
#include "mca/oob/base/base.h"
|
|
|
|
#include "mca/ns/base/base.h"
|
2004-09-23 14:35:02 +00:00
|
|
|
#include "mca/gpr/base/base.h"
|
Not as bad as this all may look. Tim and I made a significant change to the way we handle the startup of the oob, the seed, etc. We have made it backwards-compatible so that mpirun2 and singleton operations remain working. We had to adjust the name server and gpr as well, plus the process_info structure.
This also includes a checkpoint update to openmpi.c and ompid.c. I have re-enabled the ompid compile.
This latter raises an important point. The trunk compiles the programs like ompid just fine under Linux. It also does just fine for OSX under the dynamic libraries. However, we are seeing errors when compiling under OSX for the static case - the linker seems to have trouble resolving some variable names, even though linker diagnostics show the variables as being defined. Thus, a warning to Mac users that you may have to locally turn things off if you are trying to do static compiles. We ask, however, that you don't commit those changes that turn things off for everyone else - instead, let's try to figure out why the static compile is having a problem, and let everyone else continue to work.
Thanks
Ralph
This commit was SVN r2534.
2004-09-08 03:59:06 +00:00
|
|
|
|
|
|
|
#include "runtime/runtime.h"
|
2004-10-28 19:12:45 +00:00
|
|
|
#include "event/event.h"
|
2004-01-15 06:08:25 +00:00
|
|
|
|
2004-02-05 01:52:56 +00:00
|
|
|
/*
|
|
|
|
* Global variables and symbols for the MPI layer
|
|
|
|
*/
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
bool ompi_mpi_initialized = false;
|
|
|
|
bool ompi_mpi_finalized = false;
|
2004-08-12 16:56:24 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
bool ompi_mpi_thread_multiple = false;
|
|
|
|
int ompi_mpi_thread_requested = MPI_THREAD_SINGLE;
|
|
|
|
int ompi_mpi_thread_provided = MPI_THREAD_SINGLE;
|
2004-02-05 01:52:56 +00:00
|
|
|
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
int ompi_mpi_init(int argc, char **argv, int requested, int *provided)
|
2004-01-15 06:08:25 +00:00
|
|
|
{
|
2004-08-14 01:56:05 +00:00
|
|
|
int ret, param;
|
2004-02-13 13:56:55 +00:00
|
|
|
bool allow_multi_user_threads;
|
|
|
|
bool have_hidden_threads;
|
2004-06-07 15:33:53 +00:00
|
|
|
ompi_proc_t** procs;
|
2004-03-03 16:44:41 +00:00
|
|
|
size_t nprocs;
|
2004-10-06 23:40:30 +00:00
|
|
|
char *error = NULL;
|
2004-10-01 22:22:21 +00:00
|
|
|
char *contact_info;
|
2004-01-15 06:08:25 +00:00
|
|
|
|
2004-09-10 03:21:03 +00:00
|
|
|
/* Become an OMPI process */
|
2004-01-29 19:40:22 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = ompi_init(argc, argv))) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "ompi_init() failed";
|
|
|
|
goto error;
|
2004-02-13 13:56:55 +00:00
|
|
|
}
|
2004-01-15 06:08:25 +00:00
|
|
|
|
2004-02-13 13:56:55 +00:00
|
|
|
/* Open up the MCA */
|
2004-01-30 03:59:39 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = mca_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_base_open() failed";
|
|
|
|
goto error;
|
2004-02-13 22:33:30 +00:00
|
|
|
}
|
2004-01-30 03:59:39 +00:00
|
|
|
|
2004-02-13 13:56:55 +00:00
|
|
|
/* Join the run-time environment */
|
2004-08-29 09:05:14 +00:00
|
|
|
allow_multi_user_threads = true;
|
|
|
|
have_hidden_threads = false;
|
2004-10-01 22:22:21 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = ompi_rte_init(NULL, &allow_multi_user_threads,
|
|
|
|
&have_hidden_threads))) {
|
2004-09-10 03:21:03 +00:00
|
|
|
goto error;
|
Not as bad as this all may look. Tim and I made a significant change to the way we handle the startup of the oob, the seed, etc. We have made it backwards-compatible so that mpirun2 and singleton operations remain working. We had to adjust the name server and gpr as well, plus the process_info structure.
This also includes a checkpoint update to openmpi.c and ompid.c. I have re-enabled the ompid compile.
This latter raises an important point. The trunk compiles the programs like ompid just fine under Linux. It also does just fine for OSX under the dynamic libraries. However, we are seeing errors when compiling under OSX for the static case - the linker seems to have trouble resolving some variable names, even though linker diagnostics show the variables as being defined. Thus, a warning to Mac users that you may have to locally turn things off if you are trying to do static compiles. We ask, however, that you don't commit those changes that turn things off for everyone else - instead, let's try to figure out why the static compile is having a problem, and let everyone else continue to work.
Thanks
Ralph
This commit was SVN r2534.
2004-09-08 03:59:06 +00:00
|
|
|
}
|
|
|
|
|
2004-09-16 08:38:24 +00:00
|
|
|
/*
|
|
|
|
* Register my process info with my replica. Note that this must be done
|
|
|
|
* after the rte init is completed.
|
|
|
|
*/
|
2004-09-23 14:35:02 +00:00
|
|
|
contact_info = mca_oob_get_contact_info();
|
|
|
|
ompi_rte_get_peers(NULL, &nprocs);
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_registry.rte_register(contact_info, nprocs,
|
|
|
|
ompi_rte_all_procs_registered, NULL,
|
|
|
|
ompi_rte_all_procs_unregistered, NULL))) {
|
2004-09-16 08:38:24 +00:00
|
|
|
error = "ompi_rte_init: failed in ompi_rte_register()\n";
|
|
|
|
goto error;
|
|
|
|
}
|
2004-09-14 14:21:04 +00:00
|
|
|
|
2004-09-23 14:35:02 +00:00
|
|
|
/* wait for all procs to have registered so we can be sure to get everyone's contact info */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_rte_monitor_procs_registered())) {
|
|
|
|
error = "ompi_rte_init: failed to see all procs register\n";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-08-14 01:56:05 +00:00
|
|
|
/* Once we've joined the RTE, see if any MCA parameters were
|
|
|
|
passed to the MPI level */
|
|
|
|
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_mpi_register_params())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_mpi_register_params() failed";
|
|
|
|
goto error;
|
2004-08-14 01:56:05 +00:00
|
|
|
}
|
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
/* initialize ompi procs */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_proc_init())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_proc_init() failed";
|
|
|
|
goto error;
|
2004-03-03 16:44:41 +00:00
|
|
|
}
|
|
|
|
|
2004-08-14 01:56:05 +00:00
|
|
|
/* Open up relevant MCA modules. */
|
|
|
|
|
2004-06-17 16:23:34 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = mca_allocator_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_allocator_base_open() failed";
|
|
|
|
goto error;
|
2004-06-17 16:23:34 +00:00
|
|
|
}
|
|
|
|
if (OMPI_SUCCESS != (ret = mca_mpool_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_mpool_base_open() failed";
|
|
|
|
goto error;
|
2004-06-17 16:23:34 +00:00
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = mca_pml_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_pml_base_open() failed";
|
|
|
|
goto error;
|
2004-02-13 13:56:55 +00:00
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = mca_ptl_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_ptl_base_open() failed";
|
|
|
|
goto error;
|
2004-02-13 13:56:55 +00:00
|
|
|
}
|
2004-06-07 15:33:53 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = mca_coll_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_coll_base_open() failed";
|
|
|
|
goto error;
|
2004-02-13 13:56:55 +00:00
|
|
|
}
|
2004-07-20 22:21:47 +00:00
|
|
|
if (OMPI_SUCCESS != (ret = mca_topo_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_topo_base_open() failed";
|
|
|
|
goto error;
|
2004-08-14 01:56:05 +00:00
|
|
|
}
|
|
|
|
if (OMPI_SUCCESS != (ret = mca_io_base_open())) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_io_base_open() failed";
|
|
|
|
goto error;
|
2004-07-20 22:21:47 +00:00
|
|
|
}
|
2004-01-30 03:59:39 +00:00
|
|
|
|
2004-10-14 20:50:06 +00:00
|
|
|
/* initialize module exchange */
|
|
|
|
if (OMPI_SUCCESS != (ret = mca_base_modex_init())) {
|
|
|
|
error = "mca_base_modex_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-02-13 13:56:55 +00:00
|
|
|
/* Select which pml, ptl, and coll modules to use, and determine the
|
2004-09-10 03:21:03 +00:00
|
|
|
final thread level */
|
2004-01-30 03:59:39 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
if (OMPI_SUCCESS !=
|
2004-09-10 03:21:03 +00:00
|
|
|
(ret = mca_base_init_select_components(requested,
|
|
|
|
allow_multi_user_threads,
|
|
|
|
have_hidden_threads,
|
|
|
|
provided))) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "mca_base_init_select_components() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-10-08 17:12:36 +00:00
|
|
|
/* initialize requests */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_request_init())) {
|
|
|
|
error = "ompi_request_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
/* initialize info */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_info_init())) {
|
|
|
|
error = "ompi_info_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
2004-10-08 17:12:36 +00:00
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
/* initialize error handlers */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_errhandler_init())) {
|
|
|
|
error = "ompi_errhandler_init() failed";
|
|
|
|
goto error;
|
2004-02-13 13:56:55 +00:00
|
|
|
}
|
2004-01-30 03:59:39 +00:00
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
/* initialize error codes */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_mpi_errcode_init())) {
|
|
|
|
error = "ompi_mpi_errcode_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* initialize error classes */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_errclass_init())) {
|
|
|
|
error = "ompi_errclass_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* initialize internal error codes */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_errcode_intern_init())) {
|
|
|
|
error = "ompi_errcode_intern_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
2004-05-07 23:23:03 +00:00
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
/* initialize groups */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_group_init())) {
|
|
|
|
error = "ompi_group_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* initialize communicators */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_comm_init())) {
|
|
|
|
error = "ompi_comm_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* initialize datatypes */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_ddt_init())) {
|
|
|
|
error = "ompi_ddt_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* initialize ops */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_op_init())) {
|
|
|
|
error = "ompi_op_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* initialize file handles */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_file_init())) {
|
|
|
|
error = "ompi_file_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-09-16 00:00:09 +00:00
|
|
|
/* initialize attribute meta-data structure for comm/win/dtype */
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_attr_init())) {
|
|
|
|
error = "ompi_attr_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
2004-09-05 16:05:37 +00:00
|
|
|
/* do module exchange */
|
|
|
|
if (OMPI_SUCCESS != (ret = mca_base_modex_exchange())) {
|
|
|
|
error = "ompi_base_modex_exchange() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* add all ompi_proc_t's to PML */
|
|
|
|
if (NULL == (procs = ompi_proc_world(&nprocs))) {
|
|
|
|
error = "ompi_proc_world() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
if (OMPI_SUCCESS != (ret = mca_pml.pml_add_procs(procs, nprocs))) {
|
|
|
|
free(procs);
|
|
|
|
error = "PML add procs failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
free(procs);
|
|
|
|
|
|
|
|
/* start PTL's */
|
|
|
|
param = 1;
|
|
|
|
if (OMPI_SUCCESS !=
|
|
|
|
(ret = mca_pml.pml_control(MCA_PTL_ENABLE, ¶m, sizeof(param)))) {
|
|
|
|
error = "PML control failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* save the resulting thread levels */
|
2004-02-05 01:52:56 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
ompi_mpi_thread_requested = requested;
|
2004-10-10 00:03:42 +00:00
|
|
|
ompi_mpi_thread_provided = *provided;
|
2004-06-29 00:02:25 +00:00
|
|
|
ompi_mpi_thread_multiple = (ompi_mpi_thread_provided ==
|
|
|
|
MPI_THREAD_MULTIPLE);
|
2004-02-05 01:52:56 +00:00
|
|
|
|
2004-05-07 23:23:03 +00:00
|
|
|
/* Init coll for the comms */
|
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
if (OMPI_SUCCESS !=
|
|
|
|
(ret = mca_coll_base_comm_select(MPI_COMM_SELF, NULL))) {
|
|
|
|
error = "mca_coll_base_comm_select(MPI_COMM_SELF) failed";
|
|
|
|
goto error;
|
2004-07-13 12:35:43 +00:00
|
|
|
}
|
2004-05-07 23:23:03 +00:00
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
if (OMPI_SUCCESS !=
|
|
|
|
(ret = mca_coll_base_comm_select(MPI_COMM_WORLD, NULL))) {
|
|
|
|
error = "mca_coll_base_comm_select(MPI_COMM_WORLD) failed";
|
|
|
|
goto error;
|
2004-07-13 12:35:43 +00:00
|
|
|
}
|
2004-05-07 23:23:03 +00:00
|
|
|
|
|
|
|
/* Wait for everyone to initialize */
|
|
|
|
|
2004-06-29 00:02:25 +00:00
|
|
|
if (MPI_SUCCESS != (ret =
|
|
|
|
MPI_COMM_WORLD->c_coll.coll_barrier(MPI_COMM_WORLD))) {
|
2004-09-05 16:05:37 +00:00
|
|
|
error = "Barrier over MPI_COMM_WORLD failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-09-29 12:41:55 +00:00
|
|
|
/* new very last step: check whether we have been spawned or not.
|
|
|
|
We introduce that at the very end, since we need collectives,
|
|
|
|
datatypes, ptls etc. up and running here....
|
|
|
|
*/
|
|
|
|
if (OMPI_SUCCESS != (ret = ompi_comm_dyn_init())) {
|
|
|
|
error = "ompi_comm_dyn_init() failed";
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2004-10-28 15:40:46 +00:00
|
|
|
#if OMPI_HAVE_THREADS == 0
|
|
|
|
ompi_progress_events(OMPI_EVLOOP_NONBLOCK);
|
|
|
|
#endif
|
|
|
|
|
2004-09-05 16:05:37 +00:00
|
|
|
error:
|
|
|
|
if (ret != OMPI_SUCCESS) {
|
|
|
|
ompi_show_help("help-mpi-runtime",
|
|
|
|
"mpi_init:startup:internal-failure", true,
|
|
|
|
"MPI_INIT", "MPI_INIT", error, ret);
|
|
|
|
return ret;
|
2004-06-29 00:02:25 +00:00
|
|
|
}
|
2004-05-07 23:23:03 +00:00
|
|
|
|
2004-02-13 13:56:55 +00:00
|
|
|
/* All done */
|
2004-02-05 01:52:56 +00:00
|
|
|
|
2004-06-07 15:33:53 +00:00
|
|
|
ompi_mpi_initialized = true;
|
|
|
|
ompi_mpi_finalized = false;
|
2004-02-13 13:56:55 +00:00
|
|
|
return MPI_SUCCESS;
|
2004-01-15 06:08:25 +00:00
|
|
|
}
|