/* * Copyright (c) 2004-2007 The Trustees of Indiana University and Indiana * University Research and Technology * Corporation. All rights reserved. * Copyright (c) 2004-2011 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. * Copyright (c) 2013 Los Alamos National Security, LLC. All rights reserved. * Copyright (c) 2013 Cisco Systems, Inc. All rights reserved. * Copyright (c) 2015-2016 Intel, Inc. All rights reserved. * Copyright (c) 2015 Research Organization for Information Science * and Technology (RIST). All rights reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ */ #include "orte_config.h" #include "orte/constants.h" #include #include #include "orte/mca/mca.h" #include "opal/mca/base/base.h" #include "opal/util/os_dirpath.h" #include "opal/util/output.h" #include "opal/util/basename.h" #include "orte/util/proc_info.h" #include "orte/runtime/orte_globals.h" #include "orte/util/name_fns.h" #include "orte/mca/iof/iof.h" #include "orte/mca/iof/base/base.h" /* * The following file was created by configure. It contains extern * statements and the definition of an array of pointers to each * component's public orte_base_component_t struct. */ #include "orte/mca/iof/base/static-components.h" orte_iof_base_module_t orte_iof = {0}; /* class instances */ static void orte_iof_job_construct(orte_iof_job_t *ptr) { ptr->jdata = NULL; OBJ_CONSTRUCT(&ptr->xoff, opal_bitmap_t); } static void orte_iof_job_destruct(orte_iof_job_t *ptr) { if (NULL != ptr->jdata) { OBJ_RELEASE(ptr->jdata); } OBJ_DESTRUCT(&ptr->xoff); } OBJ_CLASS_INSTANCE(orte_iof_job_t, opal_object_t, orte_iof_job_construct, orte_iof_job_destruct); static void orte_iof_base_proc_construct(orte_iof_proc_t* ptr) { ptr->stdinev = NULL; ptr->revstdout = NULL; ptr->revstderr = NULL; ptr->revstddiag = NULL; ptr->subscribers = NULL; ptr->copy = true; } static void orte_iof_base_proc_destruct(orte_iof_proc_t* ptr) { if (NULL != ptr->stdinev) { OBJ_RELEASE(ptr->stdinev); } if (NULL != ptr->revstdout) { OBJ_RELEASE(ptr->revstdout); } if (NULL != ptr->revstderr) { OBJ_RELEASE(ptr->revstderr); } if (NULL != ptr->revstddiag) { OBJ_RELEASE(ptr->revstddiag); } if (NULL != ptr->subscribers) { OPAL_LIST_RELEASE(ptr->subscribers); } } OBJ_CLASS_INSTANCE(orte_iof_proc_t, opal_list_item_t, orte_iof_base_proc_construct, orte_iof_base_proc_destruct); static void orte_iof_base_sink_construct(orte_iof_sink_t* ptr) { ptr->daemon.jobid = ORTE_JOBID_INVALID; ptr->daemon.vpid = ORTE_VPID_INVALID; ptr->wev = OBJ_NEW(orte_iof_write_event_t); ptr->xoff = false; ptr->exclusive = false; } static void orte_iof_base_sink_destruct(orte_iof_sink_t* ptr) { OPAL_OUTPUT_VERBOSE((20, orte_iof_base_framework.framework_output, "%s iof: closing sink for process %s", ORTE_NAME_PRINT(ORTE_PROC_MY_NAME), ORTE_NAME_PRINT(&ptr->name))); if (NULL != ptr->wev && 0 <= ptr->wev->fd) { OBJ_RELEASE(ptr->wev); } } OBJ_CLASS_INSTANCE(orte_iof_sink_t, opal_list_item_t, orte_iof_base_sink_construct, orte_iof_base_sink_destruct); static void orte_iof_base_read_event_construct(orte_iof_read_event_t* rev) { rev->proc = NULL; rev->fd = -1; rev->active = false; rev->ev = opal_event_alloc(); rev->sink = NULL; } static void orte_iof_base_read_event_destruct(orte_iof_read_event_t* rev) { orte_iof_proc_t *proct = (orte_iof_proc_t*)rev->proc; opal_event_free(rev->ev); if (0 <= rev->fd) { OPAL_OUTPUT_VERBOSE((20, orte_iof_base_framework.framework_output, "%s iof: closing fd %d for process %s", ORTE_NAME_PRINT(ORTE_PROC_MY_NAME), rev->fd, (NULL == proct) ? "UNKNOWN" : ORTE_NAME_PRINT(&proct->name))); close(rev->fd); rev->fd = -1; } if (NULL != rev->sink) { OBJ_RELEASE(rev->sink); } if (NULL != proct) { OBJ_RELEASE(proct); } } OBJ_CLASS_INSTANCE(orte_iof_read_event_t, opal_object_t, orte_iof_base_read_event_construct, orte_iof_base_read_event_destruct); static void orte_iof_base_write_event_construct(orte_iof_write_event_t* wev) { wev->pending = false; wev->fd = -1; OBJ_CONSTRUCT(&wev->outputs, opal_list_t); wev->ev = opal_event_alloc(); } static void orte_iof_base_write_event_destruct(orte_iof_write_event_t* wev) { opal_event_free(wev->ev); if (ORTE_PROC_IS_HNP && NULL != orte_xml_fp) { int xmlfd = fileno(orte_xml_fp); if (xmlfd == wev->fd) { /* don't close this one - will get it later */ OBJ_DESTRUCT(&wev->outputs); return; } } if (2 < wev->fd) { OPAL_OUTPUT_VERBOSE((20, orte_iof_base_framework.framework_output, "%s iof: closing fd %d for write event", ORTE_NAME_PRINT(ORTE_PROC_MY_NAME), wev->fd)); close(wev->fd); } OBJ_DESTRUCT(&wev->outputs); } OBJ_CLASS_INSTANCE(orte_iof_write_event_t, opal_list_item_t, orte_iof_base_write_event_construct, orte_iof_base_write_event_destruct); OBJ_CLASS_INSTANCE(orte_iof_write_output_t, opal_list_item_t, NULL, NULL); /* * Global variables */ orte_iof_base_t orte_iof_base = {0}; static int orte_iof_base_register(mca_base_register_flag_t flags) { /* check for maximum number of pending output messages */ orte_iof_base.output_limit = (size_t) INT_MAX; (void) mca_base_var_register("orte", "iof", "base", "output_limit", "Maximum backlog of output messages [default: unlimited]", MCA_BASE_VAR_TYPE_SIZE_T, NULL, 0, 0, OPAL_INFO_LVL_9, MCA_BASE_VAR_SCOPE_READONLY, &orte_iof_base.output_limit); /* check for files to be sent to stdin of procs */ orte_iof_base.input_files = NULL; (void) mca_base_var_register("orte", "iof","base", "input_files", "Comma-separated list of input files to be read and sent to stdin of procs (default: NULL)", MCA_BASE_VAR_TYPE_STRING, NULL, 0, 0, OPAL_INFO_LVL_9, MCA_BASE_VAR_SCOPE_READONLY, &orte_iof_base.input_files); return ORTE_SUCCESS; } static int orte_iof_base_close(void) { /* Close the selected component */ if (NULL != orte_iof.finalize) { orte_iof.finalize(); } return mca_base_framework_components_close(&orte_iof_base_framework, NULL); } /** * Function for finding and opening either all MCA components, or the one * that was specifically requested via a MCA parameter. */ static int orte_iof_base_open(mca_base_open_flag_t flags) { int rc, xmlfd; /* did the user request we print output to files? */ if (NULL != orte_output_filename) { /* we will setup the files themselves as needed in the iof * module. For now, let's see if the filename contains a * path, or just a name */ char *path; path = opal_dirname(orte_output_filename); if (NULL == path) { return ORTE_ERR_OUT_OF_RESOURCE; } if (0 != strcmp(path, orte_output_filename)) { /* there is a path in this name - ensure that the directory * exists, and create it if not */ if (ORTE_SUCCESS != (rc = opal_os_dirpath_create(path, S_IRWXU))) { free(path); return rc; } } free(path); } /* daemons do not need to do this as they do not write out stdout/err */ if (!ORTE_PROC_IS_DAEMON || (ORTE_PROC_IS_DAEMON && ORTE_PROC_IS_CM)) { if (orte_xml_output) { if (NULL != orte_xml_fp) { /* user wants all xml-formatted output sent to file */ xmlfd = fileno(orte_xml_fp); } else { xmlfd = 1; } /* setup the stdout event */ ORTE_IOF_SINK_DEFINE(&orte_iof_base.iof_write_stdout, ORTE_PROC_MY_NAME, xmlfd, ORTE_IOF_STDOUT, orte_iof_base_write_handler); /* don't create a stderr event - all output will go to * the stdout channel */ } else { /* setup the stdout event */ ORTE_IOF_SINK_DEFINE(&orte_iof_base.iof_write_stdout, ORTE_PROC_MY_NAME, 1, ORTE_IOF_STDOUT, orte_iof_base_write_handler); /* setup the stderr event */ ORTE_IOF_SINK_DEFINE(&orte_iof_base.iof_write_stderr, ORTE_PROC_MY_NAME, 2, ORTE_IOF_STDERR, orte_iof_base_write_handler); } /* do NOT set these file descriptors to non-blocking. If we do so, * we set the file descriptor to non-blocking for everyone that has * that file descriptor, which includes everyone else in our shell * pipeline chain. (See * http://lists.freebsd.org/pipermail/freebsd-hackers/2005-January/009742.html). * This causes things like "mpirun -np 1 big_app | cat" to lose * output, because cat's stdout is then ALSO non-blocking and cat * isn't built to deal with that case (same with almost all other * unix text utils). */ } /* Open up all available components */ return mca_base_framework_components_open(&orte_iof_base_framework, flags); } MCA_BASE_FRAMEWORK_DECLARE(orte, iof, "ORTE I/O Forwarding", orte_iof_base_register, orte_iof_base_open, orte_iof_base_close, mca_iof_base_static_components, 0);