2004-10-15 16:31:54 +00:00
|
|
|
/*
|
2005-11-05 19:57:48 +00:00
|
|
|
* Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
|
|
* University Research and Technology
|
|
|
|
* Corporation. All rights reserved.
|
2006-08-23 03:32:36 +00:00
|
|
|
* Copyright (c) 2004-2006 The University of Tennessee and The University
|
2005-11-05 19:57:48 +00:00
|
|
|
* of Tennessee Research Foundation. All rights
|
|
|
|
* reserved.
|
2004-11-28 20:09:25 +00:00
|
|
|
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
|
|
|
|
* University of Stuttgart. All rights reserved.
|
2005-03-24 12:43:37 +00:00
|
|
|
* Copyright (c) 2004-2005 The Regents of the University of California.
|
|
|
|
* All rights reserved.
|
2004-11-22 01:38:40 +00:00
|
|
|
* $COPYRIGHT$
|
|
|
|
*
|
|
|
|
* Additional copyrights may follow
|
|
|
|
*
|
2004-10-15 16:31:54 +00:00
|
|
|
* $HEADER$
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
2005-03-14 20:57:21 +00:00
|
|
|
#include "orte_config.h"
|
2004-10-15 16:31:54 +00:00
|
|
|
|
|
|
|
#include <stdio.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#ifdef HAVE_PWD_H
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <pwd.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#endif
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <stddef.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
2004-10-22 16:06:05 +00:00
|
|
|
#ifdef HAVE_LIBGEN_H
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <libgen.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#endif
|
|
|
|
#ifdef HAVE_SYS_PARAM_H
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <sys/param.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#endif
|
|
|
|
#ifdef HAVE_SYS_TYPES_H
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <sys/types.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#endif
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <sys/stat.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#ifdef HAVE_UNISTD_H
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <unistd.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#endif
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <errno.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#ifdef HAVE_DIRENT_H
|
2004-10-15 16:31:54 +00:00
|
|
|
#include <dirent.h>
|
2004-10-20 01:03:09 +00:00
|
|
|
#endif
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-02-12 01:33:29 +00:00
|
|
|
#include "orte/orte_constants.h"
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-02-12 01:33:29 +00:00
|
|
|
#include "orte/util/univ_info.h"
|
|
|
|
#include "orte/util/sys_info.h"
|
|
|
|
#include "orte/util/proc_info.h"
|
2005-07-03 23:31:27 +00:00
|
|
|
#include "opal/util/output.h"
|
2005-07-04 01:59:52 +00:00
|
|
|
#include "opal/util/os_path.h"
|
2006-07-03 22:23:07 +00:00
|
|
|
#include "opal/util/os_dirpath.h"
|
2006-08-23 03:32:36 +00:00
|
|
|
#include "opal/util/basename.h"
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-02-12 01:33:29 +00:00
|
|
|
#include "orte/mca/errmgr/errmgr.h"
|
|
|
|
#include "orte/runtime/runtime.h"
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-02-12 01:33:29 +00:00
|
|
|
#include "orte/util/session_dir.h"
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*******************************
|
|
|
|
* Local function Declarations
|
|
|
|
*******************************/
|
|
|
|
static int orte_create_dir(char *directory);
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
static bool orte_dir_check_file(const char *root, const char *path);
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2005-12-12 20:04:00 +00:00
|
|
|
#ifdef __WINDOWS__
|
2005-01-20 00:03:23 +00:00
|
|
|
#define OMPI_DEFAULT_TMPDIR "C:\\TEMP"
|
2005-01-24 22:51:15 +00:00
|
|
|
#else
|
|
|
|
#define OMPI_DEFAULT_TMPDIR "/tmp"
|
|
|
|
#endif
|
2004-10-22 16:06:05 +00:00
|
|
|
|
2005-06-26 23:11:37 +00:00
|
|
|
#define OMPI_PRINTF_FIX_STRING(a) ((NULL == a) ? "(null)" : a)
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/****************************
|
|
|
|
* Funcationality
|
|
|
|
****************************/
|
|
|
|
/*
|
|
|
|
* Check and create the directory requested
|
|
|
|
*/
|
|
|
|
static int orte_create_dir(char *directory)
|
|
|
|
{
|
|
|
|
#ifndef __WINDOWS__
|
|
|
|
mode_t my_mode = S_IRWXU; /* at the least, I need to be able to do anything */
|
|
|
|
#else
|
|
|
|
mode_t my_mode = _S_IREAD | _S_IWRITE | _S_IEXEC;
|
|
|
|
#endif
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
/* Sanity check before creating the directory with the proper mode,
|
|
|
|
* Make sure it doesn't exist already */
|
2006-07-03 22:23:07 +00:00
|
|
|
if( OPAL_ERR_NOT_FOUND != (ret = opal_os_dirpath_access(directory, my_mode)) ) {
|
|
|
|
/* Failure because opal_os_dirpath_access() indicated that either:
|
2006-06-28 21:03:31 +00:00
|
|
|
* - The directory exists and we can access it (no need to create it again),
|
2006-07-03 22:23:07 +00:00
|
|
|
* return OPAL_SUCCESS, or
|
|
|
|
* - don't have access rights, return OPAL_ERROR
|
2006-06-28 21:03:31 +00:00
|
|
|
*/
|
|
|
|
return(ret);
|
|
|
|
}
|
|
|
|
/* The directory doesn't exist so create it */
|
|
|
|
else {
|
2006-07-03 22:23:07 +00:00
|
|
|
return(opal_os_dirpath_create(directory, my_mode));
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Construct the fullpath to the session directory
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
orte_session_dir_get_name(char **fulldirpath,
|
|
|
|
char **prefix, /* This will come back as the valid tmp dir */
|
|
|
|
char **frontend,
|
|
|
|
char *usr, char *hostid,
|
|
|
|
char *batchid, char *univ,
|
|
|
|
char *job, char *proc) {
|
|
|
|
char *hostname = NULL,
|
|
|
|
*batchname = NULL,
|
|
|
|
*sessions = NULL,
|
|
|
|
*user = NULL,
|
|
|
|
*universe = NULL;
|
|
|
|
int exit_status = ORTE_SUCCESS;
|
|
|
|
|
|
|
|
/* Ensure that system info is set */
|
2005-03-14 20:57:21 +00:00
|
|
|
orte_sys_info();
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* set the 'user' value
|
|
|
|
*/
|
|
|
|
if( NULL != usr) { /* User specified version */
|
|
|
|
user = strdup(usr);
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
else { /* check if it is set elsewhere */
|
|
|
|
if( NULL != orte_system_info.user)
|
|
|
|
user = strdup(orte_system_info.user);
|
|
|
|
else {
|
|
|
|
/* Couldn't find it, so fail */
|
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* set the 'hostname'
|
|
|
|
*/
|
|
|
|
if( NULL != hostid) { /* User specified version */
|
|
|
|
hostname = strdup(hostid);
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
else { /* check if it is set elsewhere */
|
|
|
|
if( NULL != orte_system_info.nodename)
|
|
|
|
hostname = strdup(orte_system_info.nodename);
|
|
|
|
else {
|
|
|
|
/* Couldn't find it, so fail */
|
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* set the 'batchid'
|
|
|
|
*/
|
|
|
|
if (NULL != batchid)
|
|
|
|
batchname = strdup(batchid);
|
|
|
|
else
|
|
|
|
batchname = strdup("0");
|
|
|
|
|
|
|
|
/*
|
|
|
|
* set the 'universe'
|
|
|
|
*/
|
|
|
|
if( NULL != univ) { /* User specified version */
|
|
|
|
universe = strdup(univ);
|
|
|
|
}
|
|
|
|
else { /* check if it is set elsewhere */
|
2006-07-11 16:54:07 +00:00
|
|
|
if( NULL != orte_universe_info.name) {
|
2006-06-28 21:03:31 +00:00
|
|
|
universe = strdup(orte_universe_info.name);
|
2006-07-11 16:54:07 +00:00
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
else {
|
2006-07-11 16:54:07 +00:00
|
|
|
;/* Couldn't find it, so continue with caution */
|
2006-06-28 21:03:31 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2006-07-11 16:54:07 +00:00
|
|
|
* Check: Can't give proc or job without universe
|
|
|
|
*/
|
|
|
|
if( NULL == universe &&
|
|
|
|
(NULL != proc ||
|
|
|
|
NULL != job) ) {
|
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check: Can't give a proc without a job and universe
|
2006-06-28 21:03:31 +00:00
|
|
|
*/
|
|
|
|
if( NULL == job &&
|
|
|
|
NULL != proc) {
|
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* get the front part of the session directory
|
|
|
|
* Will look something like:
|
|
|
|
* openmpi-sessions-USERNAME@HOSTNAME_BATCHID
|
|
|
|
*/
|
|
|
|
if (NULL != orte_process_info.top_session_dir) {
|
|
|
|
*frontend = strdup(orte_process_info.top_session_dir);
|
|
|
|
}
|
|
|
|
else { /* If not set then construct it */
|
|
|
|
if (0 > asprintf(frontend, "openmpi-sessions-%s@%s_%s", user, hostname, batchname)) {
|
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Construct the session directory
|
|
|
|
*/
|
|
|
|
/* If we were given a 'proc' then we can construct it fully into:
|
|
|
|
* openmpi-sessions-USERNAME@HOSTNAME_BATCHID/UNIVERSE/JOBID/PROC
|
|
|
|
*/
|
|
|
|
if( NULL != proc) {
|
2006-08-23 03:32:36 +00:00
|
|
|
sessions = opal_os_path( false, *frontend, universe, job, proc, NULL );
|
|
|
|
if( NULL == sessions ) {
|
2006-06-28 21:03:31 +00:00
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/* If we were given a 'job' then we can construct it partially into:
|
|
|
|
* openmpi-sessions-USERNAME@HOSTNAME_BATCHID/UNIVERSE/JOBID
|
|
|
|
*/
|
|
|
|
else if(NULL != job) {
|
2006-08-23 03:32:36 +00:00
|
|
|
sessions = opal_os_path( false, *frontend, universe, job, NULL );
|
|
|
|
if( NULL == sessions ) {
|
2006-06-28 21:03:31 +00:00
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/* If we were given neither then we can construct it partially into:
|
|
|
|
* openmpi-sessions-USERNAME@HOSTNAME_BATCHID/UNIVERSE
|
|
|
|
*/
|
2006-07-11 16:54:07 +00:00
|
|
|
else if(NULL != universe) {
|
2006-08-23 03:32:36 +00:00
|
|
|
sessions = opal_os_path( false, *frontend, universe, NULL );
|
|
|
|
if( NULL == sessions ) {
|
2006-06-28 21:03:31 +00:00
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
2006-07-11 16:54:07 +00:00
|
|
|
/* If we were not given 'universe' then we can construct it into:
|
|
|
|
* openmpi-sessions-USERNAME@HOSTNAME_BATCHID
|
|
|
|
*/
|
|
|
|
else {
|
|
|
|
if (0 > asprintf(&sessions, "%s",
|
|
|
|
*frontend) ) {
|
|
|
|
exit_status = ORTE_ERROR;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* If the user specified an invalid prefix, or no prefix at all
|
|
|
|
* we need to keep looking
|
|
|
|
*/
|
|
|
|
if( NULL != *fulldirpath) {
|
|
|
|
free(*fulldirpath);
|
|
|
|
*fulldirpath = NULL;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
if( NULL != *prefix) { /* use the user specified one, if available */
|
|
|
|
;
|
|
|
|
}
|
|
|
|
/* Try to find a proper alternative prefix */
|
|
|
|
else if (NULL != orte_process_info.tmpdir_base) { /* stored value */
|
|
|
|
*prefix = strdup(orte_process_info.tmpdir_base);
|
|
|
|
}
|
|
|
|
else if( NULL != getenv("OMPI_PREFIX_ENV") ) { /* OMPI Environment var */
|
|
|
|
*prefix = strdup(getenv("OMPI_PREFIX_ENV"));
|
|
|
|
}
|
|
|
|
else if( NULL != getenv("TMPDIR") ) { /* General Environment var */
|
|
|
|
*prefix = strdup(getenv("TMPDIR"));
|
|
|
|
}
|
|
|
|
else if( NULL != getenv("TMP") ) { /* Another general environment var */
|
|
|
|
*prefix = strdup(getenv("TMP"));
|
|
|
|
}
|
|
|
|
else { /* ow. just use the default tmp directory */
|
|
|
|
*prefix = strdup(OMPI_DEFAULT_TMPDIR);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Construct the absolute final path
|
|
|
|
*/
|
2006-08-23 03:32:36 +00:00
|
|
|
*fulldirpath = opal_os_path(false, *prefix, sessions, NULL);
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
|
|
|
|
cleanup:
|
|
|
|
if(NULL != hostname)
|
|
|
|
free(hostname);
|
|
|
|
if(NULL != batchname)
|
|
|
|
free(batchname);
|
|
|
|
if(NULL != sessions)
|
|
|
|
free(sessions);
|
|
|
|
if(NULL != user)
|
|
|
|
free(user);
|
|
|
|
if(NULL != universe)
|
|
|
|
free(universe);
|
|
|
|
|
|
|
|
return exit_status;
|
|
|
|
}
|
2005-03-18 23:58:36 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Construct the session directory and create it if necessary
|
|
|
|
*/
|
|
|
|
int orte_session_dir(bool create,
|
|
|
|
char *prefix, char *usr, char *hostid,
|
|
|
|
char *batchid, char *univ, char *job, char *proc)
|
|
|
|
{
|
|
|
|
char *fulldirpath = NULL,
|
|
|
|
*frontend = NULL,
|
|
|
|
*sav = NULL;
|
|
|
|
int return_code = ORTE_SUCCESS, rtn;
|
|
|
|
/* This indicates if the prefix was set, and so if it fails then we
|
|
|
|
* should try with the default prefixes.*/
|
|
|
|
bool dbl_check_prefix = false;
|
2006-07-03 22:23:07 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
if( NULL != prefix)
|
|
|
|
dbl_check_prefix = true;
|
|
|
|
|
|
|
|
try_again:
|
|
|
|
/*
|
|
|
|
* If the first attempt at the path creation failed, try with a null
|
|
|
|
* prefix. unless the original prefix was null, then we fail.
|
|
|
|
*/
|
|
|
|
if(!dbl_check_prefix && /* an indicator that we are trying a second time */
|
|
|
|
NULL != prefix) {
|
|
|
|
free(prefix);
|
|
|
|
prefix = NULL;
|
2005-03-18 23:58:36 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Get the session directory full name
|
|
|
|
* First try it with the specified prefix.
|
|
|
|
*/
|
|
|
|
if( ORTE_SUCCESS != ( rtn = orte_session_dir_get_name(&fulldirpath,
|
|
|
|
&prefix,
|
|
|
|
&frontend,
|
|
|
|
usr, hostid,
|
|
|
|
batchid, univ, job,
|
|
|
|
proc) ) ) {
|
|
|
|
return_code = rtn;
|
|
|
|
/*
|
|
|
|
* If the first attempt at the path creation failed, try with a null
|
|
|
|
* prefix. unless the original prefix was null, then we fail :(
|
|
|
|
*/
|
|
|
|
if(dbl_check_prefix) {
|
|
|
|
dbl_check_prefix = false;
|
|
|
|
goto try_again;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Now that we have the full path, go ahead and create it if necessary
|
|
|
|
*/
|
|
|
|
if( create ) {
|
|
|
|
if( ORTE_SUCCESS != (rtn = orte_create_dir(fulldirpath) ) ) {
|
|
|
|
return_code = rtn;
|
|
|
|
|
|
|
|
if(dbl_check_prefix) {
|
|
|
|
dbl_check_prefix = false;
|
|
|
|
goto try_again;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* if we are not creating, then just verify that the path is OK
|
|
|
|
*/
|
|
|
|
else {
|
2006-07-03 22:23:07 +00:00
|
|
|
if( ORTE_SUCCESS != (rtn = opal_os_dirpath_access(fulldirpath, 0) )) {
|
2006-06-28 21:03:31 +00:00
|
|
|
/* It is not valid so we give up and return an error */
|
|
|
|
return_code = rtn;
|
|
|
|
|
|
|
|
if(dbl_check_prefix) {
|
|
|
|
dbl_check_prefix = false;
|
|
|
|
goto try_again;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2005-03-18 23:58:36 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
return_code = ORTE_SUCCESS;
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* If we are creating the directory tree, the overwrite the
|
|
|
|
* global structure fields
|
|
|
|
*/
|
|
|
|
if (create) {
|
2005-03-18 23:58:36 +00:00
|
|
|
if (NULL != orte_process_info.tmpdir_base) {
|
|
|
|
free(orte_process_info.tmpdir_base);
|
|
|
|
orte_process_info.tmpdir_base = NULL;
|
|
|
|
}
|
|
|
|
if (NULL != orte_process_info.top_session_dir) {
|
|
|
|
free(orte_process_info.top_session_dir);
|
|
|
|
orte_process_info.top_session_dir = NULL;
|
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Update some of the global structures if they are empty
|
|
|
|
*/
|
|
|
|
if (NULL == orte_process_info.tmpdir_base)
|
|
|
|
orte_process_info.tmpdir_base = strdup(prefix);
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
if (NULL == orte_process_info.top_session_dir)
|
|
|
|
orte_process_info.top_session_dir = strdup(frontend);
|
|
|
|
|
2004-10-15 16:31:54 +00:00
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Set the process session directory
|
|
|
|
*/
|
2004-10-15 16:31:54 +00:00
|
|
|
if (NULL != proc) {
|
2005-03-18 23:58:36 +00:00
|
|
|
if (create) { /* overwrite if creating */
|
|
|
|
if (NULL != orte_process_info.proc_session_dir) {
|
2006-06-28 21:03:31 +00:00
|
|
|
free(orte_process_info.proc_session_dir);
|
|
|
|
orte_process_info.proc_session_dir = NULL;
|
2005-03-18 23:58:36 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if (NULL == orte_process_info.proc_session_dir) {
|
|
|
|
orte_process_info.proc_session_dir = strdup(fulldirpath);
|
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
|
|
|
|
/* Strip off last part of directory structure */
|
2006-08-23 03:32:36 +00:00
|
|
|
sav = opal_dirname(fulldirpath);
|
2006-06-28 21:03:31 +00:00
|
|
|
free(fulldirpath);
|
2006-08-23 03:32:36 +00:00
|
|
|
fulldirpath = sav;
|
2006-06-28 21:03:31 +00:00
|
|
|
sav = NULL;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Set the job session directory
|
|
|
|
*/
|
2004-10-15 16:31:54 +00:00
|
|
|
if (NULL != job) {
|
2005-03-18 23:58:36 +00:00
|
|
|
if (create) { /* overwrite if creating */
|
|
|
|
if (NULL != orte_process_info.job_session_dir) {
|
2006-06-28 21:03:31 +00:00
|
|
|
free(orte_process_info.job_session_dir);
|
|
|
|
orte_process_info.job_session_dir = NULL;
|
2005-03-18 23:58:36 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if (NULL == orte_process_info.job_session_dir) {
|
|
|
|
orte_process_info.job_session_dir = strdup(fulldirpath);
|
|
|
|
}
|
2006-06-28 21:03:31 +00:00
|
|
|
|
|
|
|
/* Strip off last part of directory structure */
|
2006-08-23 03:32:36 +00:00
|
|
|
sav = opal_dirname(fulldirpath);
|
2006-06-28 21:03:31 +00:00
|
|
|
free(fulldirpath);
|
2006-08-23 03:32:36 +00:00
|
|
|
fulldirpath = sav;
|
2006-06-28 21:03:31 +00:00
|
|
|
sav = NULL;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
/*
|
|
|
|
* Set the universe session directory
|
|
|
|
*/
|
2004-10-15 16:31:54 +00:00
|
|
|
if (create) { /* overwrite if creating */
|
2005-03-18 23:58:36 +00:00
|
|
|
if (NULL != orte_process_info.universe_session_dir) {
|
|
|
|
free(orte_process_info.universe_session_dir);
|
|
|
|
orte_process_info.universe_session_dir = NULL;
|
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
2005-03-14 20:57:21 +00:00
|
|
|
if (NULL == orte_process_info.universe_session_dir) {
|
|
|
|
orte_process_info.universe_session_dir = strdup(fulldirpath);
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2005-03-14 20:57:21 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "procdir: %s",
|
2005-06-26 23:11:37 +00:00
|
|
|
OMPI_PRINTF_FIX_STRING(orte_process_info.proc_session_dir));
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "jobdir: %s",
|
2005-06-26 23:11:37 +00:00
|
|
|
OMPI_PRINTF_FIX_STRING(orte_process_info.job_session_dir));
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "unidir: %s",
|
2005-06-26 23:11:37 +00:00
|
|
|
OMPI_PRINTF_FIX_STRING(orte_process_info.universe_session_dir));
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "top: %s",
|
2005-06-26 23:11:37 +00:00
|
|
|
OMPI_PRINTF_FIX_STRING(orte_process_info.top_session_dir));
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "tmp: %s",
|
2005-06-26 23:11:37 +00:00
|
|
|
OMPI_PRINTF_FIX_STRING(orte_process_info.tmpdir_base));
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-06-28 21:03:31 +00:00
|
|
|
cleanup:
|
|
|
|
if(NULL != fulldirpath)
|
2004-10-15 16:31:54 +00:00
|
|
|
free(fulldirpath);
|
2006-06-28 21:03:31 +00:00
|
|
|
if(NULL != frontend)
|
|
|
|
free(frontend);
|
|
|
|
if(NULL != sav)
|
|
|
|
free(sav);
|
|
|
|
|
2004-10-15 16:31:54 +00:00
|
|
|
return return_code;
|
|
|
|
}
|
|
|
|
|
2006-02-16 00:16:22 +00:00
|
|
|
/*
|
2006-06-28 21:03:31 +00:00
|
|
|
* A job has aborted - so force cleanup of the session directory
|
2006-02-16 00:16:22 +00:00
|
|
|
*/
|
|
|
|
int
|
|
|
|
orte_session_dir_cleanup(orte_jobid_t jobid)
|
|
|
|
{
|
|
|
|
int rc;
|
|
|
|
char *tmp;
|
|
|
|
char *job, *job_session_dir;
|
|
|
|
|
|
|
|
/* need to setup the top_session_dir with the prefix */
|
|
|
|
tmp = opal_os_path(false,
|
|
|
|
orte_process_info.tmpdir_base,
|
|
|
|
orte_process_info.top_session_dir, NULL);
|
|
|
|
|
|
|
|
/* define the proc and job session directories for this process */
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ns.convert_jobid_to_string(&job, jobid))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
free(tmp);
|
|
|
|
return rc;
|
|
|
|
}
|
2006-08-23 03:32:36 +00:00
|
|
|
job_session_dir = opal_os_path( false, orte_process_info.universe_session_dir,
|
|
|
|
job, NULL );
|
|
|
|
if( NULL == job_session_dir ) {
|
2006-02-16 00:16:22 +00:00
|
|
|
ORTE_ERROR_LOG(ORTE_ERR_OUT_OF_RESOURCE);
|
|
|
|
free(tmp);
|
|
|
|
free(job);
|
|
|
|
return ORTE_ERR_OUT_OF_RESOURCE;
|
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
opal_os_dirpath_destroy(job_session_dir,
|
|
|
|
true, orte_dir_check_file);
|
|
|
|
opal_os_dirpath_destroy(orte_process_info.universe_session_dir,
|
|
|
|
false, orte_dir_check_file);
|
|
|
|
opal_os_dirpath_destroy(tmp,
|
|
|
|
false, orte_dir_check_file);
|
|
|
|
|
|
|
|
if (opal_os_dirpath_is_empty(job_session_dir)) {
|
2006-02-16 00:16:22 +00:00
|
|
|
if (orte_debug_flag) {
|
|
|
|
opal_output(0, "sess_dir_finalize: found job session dir empty - deleting");
|
|
|
|
}
|
|
|
|
rmdir(job_session_dir);
|
|
|
|
} else {
|
|
|
|
if (orte_debug_flag) {
|
|
|
|
opal_output(0, "sess_dir_finalize: job session dir not empty - leaving");
|
|
|
|
}
|
|
|
|
goto CLEANUP;
|
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
if (opal_os_dirpath_is_empty(orte_process_info.universe_session_dir)) {
|
2006-02-16 00:16:22 +00:00
|
|
|
if (orte_debug_flag) {
|
|
|
|
opal_output(0, "sess_dir_finalize: found univ session dir empty - deleting");
|
|
|
|
}
|
|
|
|
rmdir(orte_process_info.universe_session_dir);
|
|
|
|
} else {
|
|
|
|
if (orte_debug_flag) {
|
|
|
|
opal_output(0, "sess_dir_finalize: univ session dir not empty - leaving");
|
|
|
|
}
|
|
|
|
goto CLEANUP;
|
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
if (opal_os_dirpath_is_empty(tmp)) {
|
2006-02-16 00:16:22 +00:00
|
|
|
if (orte_debug_flag) {
|
|
|
|
opal_output(0, "sess_dir_finalize: found top session dir empty - deleting");
|
|
|
|
}
|
|
|
|
rmdir(tmp);
|
|
|
|
} else {
|
|
|
|
if (orte_debug_flag) {
|
|
|
|
opal_output(0, "sess_dir_finalize: top session dir not empty - leaving");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
CLEANUP:
|
|
|
|
free(tmp);
|
|
|
|
free(job);
|
|
|
|
free(job_session_dir);
|
|
|
|
return ORTE_SUCCESS;
|
|
|
|
}
|
|
|
|
|
2004-10-15 16:31:54 +00:00
|
|
|
|
|
|
|
int
|
2005-04-14 01:04:26 +00:00
|
|
|
orte_session_dir_finalize(orte_process_name_t *proc)
|
2004-10-15 16:31:54 +00:00
|
|
|
{
|
2005-04-14 01:04:26 +00:00
|
|
|
int rc;
|
2005-04-07 19:19:48 +00:00
|
|
|
char *tmp;
|
2005-04-14 01:04:26 +00:00
|
|
|
char *job, *job_session_dir, *vpid, *proc_session_dir;
|
2005-05-12 21:44:23 +00:00
|
|
|
|
2005-04-07 19:19:48 +00:00
|
|
|
/* need to setup the top_session_dir with the prefix */
|
2005-08-29 21:35:01 +00:00
|
|
|
tmp = opal_os_path(false,
|
|
|
|
orte_process_info.tmpdir_base,
|
|
|
|
orte_process_info.top_session_dir, NULL);
|
2005-04-07 19:19:48 +00:00
|
|
|
|
2005-04-14 01:04:26 +00:00
|
|
|
/* define the proc and job session directories for this process */
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ns.get_jobid_string(&job, proc))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
free(tmp);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
if (ORTE_SUCCESS != (rc = orte_ns.get_vpid_string(&vpid, proc))) {
|
|
|
|
ORTE_ERROR_LOG(rc);
|
|
|
|
free(tmp);
|
|
|
|
free(job);
|
|
|
|
return rc;
|
|
|
|
}
|
2006-08-23 03:32:36 +00:00
|
|
|
job_session_dir = opal_os_path( false, orte_process_info.universe_session_dir,
|
|
|
|
job, NULL );
|
|
|
|
if( NULL == job_session_dir ) {
|
2005-04-14 01:04:26 +00:00
|
|
|
ORTE_ERROR_LOG(ORTE_ERR_OUT_OF_RESOURCE);
|
|
|
|
free(tmp);
|
|
|
|
free(job);
|
|
|
|
free(vpid);
|
|
|
|
return ORTE_ERR_OUT_OF_RESOURCE;
|
|
|
|
}
|
2006-08-23 03:32:36 +00:00
|
|
|
proc_session_dir = opal_os_path( false, job_session_dir, vpid, NULL );
|
|
|
|
if( NULL == proc_session_dir ) {
|
2005-04-14 01:04:26 +00:00
|
|
|
ORTE_ERROR_LOG(ORTE_ERR_OUT_OF_RESOURCE);
|
|
|
|
free(tmp);
|
|
|
|
free(job);
|
|
|
|
free(vpid);
|
|
|
|
free(job_session_dir);
|
|
|
|
return ORTE_ERR_OUT_OF_RESOURCE;
|
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
opal_os_dirpath_destroy(proc_session_dir,
|
|
|
|
false, orte_dir_check_file);
|
|
|
|
opal_os_dirpath_destroy(job_session_dir,
|
|
|
|
false, orte_dir_check_file);
|
|
|
|
opal_os_dirpath_destroy(orte_process_info.universe_session_dir,
|
|
|
|
false, orte_dir_check_file);
|
|
|
|
opal_os_dirpath_destroy(tmp,
|
|
|
|
false, orte_dir_check_file);
|
|
|
|
|
|
|
|
if (opal_os_dirpath_is_empty(proc_session_dir)) {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: found proc session dir empty - deleting");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
2005-04-14 01:04:26 +00:00
|
|
|
rmdir(proc_session_dir);
|
2004-10-15 16:31:54 +00:00
|
|
|
} else {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: proc session dir not empty - leaving");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
2005-04-14 01:04:26 +00:00
|
|
|
goto CLEANUP;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
if (opal_os_dirpath_is_empty(job_session_dir)) {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: found job session dir empty - deleting");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
2005-04-14 01:04:26 +00:00
|
|
|
rmdir(job_session_dir);
|
2004-10-15 16:31:54 +00:00
|
|
|
} else {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: job session dir not empty - leaving");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
2005-04-14 01:04:26 +00:00
|
|
|
goto CLEANUP;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
if (opal_os_dirpath_is_empty(orte_process_info.universe_session_dir)) {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: found univ session dir empty - deleting");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
|
|
|
rmdir(orte_process_info.universe_session_dir);
|
2004-10-15 16:31:54 +00:00
|
|
|
} else {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: univ session dir not empty - leaving");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
2005-04-14 01:04:26 +00:00
|
|
|
goto CLEANUP;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
if (opal_os_dirpath_is_empty(tmp)) {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: found top session dir empty - deleting");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
|
|
|
rmdir(tmp);
|
2004-10-15 16:31:54 +00:00
|
|
|
} else {
|
2005-04-07 19:19:48 +00:00
|
|
|
if (orte_debug_flag) {
|
2005-07-03 23:31:27 +00:00
|
|
|
opal_output(0, "sess_dir_finalize: top session dir not empty - leaving");
|
2005-04-07 19:19:48 +00:00
|
|
|
}
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2005-04-14 01:04:26 +00:00
|
|
|
CLEANUP:
|
2005-04-07 19:19:48 +00:00
|
|
|
free(tmp);
|
2005-04-14 01:04:26 +00:00
|
|
|
free(job);
|
|
|
|
free(vpid);
|
|
|
|
free(job_session_dir);
|
|
|
|
free(proc_session_dir);
|
2005-08-15 18:25:35 +00:00
|
|
|
return ORTE_SUCCESS;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
static bool
|
|
|
|
orte_dir_check_file(const char *root, const char *path) {
|
2006-02-16 00:16:22 +00:00
|
|
|
|
2006-07-03 22:23:07 +00:00
|
|
|
/*
|
|
|
|
* Keep:
|
|
|
|
* - files starting with "output-"
|
|
|
|
* - universe contact (universe-setup.txt)
|
|
|
|
*/
|
|
|
|
if( (0 == strncmp(path, "output-", strlen("output-"))) ||
|
|
|
|
(0 == strcmp(path, "universe-setup.txt"))) {
|
|
|
|
return false;
|
2004-11-02 21:48:31 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
2004-10-15 16:31:54 +00:00
|
|
|
}
|