1
1
Charles Shereda cbc6feaab2 Created opal_gethostname() as safer gethostname substitute.
The opal_gethostname() function provides a more robust mechanism
to retrieve the hostname than gethostname(), which can return
results that are not null-terminated, and which can vary in its
behavior from system to system.

opal_gethostname() just returns the value in opal_process_info.nodename;
this is populated in opal_init_gethostname() inside opal_init.c.

-Changed all gethostname calls in opal subtree to opal_gethostname
-Changed all gethostname calls in orte subtree to opal_gethostname
-Changed all gethostname calls in ompi subdir to opal_gethostname
-Changed all gethostname calls in oshmem subdir to opal_gethostname
-Changed opal_if.c in test subdir to use opal_gethostname
-Changed opal_init.c to include opal_init_gethostname. This function
 returns an int and directly sets opal_process_info.nodename per
 jsquyres' modifications.

Relates to open-mpi#6801

Signed-off-by: Charles Shereda <cpshereda@lanl.gov>
2020-01-13 08:52:17 -08:00

176 строки
5.0 KiB
C

/*
* Copyright (C) 2014 Artem Polyakov <artpol84@gmail.com>
* Copyright (c) 2014-2017 Intel, Inc. All rights reserved.
* Copyright (c) 2019 Triad National Security, LLC. All rights
* reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "opal_config.h"
#include "opal/runtime/opal.h"
#include <stdio.h>
#include <mpi.h>
#include <unistd.h>
#include <getopt.h>
#include <string.h>
#include <stdlib.h>
#include <errno.h>
#include "hpctimer.h"
#include "mpigclock.h"
typedef enum { Gen, Chk } prog_mode_t;
static char *filename = NULL;
static int alg = 0;
prog_mode_t mode = Gen;
void print_help(char *progname);
int parse_opts(int rank, int argc, char **argv);
void print_help(char *progname)
{
printf("%s: ./%s -o <output file>\n", progname, progname);
}
int parse_opts(int rank, int argc, char **argv)
{
while (1) {
int option_index = 0;
static struct option long_options[] = {
{"output", required_argument, 0, 'o' },
{"alg", required_argument, 0, 'a' },
{"help", required_argument, 0, 'h' },
{ 0, 0, 0, 0 } };
int c = getopt_long(argc, argv, "o:a:h",
long_options, &option_index);
if (c == -1)
break;
switch (c) {
case 'h':
if( rank == 0 )
print_help(argv[0]);
return 1;
case 'o':
filename = strdup(optarg);
if( filename == NULL ){
perror("Cannot allocate memory");
return -1;
}
break;
case 'a':
alg = atoi(optarg);
break;
default:
return -1;
}
}
return 0;
}
int main(int argc, char **argv)
{
MPI_Init(&argc, &argv);
MPI_Comm comm = MPI_COMM_WORLD;
int rank, commsize;
double offs = 0, rtt = 0;
char hname[OPAL_MAXHOSTNAMELEN];
const char *local_hname;
MPI_Comm_rank(comm, &rank);
MPI_Comm_size(comm, &commsize);
int ret = parse_opts(rank, argc, argv);
if( ret < 0 ){
// Error exit
MPI_Finalize();
exit(1);
}else if( ret > 0 ){
// Normal exit after help printout
MPI_Finalize();
exit(0);
}
if( filename == NULL ){
if( rank == 0 ){
print_help(argv[0]);
}
MPI_Finalize();
exit(1);
}
/* All error checking for getting the hostname is done with the initial
populating of opal_process_info.nodename inside opal/runtime/opal_init.c */
local_hname = opal_gethostname();
/* Truncate hostname if it is longer than OPAL_MAXHOSTNAMELEN,
since we are only reading that length with the MPI_Gather.
If full and complete hostnames are necessary in all cases,
this could be implemented with MPI_Gatherv rather than
MPI_Gather, instead of using the longer but more
accurate OPAL_LOCAL_MAXHOSTNAMELEN value, because for very
large task counts there is a risk of running out of memory
if OPAL_LOCAL_MAXHOSTNAMELEN is used. */
strncpy(hname, local_hname, OPAL_MAXHOSTNAMELEN - 1);
hname[OPAL_MAXHOSTNAMELEN - 1] = '\0';
int rc = hpctimer_initialize("gettimeofday");
if( rc == HPCTIMER_FAILURE ){
fprintf(stderr, "Fail to initialize hpc timer. Abort\n");
MPI_Abort(MPI_COMM_WORLD, 1);
}
if (commsize < 2) {
rtt = 0.0;
offs = 0.0;
} else {
if (1 == alg) {
offs = mpigclock_sync_log(comm, 0, &rtt);
} else {
offs = mpigclock_sync_linear(comm, 0, &rtt);
}
}
double send[2] = { rtt, offs };
if( rank == 0 ){
double *measure = malloc(commsize*2*sizeof(double));
if( measure == NULL ){
fprintf(stderr, "Fail to allocate memory. Abort\n");
MPI_Abort(MPI_COMM_WORLD, 1);
}
char *hnames = malloc(OPAL_MAXHOSTNAMELEN * commsize);
if( hnames == NULL ){
fprintf(stderr, "Fail to allocate memory. Abort\n");
MPI_Abort(MPI_COMM_WORLD, 1);
}
MPI_Gather(hname,sizeof(hname),MPI_CHAR,hnames,sizeof(hname),MPI_CHAR, 0, MPI_COMM_WORLD);
MPI_Gather(send,2,MPI_DOUBLE,measure,2, MPI_DOUBLE, 0, MPI_COMM_WORLD);
FILE *fp = fopen(filename,"w");
if( fp == NULL ){
fprintf(stderr, "Fail to open the file %s. Abort\n", filename);
MPI_Abort(MPI_COMM_WORLD, 1);
}
double (*m)[2] = (void*)measure;
char (*h)[OPAL_MAXHOSTNAMELEN] = (void*)hnames;
int i;
fprintf(fp, "# Used algorithm: %s\n", (alg ? "binary tree" : "linear"));
for(i=0; i<commsize;i++){
fprintf(fp, "%s %lf %lf\n", h[i], m[i][0], m[i][1]);
}
fclose(fp);
} else {
MPI_Gather(hname, sizeof(hname), MPI_CHAR, NULL, sizeof(hname), MPI_CHAR, 0, MPI_COMM_WORLD);
MPI_Gather(send,2, MPI_DOUBLE, NULL, 2, MPI_DOUBLE, 0, MPI_COMM_WORLD);
}
MPI_Finalize();
return 0;
}