1
1
openmpi/opal/mca/paffinity/hwloc/paffinity_hwloc_module.c

515 строки
15 KiB
C
Исходник Обычный вид История

Make the hwloc paffinity component available for everyone. hwloc supports a wide variety of operating systems and platforms; see the opal/mca/paffinity/hwloc/hwloc/README file for details. This component includes an embedded copy of hwloc, currently based on hwloc-1.0rc6. But note that hwloc is properly SVN imported into the /vendor branch, so it will be easy to update when 1.0 GA is released. Note that the hwloc tree embedded in opal/mca/paffinity/hwloc/hwloc is identical to a hwloc distribution tarball, except that much of the documentation was rm -rf'ed (because we don't need it for the embedded case). Since the paffinity framework currently does not understand hardware threads, the hwloc component compensates for this by identifying cores by the "first" hardware thread on that core. Hopefully we'll update paffinity someday to understand hardware threads. :-) configure grew a --with-hwloc option, analogous to what we do for many other external libraries that OMPI supports. However, there's a new feature: due to the request of several distros, OMPI can be configured to build with its internal copy of hwloc or with an external copy of hwloc (e.g., a system-installed hwloc). 1. If --with-hwloc is not specified, Open MPI will try to use its internal copy (but silently fail/ignore hwloc if that fails). 2. If --with-hwloc=<dir> is supplied, Open MPI looks for hwloc support in <dir> (and --with-hwloc-libdir=<dir>, if specified). 3. If --with-hwloc=external is supplied, Open MPI will look for hwloc in a compiler/linker default external location. 4. If --with-hwloc=internal is supplied, Open MPI will use its internal copy of hwloc. Some of OMPI's main configury had to be slightly re-arranged in the bootstrapping phase to accommodate hwloc's configury needs. This commit was SVN r23125.
2010-05-13 23:56:05 +00:00
/*
* Copyright (c) 2004-2008 The Trustees of Indiana University and Indiana
* University Research and Technology
* Corporation. All rights reserved.
* Copyright (c) 2004-2005 The University of Tennessee and The University
* of Tennessee Research Foundation. All rights
* reserved.
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2005 The Regents of the University of California.
* All rights reserved.
* Copyright (c) 2006-2010 Cisco Systems, Inc. All rights reserved.
*
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
#include "opal_config.h"
/* This component will only be compiled on Hwloc, where we are
guaranteed to have <unistd.h> and friends */
#include <stdio.h>
#include <unistd.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include "opal/constants.h"
#include "opal/mca/base/mca_base_param.h"
#include "opal/mca/paffinity/paffinity.h"
#include "opal/mca/paffinity/base/base.h"
#include "paffinity_hwloc.h"
#include "opal/mca/paffinity/hwloc/hwloc/include/hwloc.h"
/*
 * Local functions
 *
 * Forward declarations of the module entry points; they are defined
 * later in this file and referenced by the module function table.
 */
/* Module initialization hook */
static int module_init(void);
/* Bind according to the given paffinity CPU mask */
static int module_set(opal_paffinity_base_cpu_set_t cpumask);
/* Retrieve the current binding into the given paffinity CPU mask */
static int module_get(opal_paffinity_base_cpu_set_t *cpumask);
/* PHYSICAL socket:core -> PHYSICAL processor id */
static int module_map_to_processor_id(int socket, int core, int *processor_id);
/* PHYSICAL processor id -> PHYSICAL socket:core */
static int module_map_to_socket_core(int processor_id, int *socket, int *core);
/* Number of LOGICAL processors ("processors" means cores here) */
static int module_get_processor_info(int *num_processors);
/* Number of LOGICAL sockets */
static int module_get_socket_info(int *num_sockets);
/* Number of LOGICAL cores in a PHYSICAL socket */
static int module_get_core_info(int socket, int *num_cores);
/* LOGICAL processor id -> PHYSICAL processor id */
static int module_get_physical_processor_id(int logical_processor_id);
/* LOGICAL socket id -> PHYSICAL socket id */
static int module_get_physical_socket_id(int logical_socket_id);
/* LOGICAL core id on a PHYSICAL socket -> PHYSICAL core id */
static int module_get_physical_core_id(int physical_socket_id, int logical_core_id);
/*
 * Hwloc paffinity module
 *
 * Function table handed back to the paffinity framework by
 * opal_paffinity_hwloc_component_query().  The initializer is
 * positional, so the order of the entries below must match the field
 * order of opal_paffinity_base_module_1_1_0_t.
 */
static const opal_paffinity_base_module_1_1_0_t loc_module = {
/* Initialization function */
module_init,
/* Module function pointers */
module_set,
module_get,
module_map_to_processor_id,
module_map_to_socket_core,
module_get_processor_info,
module_get_socket_info,
module_get_core_info,
module_get_physical_processor_id,
module_get_physical_socket_id,
module_get_physical_core_id,
/* NOTE(review): last slot is intentionally left NULL; presumably an
   optional hook (e.g. finalize) that this module does not need --
   confirm against the struct definition in paffinity.h */
NULL
};
/*
 * Pre-order depth-first search of the subtree rooted at "root" for an
 * object of the given type whose os_index equals "os_index".  The
 * root itself is a candidate.
 *
 * Returns the first matching object encountered, or NULL when the
 * subtree contains no match.
 */
static hwloc_obj_t dfs_find_os_index(hwloc_obj_t root, hwloc_obj_type_t type,
                                     unsigned os_index)
{
    unsigned child;

    /* Test this node before descending into its children */
    if (type == root->type && os_index == root->os_index) {
        return root;
    }

    for (child = 0; child < root->arity; ++child) {
        hwloc_obj_t hit = dfs_find_os_index(root->children[child],
                                            type, os_index);
        if (NULL != hit) {
            return hit;
        }
    }

    return NULL;
}
/*
 * Pre-order depth-first search for the Nth object of the given type
 * in the subtree rooted at "root".
 *
 * "*current" is the running count of objects of that type that have
 * already been visited and skipped; it is shared across the whole
 * recursion and is bumped each time a matching object is passed over.
 * The object visited when *current == n is returned.
 *
 * Returns NULL if the subtree does not contain enough objects of the
 * requested type.
 */
static hwloc_obj_t dfs_find_nth_item(hwloc_obj_t root,
                                     hwloc_obj_type_t type,
                                     unsigned *current,
                                     unsigned n)
{
    unsigned idx;
    hwloc_obj_t found = NULL;

    if (type == root->type) {
        if (n == *current) {
            return root;
        }
        /* Right type, but not the one we want yet */
        *current += 1;
    }

    /* Stop descending as soon as one child subtree yields the target */
    for (idx = 0; NULL == found && idx < root->arity; ++idx) {
        found = dfs_find_nth_item(root->children[idx], type, current, n);
    }

    return found;
}
/*
 * Count the objects of the given type in the subtree rooted at "root"
 * (the root itself included) via a recursive depth-first traversal.
 */
static int dfs_count_type(hwloc_obj_t root, hwloc_obj_type_t type)
{
    int total = (type == root->type) ? 1 : 0;
    unsigned child;

    for (child = 0; child < root->arity; ++child) {
        total += dfs_count_type(root->children[child], type);
    }

    return total;
}
/*
 * Component query function.
 *
 * Stores the value of the "priority" MCA parameter registered under
 * paffinity/hwloc into *priority and hands back this file's module
 * function table through *module.  Always returns OPAL_SUCCESS.
 */
int opal_paffinity_hwloc_component_query(mca_base_module_t **module,
                                         int *priority)
{
    const int index = mca_base_param_find("paffinity", "hwloc", "priority");

    mca_base_param_lookup_int(index, priority);

    /* The framework takes the generic base-module pointer */
    *module = (mca_base_module_t *) &loc_module;

    return OPAL_SUCCESS;
}
/*
 * Module initialization hook.  This module has no setup work of its
 * own, so it unconditionally reports success.
 */
static int module_init(void)
{
    return OPAL_SUCCESS;
}
/*
 * Bind (via hwloc_set_cpubind() with flags 0) to the set of
 * processors selected in the paffinity mask.
 *
 * Only bits below the component's cpuset_max_size are honored.
 *
 * Returns OPAL_SUCCESS on success, OPAL_ERR_OUT_OF_RESOURCE if the
 * temporary hwloc cpuset cannot be allocated, or OPAL_ERR_IN_ERRNO if
 * hwloc fails to apply the binding.
 */
static int module_set(opal_paffinity_base_cpu_set_t mask)
{
    int i, ret = OPAL_SUCCESS;
    hwloc_cpuset_t set;
    hwloc_topology_t *t = &mca_paffinity_hwloc_component.topology;

    set = hwloc_cpuset_alloc();
    if (NULL == set) {
        return OPAL_ERR_OUT_OF_RESOURCE;
    }
    hwloc_cpuset_zero(set);

    /* Walk every bit of the paffinity mask, mirroring module_get().
       NOTE(review): OPAL_PAFFINITY_BITMASK_T_NUM_BITS looks like the
       width of a single bitmask element rather than of the whole
       mask, which would silently ignore higher-numbered processors
       -- confirm against paffinity.h. */
    for (i = 0; ((unsigned int) i) < 8 * sizeof(mask); ++i) {
        if (i < mca_paffinity_hwloc_component.cpuset_max_size &&
            OPAL_PAFFINITY_CPU_ISSET(i, mask)) {
            /* hwloc_cpuset_set() adds one CPU to the set.  Do not use
               hwloc_cpuset_cpu() here: it empties the set before
               adding the CPU, so only the last CPU in the mask would
               survive the loop. */
            hwloc_cpuset_set(set, i);
        }
    }

    if (0 != hwloc_set_cpubind(*t, set, 0)) {
        ret = OPAL_ERR_IN_ERRNO;
    }

    hwloc_cpuset_free(set);
    return ret;
}
/*
 * Query the current binding (via hwloc_get_cpubind() with flags 0)
 * and translate it into a paffinity mask.
 *
 * On success *mask is zeroed and then has one bit set for every
 * processor in the hwloc binding, limited to bits below the
 * component's cpuset_max_size and to the capacity of *mask.  On
 * failure *mask is left untouched.
 *
 * Returns OPAL_SUCCESS, OPAL_ERR_BAD_PARAM if mask is NULL,
 * OPAL_ERR_OUT_OF_RESOURCE if the temporary hwloc cpuset cannot be
 * allocated, or OPAL_ERR_IN_ERRNO if hwloc cannot report the binding.
 */
static int module_get(opal_paffinity_base_cpu_set_t *mask)
{
    int i, ret = OPAL_SUCCESS;
    hwloc_cpuset_t set;
    hwloc_topology_t *t = &mca_paffinity_hwloc_component.topology;

    if (NULL == mask) {
        return OPAL_ERR_BAD_PARAM;
    }

    set = hwloc_cpuset_alloc();
    if (NULL == set) {
        /* Same handling as the other cpuset allocations in this file */
        return OPAL_ERR_OUT_OF_RESOURCE;
    }

    if (0 != hwloc_get_cpubind(*t, set, 0)) {
        ret = OPAL_ERR_IN_ERRNO;
    } else {
        OPAL_PAFFINITY_CPU_ZERO(*mask);
        /* Copy bit-by-bit; 8 * sizeof(*mask) is the total number of
           bits the paffinity mask can hold */
        for (i = 0; ((unsigned int) i) < 8 * sizeof(*mask); i++) {
            if (i < mca_paffinity_hwloc_component.cpuset_max_size &&
                hwloc_cpuset_isset(set, i)) {
                OPAL_PAFFINITY_CPU_SET(i, *mask);
            }
        }
    }

    hwloc_cpuset_free(set);
    return ret;
}
/*
 * Map a PHYSICAL socket:core pair to a PHYSICAL processor id.
 *
 * paffinity currently has no notion of hardware threads, so the
 * answer is the id of the first hardware thread (PU) of the target
 * core that is both online and allowed.
 *
 * Returns OPAL_SUCCESS and fills *processor_id on success;
 * OPAL_ERR_NOT_FOUND if the socket, the core, or a usable PU cannot
 * be found; OPAL_ERR_OUT_OF_RESOURCE if a temporary cpuset cannot be
 * allocated.
 */
static int module_map_to_processor_id(int socket, int core, int *processor_id)
{
    hwloc_topology_t *topo = &mca_paffinity_hwloc_component.topology;
    hwloc_obj_t sock_obj, core_obj;
    hwloc_cpuset_t usable;
    unsigned pu;
    int rc = OPAL_ERR_NOT_FOUND;

    /* Step 1: walk the sockets until one carries the requested
       physical id. */
    sock_obj = hwloc_get_next_obj_by_type(*topo, HWLOC_OBJ_SOCKET, NULL);
    while (NULL != sock_obj && sock_obj->os_index != (unsigned int) socket) {
        sock_obj = hwloc_get_next_obj_by_type(*topo, HWLOC_OBJ_SOCKET,
                                              sock_obj);
    }
    if (NULL == sock_obj) {
        /* No such socket */
        return OPAL_ERR_NOT_FOUND;
    }

    /* Step 2: search the socket's descendants for the core with the
       requested physical id (cores are not assumed to all sit at the
       same level). */
    core_obj = dfs_find_os_index(sock_obj, HWLOC_OBJ_CORE, core);
    if (NULL == core_obj) {
        /* Right socket, but no such core in it */
        return OPAL_ERR_NOT_FOUND;
    }

    /* Step 3: hwloc understands hardware threads, so the core may
       hold several PUs; report the first one that is online and
       allowed. */
    usable = hwloc_cpuset_alloc();
    if (NULL == usable) {
        return OPAL_ERR_OUT_OF_RESOURCE;
    }
    hwloc_cpuset_and(usable, core_obj->online_cpuset,
                     core_obj->allowed_cpuset);

    for (pu = 0;
         (int) pu < mca_paffinity_hwloc_component.cpuset_max_size;
         ++pu) {
        if (hwloc_cpuset_isset(usable, pu)) {
            *processor_id = pu;
            rc = OPAL_SUCCESS;
            break;
        }
    }

    /* Falling out of the loop without a hit should not happen; rc is
       still OPAL_ERR_NOT_FOUND in that case. */
    hwloc_cpuset_free(usable);
    return rc;
}
/*
 * Provides mapping of PHYSICAL processor id -> PHYSICAL socket:core.
 *
 * Scans the cores for one whose online-and-allowed cpuset contains
 * processor_id, then climbs the tree from that core to its enclosing
 * socket.  *core is written as soon as the core is found; *socket is
 * written only if an enclosing socket exists.
 *
 * Returns OPAL_SUCCESS on success, OPAL_ERR_NOT_FOUND if no core
 * contains the processor or the core has no socket ancestor, or
 * OPAL_ERR_OUT_OF_RESOURCE if the scratch cpuset cannot be allocated.
 */
static int module_map_to_socket_core(int processor_id, int *socket, int *core)
{
    int ret = OPAL_ERR_NOT_FOUND;
    hwloc_obj_t obj;
    hwloc_topology_t *t = &mca_paffinity_hwloc_component.topology;
    hwloc_cpuset_t good;

    good = hwloc_cpuset_alloc();
    if (NULL == good) {
        return OPAL_ERR_OUT_OF_RESOURCE;
    }

    /* Iterate through every core and find one that contains the
       processor_id.  Then find the corresponding socket. */
    for (obj = hwloc_get_next_obj_by_type(*t, HWLOC_OBJ_CORE, NULL);
         NULL != obj;
         obj = hwloc_get_next_obj_by_type(*t, HWLOC_OBJ_CORE, obj)) {
        hwloc_cpuset_and(good, obj->online_cpuset,
                         obj->allowed_cpuset);

        /* Does this core contain the processor_id in question? */
        if (!hwloc_cpuset_isset(good, processor_id)) {
            continue;
        }

        *core = obj->os_index;

        /* Go upward from the core object until we find its parent
           socket (or run off the top of the tree). */
        while (NULL != obj && HWLOC_OBJ_SOCKET != obj->type) {
            obj = obj->parent;
        }
        if (NULL != obj) {
            *socket = obj->os_index;
            ret = OPAL_SUCCESS;
        }
        /* Reaching the root without meeting a socket is an error; ret
           is still OPAL_ERR_NOT_FOUND.  Either way the search is
           over. */
        break;
    }

    /* Single exit point so the scratch cpuset is released on every
       path (it used to leak on all returns past the allocation). */
    hwloc_cpuset_free(good);
    return ret;
}
/*
 * Provides number of LOGICAL processors in a host.  Since paffinity
 * does not currently understand hardware threads, we interpret
 * "processors" to mean "cores".
 *
 * Always returns OPAL_SUCCESS; the count is stored in *num_processors.
 */
static int module_get_processor_info(int *num_processors)
{
    hwloc_topology_t *t = &mca_paffinity_hwloc_component.topology;
    int count;

    /* Try the simple hwloc_get_nbobjs_by_type() first.  If we get -1,
       go aggregate ourselves (because it means that there are cores
       at multiple levels in the topology). */
    count = (int) hwloc_get_nbobjs_by_type(*t, HWLOC_OBJ_CORE);
    if (-1 == count) {
        /* hwloc_get_next_obj_by_type() cannot be used for the
           fallback: per the hwloc helper documentation it returns
           NULL when the type lives at multiple depths, which is
           exactly the case being handled here.  Walk the whole tree
           instead. */
        hwloc_obj_t root = hwloc_get_root_obj(*t);
        count = (NULL == root) ? 0 : dfs_count_type(root, HWLOC_OBJ_CORE);
    }

    *num_processors = count;
    return OPAL_SUCCESS;
}
/*
 * Provides the number of LOGICAL sockets in a host.
 *
 * Always returns OPAL_SUCCESS; the count is stored in *num_sockets.
 */
static int module_get_socket_info(int *num_sockets)
{
    hwloc_topology_t *t = &mca_paffinity_hwloc_component.topology;
    int count;

    /* Try the simple hwloc_get_nbobjs_by_type() first.  If we get -1,
       go aggregate ourselves (because it means that there are sockets
       at multiple levels in the topology). */
    count = (int) hwloc_get_nbobjs_by_type(*t, HWLOC_OBJ_SOCKET);
    if (-1 == count) {
        /* Count objects of type SOCKET (the previous fallback tested
           for HWLOC_OBJ_CORE while iterating sockets, so it could
           never count anything).  A full tree walk is used because
           hwloc_get_next_obj_by_type() returns NULL when the type
           lives at multiple depths, per the hwloc helper
           documentation. */
        hwloc_obj_t root = hwloc_get_root_obj(*t);
        count = (NULL == root) ? 0 : dfs_count_type(root, HWLOC_OBJ_SOCKET);
    }

    *num_sockets = count;
    return OPAL_SUCCESS;
}
/*
 * Report how many LOGICAL cores live under the socket with the given
 * PHYSICAL id.
 *
 * Returns OPAL_SUCCESS and fills *num_cores when the socket exists,
 * OPAL_ERR_NOT_FOUND (leaving *num_cores untouched) otherwise.
 */
static int module_get_core_info(int socket, int *num_cores)
{
    hwloc_topology_t *topo = &mca_paffinity_hwloc_component.topology;
    hwloc_obj_t sock_obj;

    sock_obj = hwloc_get_next_obj_by_type(*topo, HWLOC_OBJ_SOCKET, NULL);
    while (NULL != sock_obj) {
        if ((unsigned int) socket == sock_obj->os_index) {
            /* Right socket: count every core among its descendants */
            *num_cores = dfs_count_type(sock_obj, HWLOC_OBJ_CORE);
            return OPAL_SUCCESS;
        }
        sock_obj = hwloc_get_next_obj_by_type(*topo, HWLOC_OBJ_SOCKET,
                                              sock_obj);
    }

    /* Ran out of sockets without seeing the requested physical id */
    return OPAL_ERR_NOT_FOUND;
}
/*
 * Translate a LOGICAL processor id into a PHYSICAL processor id.
 * paffinity does not understand hardware threads, so "processor"
 * means "core" here: the logical id selects a core, and the result is
 * the id of the first PU in that core that is both online and
 * allowed.
 *
 * Returns the physical id on success, OPAL_ERR_NOT_FOUND if there is
 * no such core or it has no usable PU, or OPAL_ERR_OUT_OF_RESOURCE if
 * the scratch cpuset cannot be allocated.
 */
static int module_get_physical_processor_id(int logical_processor_id)
{
    hwloc_topology_t *topo = &mca_paffinity_hwloc_component.topology;
    hwloc_obj_t core_obj;
    hwloc_cpuset_t usable;
    int pu;
    int result = OPAL_ERR_NOT_FOUND;

    core_obj = hwloc_get_obj_by_type(*topo, HWLOC_OBJ_CORE,
                                     logical_processor_id);
    if (NULL == core_obj) {
        return OPAL_ERR_NOT_FOUND;
    }

    /* Have the core; now pick the first available PU inside it */
    usable = hwloc_cpuset_alloc();
    if (NULL == usable) {
        return OPAL_ERR_OUT_OF_RESOURCE;
    }
    hwloc_cpuset_and(usable, core_obj->online_cpuset,
                     core_obj->allowed_cpuset);

    for (pu = 0; pu < mca_paffinity_hwloc_component.cpuset_max_size; ++pu) {
        if (hwloc_cpuset_isset(usable, pu)) {
            result = pu;
            break;
        }
    }

    /* An empty intersection should not happen; result stays
       OPAL_ERR_NOT_FOUND if it does. */
    hwloc_cpuset_free(usable);
    return result;
}
/*
 * Translate a LOGICAL socket id into the corresponding PHYSICAL
 * socket id (the socket object's os_index).
 *
 * Returns OPAL_ERR_NOT_FOUND when hwloc has no socket at that logical
 * index.
 */
static int module_get_physical_socket_id(int logical_socket_id)
{
    hwloc_obj_t sock_obj =
        hwloc_get_obj_by_type(mca_paffinity_hwloc_component.topology,
                              HWLOC_OBJ_SOCKET, logical_socket_id);

    return (NULL == sock_obj) ? OPAL_ERR_NOT_FOUND : (int) sock_obj->os_index;
}
/*
 * Return the PHYSICAL core id that corresponds to the given LOGICAL
 * core id on the given PHYSICAL socket id.
 *
 * The physical core id is the core object's os_index, which is the
 * same notion of "physical core" that module_map_to_processor_id()
 * searches by and module_map_to_socket_core() reports.
 *
 * Returns OPAL_ERR_NOT_FOUND if the topology has no root, the socket
 * does not exist, or the socket has fewer than logical_core_id + 1
 * cores.
 */
static int module_get_physical_core_id(int physical_socket_id,
                                       int logical_core_id)
{
    unsigned count = 0;
    hwloc_obj_t obj;
    hwloc_topology_t *t = &mca_paffinity_hwloc_component.topology;

    obj = hwloc_get_root_obj(*t);
    if (NULL == obj) {
        return OPAL_ERR_NOT_FOUND;
    }

    obj = dfs_find_os_index(obj, HWLOC_OBJ_SOCKET, physical_socket_id);
    if (NULL == obj) {
        return OPAL_ERR_NOT_FOUND;
    }

    /* Note that we can't look at hwloc's logical_index here -- hwloc
       counts logically across *all* cores.  We only want to find the
       Nth logical core under this particular socket. */
    obj = dfs_find_nth_item(obj, HWLOC_OBJ_CORE, &count, logical_core_id);
    if (NULL == obj) {
        return OPAL_ERR_NOT_FOUND;
    }

    /* Found the right core: report the core's own physical id, not
       the id of one of the PUs inside it. */
    return obj->os_index;
}