038dcad8b5
This commit removes the unsupported __sync built-in atomics in favor of the GCC built-ins. The priority order (if not modified by configure flags) is: C11, custom atomics (opal/include/opal/sys/*), then GCC built-ins. Signed-off-by: Nathan Hjelm <hjelmn@google.com>
1362 строки
47 KiB
Plaintext
1362 строки
47 KiB
Plaintext
dnl
|
|
dnl Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
dnl University Research and Technology
|
|
dnl Corporation. All rights reserved.
|
|
dnl Copyright (c) 2004-2018 The University of Tennessee and The University
|
|
dnl of Tennessee Research Foundation. All rights
|
|
dnl reserved.
|
|
dnl Copyright (c) 2004-2006 High Performance Computing Center Stuttgart,
|
|
dnl University of Stuttgart. All rights reserved.
|
|
dnl Copyright (c) 2004-2005 The Regents of the University of California.
|
|
dnl All rights reserved.
|
|
dnl Copyright (c) 2008-2018 Cisco Systems, Inc. All rights reserved.
|
|
dnl Copyright (c) 2010 Oracle and/or its affiliates. All rights reserved.
|
|
dnl Copyright (c) 2015-2018 Research Organization for Information Science
|
|
dnl and Technology (RIST). All rights reserved.
|
|
dnl Copyright (c) 2014-2018 Los Alamos National Security, LLC. All rights
|
|
dnl reserved.
|
|
dnl Copyright (c) 2017 Amazon.com, Inc. or its affiliates. All Rights
|
|
dnl reserved.
|
|
dnl Copyright (c) 2020 Google, LLC. All rights reserved.
|
|
dnl $COPYRIGHT$
|
|
dnl
|
|
dnl Additional copyrights may follow
|
|
dnl
|
|
dnl $HEADER$
|
|
dnl
|
|
|
|
dnl This is a C test to see if 128-bit __atomic_compare_exchange_n()
|
|
dnl actually works (e.g., it compiles and links successfully on
|
|
dnl ARM64+clang, but returns incorrect answers as of August 2018).
|
|
AC_DEFUN([OPAL_ATOMIC_COMPARE_EXCHANGE_N_TEST_SOURCE],[[
|
|
#include <stdint.h>
|
|
#include <stdbool.h>
|
|
#include <stdlib.h>
|
|
|
|
typedef union {
|
|
uint64_t fake@<:@2@:>@;
|
|
__int128 real;
|
|
} ompi128;
|
|
|
|
static void test1(void)
|
|
{
|
|
// As of Aug 2018, we could not figure out a way to assign 128-bit
|
|
// constants -- the compilers would not accept it. So use a fake
|
|
// union to assign 2 uin64_t's to make a single __int128.
|
|
ompi128 ptr = { .fake = { 0xFFEEDDCCBBAA0099, 0x8877665544332211 }};
|
|
ompi128 expected = { .fake = { 0x11EEDDCCBBAA0099, 0x88776655443322FF }};
|
|
ompi128 desired = { .fake = { 0x1122DDCCBBAA0099, 0x887766554433EEFF }};
|
|
bool r = __atomic_compare_exchange_n(&ptr.real, &expected.real,
|
|
desired.real, true,
|
|
__ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
if ( !(r == false && ptr.real == expected.real)) {
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
static void test2(void)
|
|
{
|
|
ompi128 ptr = { .fake = { 0xFFEEDDCCBBAA0099, 0x8877665544332211 }};
|
|
ompi128 expected = ptr;
|
|
ompi128 desired = { .fake = { 0x1122DDCCBBAA0099, 0x887766554433EEFF }};
|
|
bool r = __atomic_compare_exchange_n(&ptr.real, &expected.real,
|
|
desired.real, true,
|
|
__ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
if (!(r == true && ptr.real == desired.real)) {
|
|
exit(2);
|
|
}
|
|
}
|
|
|
|
int main(int argc, char** argv)
|
|
{
|
|
test1();
|
|
test2();
|
|
return 0;
|
|
}
|
|
]])
|
|
|
|
dnl ------------------------------------------------------------------
|
|
|
|
dnl This is a C test to see if 128-bit __sync_bool_compare_and_swap()
|
|
dnl actually works (e.g., it compiles and links successfully on
|
|
dnl ARM64+clang, but returns incorrect answers as of August 2018).
|
|
AC_DEFUN([OPAL_SYNC_BOOL_COMPARE_AND_SWAP_TEST_SOURCE],[[
|
|
#include <stdint.h>
|
|
#include <stdbool.h>
|
|
#include <stdlib.h>
|
|
|
|
typedef union {
|
|
uint64_t fake@<:@2@:>@;
|
|
__int128 real;
|
|
} ompi128;
|
|
|
|
static void test1(void)
|
|
{
|
|
// As of Aug 2018, we could not figure out a way to assign 128-bit
|
|
// constants -- the compilers would not accept it. So use a fake
|
|
// union to assign 2 uin64_t's to make a single __int128.
|
|
ompi128 ptr = { .fake = { 0xFFEEDDCCBBAA0099, 0x8877665544332211 }};
|
|
ompi128 oldval = { .fake = { 0x11EEDDCCBBAA0099, 0x88776655443322FF }};
|
|
ompi128 newval = { .fake = { 0x1122DDCCBBAA0099, 0x887766554433EEFF }};
|
|
bool r = __sync_bool_compare_and_swap(&ptr.real, oldval.real, newval.real);
|
|
if (!(r == false && ptr.real != newval.real)) {
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
static void test2(void)
|
|
{
|
|
ompi128 ptr = { .fake = { 0xFFEEDDCCBBAA0099, 0x8877665544332211 }};
|
|
ompi128 oldval = ptr;
|
|
ompi128 newval = { .fake = { 0x1122DDCCBBAA0099, 0x887766554433EEFF }};
|
|
bool r = __sync_bool_compare_and_swap(&ptr.real, oldval.real, newval.real);
|
|
if (!(r == true && ptr.real == newval.real)) {
|
|
exit(2);
|
|
}
|
|
}
|
|
|
|
int main(int argc, char** argv)
|
|
{
|
|
test1();
|
|
test2();
|
|
return 0;
|
|
}
|
|
]])
|
|
|
|
dnl This is a C test to see if 128-bit __atomic_compare_exchange_n()
|
|
dnl actually works (e.g., it compiles and links successfully on
|
|
dnl ARM64+clang, but returns incorrect answers as of August 2018).
|
|
AC_DEFUN([OPAL_ATOMIC_COMPARE_EXCHANGE_STRONG_TEST_SOURCE],[[
|
|
#include <stdint.h>
|
|
#include <stdbool.h>
|
|
#include <stdlib.h>
|
|
#include <stdatomic.h>
|
|
|
|
typedef union {
|
|
uint64_t fake@<:@2@:>@;
|
|
_Atomic __int128 real;
|
|
} ompi128;
|
|
|
|
static void test1(void)
|
|
{
|
|
// As of Aug 2018, we could not figure out a way to assign 128-bit
|
|
// constants -- the compilers would not accept it. So use a fake
|
|
// union to assign 2 uin64_t's to make a single __int128.
|
|
ompi128 ptr = { .fake = { 0xFFEEDDCCBBAA0099, 0x8877665544332211 }};
|
|
ompi128 expected = { .fake = { 0x11EEDDCCBBAA0099, 0x88776655443322FF }};
|
|
ompi128 desired = { .fake = { 0x1122DDCCBBAA0099, 0x887766554433EEFF }};
|
|
bool r = atomic_compare_exchange_strong (&ptr.real, &expected.real,
|
|
desired.real, true,
|
|
atomic_relaxed, atomic_relaxed);
|
|
if ( !(r == false && ptr.real == expected.real)) {
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
static void test2(void)
|
|
{
|
|
ompi128 ptr = { .fake = { 0xFFEEDDCCBBAA0099, 0x8877665544332211 }};
|
|
ompi128 expected = ptr;
|
|
ompi128 desired = { .fake = { 0x1122DDCCBBAA0099, 0x887766554433EEFF }};
|
|
bool r = atomic_compare_exchange_strong (&ptr.real, &expected.real,
|
|
desired.real, true,
|
|
atomic_relaxed, atomic_relaxed);
|
|
if (!(r == true && ptr.real == desired.real)) {
|
|
exit(2);
|
|
}
|
|
}
|
|
|
|
int main(int argc, char** argv)
|
|
{
|
|
test1();
|
|
test2();
|
|
return 0;
|
|
}
|
|
]])
|
|
|
|
dnl ------------------------------------------------------------------
|
|
|
|
dnl
|
|
dnl Check to see if a specific function is linkable.
|
|
dnl
|
|
dnl Check with:
|
|
dnl 1. No compiler/linker flags.
|
|
dnl 2. CFLAGS += -mcx16
|
|
dnl 3. LIBS += -latomic
|
|
dnl 4. Finally, if it links ok with any of #1, #2, or #3, actually try
|
|
dnl to run the test code (if we're not cross-compiling) and verify
|
|
dnl that it actually gives us the correct result.
|
|
dnl
|
|
dnl Note that we unfortunately can't use AC SEARCH_LIBS because its
|
|
dnl check incorrectly fails (because these functions are special compiler
|
|
dnl intrinsics -- SEARCH_LIBS tries with "check FUNC()", which the
|
|
dnl compiler complains doesn't match the internal prototype). So we have
|
|
dnl to use our own LINK_IFELSE tests. Indeed, since these functions are
|
|
dnl so special, we actually need a valid source code that calls the
|
|
dnl functions with correct arguments, etc. It's not enough, for example,
|
|
dnl to do the usual "try to set a function pointer to the symbol" trick to
|
|
dnl determine if these functions are available, because the compiler may
|
|
dnl not implement these as actual symbols. So just try to link a real
|
|
dnl test code.
|
|
dnl
|
|
dnl $1: function name to print
|
|
dnl $2: program to test
|
|
dnl $3: action if any of 1, 2, or 3 succeeds
|
|
dnl #4: action if all of 1, 2, and 3 fail
|
|
dnl
|
|
AC_DEFUN([OPAL_ASM_CHECK_ATOMIC_FUNC],[
|
|
OPAL_VAR_SCOPE_PUSH([opal_asm_check_func_happy opal_asm_check_func_CFLAGS_save opal_asm_check_func_LIBS_save])
|
|
|
|
opal_asm_check_func_CFLAGS_save=$CFLAGS
|
|
opal_asm_check_func_LIBS_save=$LIBS
|
|
|
|
dnl Check with no compiler/linker flags
|
|
AC_MSG_CHECKING([for $1])
|
|
AC_LINK_IFELSE([$2],
|
|
[opal_asm_check_func_happy=1
|
|
AC_MSG_RESULT([yes])],
|
|
[opal_asm_check_func_happy=0
|
|
AC_MSG_RESULT([no])])
|
|
|
|
dnl If that didn't work, try again with CFLAGS+=mcx16
|
|
AS_IF([test $opal_asm_check_func_happy -eq 0],
|
|
[AC_MSG_CHECKING([for $1 with -mcx16])
|
|
CFLAGS="$CFLAGS -mcx16"
|
|
AC_LINK_IFELSE([$2],
|
|
[opal_asm_check_func_happy=1
|
|
AC_MSG_RESULT([yes])],
|
|
[opal_asm_check_func_happy=0
|
|
CFLAGS=$opal_asm_check_func_CFLAGS_save
|
|
AC_MSG_RESULT([no])])
|
|
])
|
|
|
|
dnl If that didn't work, try again with LIBS+=-latomic
|
|
AS_IF([test $opal_asm_check_func_happy -eq 0],
|
|
[AC_MSG_CHECKING([for $1 with -latomic])
|
|
LIBS="$LIBS -latomic"
|
|
AC_LINK_IFELSE([$2],
|
|
[opal_asm_check_func_happy=1
|
|
AC_MSG_RESULT([yes])],
|
|
[opal_asm_check_func_happy=0
|
|
LIBS=$opal_asm_check_func_LIBS_save
|
|
AC_MSG_RESULT([no])])
|
|
])
|
|
|
|
dnl If we have it, try it and make sure it gives a correct result.
|
|
dnl As of Aug 2018, we know that it links but does *not* work on clang
|
|
dnl 6 on ARM64.
|
|
AS_IF([test $opal_asm_check_func_happy -eq 1],
|
|
[AC_MSG_CHECKING([if $1() gives correct results])
|
|
AC_RUN_IFELSE([$2],
|
|
[AC_MSG_RESULT([yes])],
|
|
[opal_asm_check_func_happy=0
|
|
AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([cannot test -- assume yes (cross compiling)])])
|
|
])
|
|
|
|
dnl If we were unsuccessful, restore CFLAGS/LIBS
|
|
AS_IF([test $opal_asm_check_func_happy -eq 0],
|
|
[CFLAGS=$opal_asm_check_func_CFLAGS_save
|
|
LIBS=$opal_asm_check_func_LIBS_save])
|
|
|
|
dnl Run the user actions
|
|
AS_IF([test $opal_asm_check_func_happy -eq 1], [$3], [$4])
|
|
|
|
OPAL_VAR_SCOPE_POP
|
|
])
|
|
|
|
dnl ------------------------------------------------------------------
|
|
|
|
AC_DEFUN([OPAL_CHECK_SYNC_BUILTIN_CSWAP_INT128], [
|
|
OPAL_VAR_SCOPE_PUSH([sync_bool_compare_and_swap_128_result])
|
|
|
|
# Do we have __sync_bool_compare_and_swap?
|
|
# Use a special macro because we need to check with a few different
|
|
# CFLAGS/LIBS.
|
|
OPAL_ASM_CHECK_ATOMIC_FUNC([__sync_bool_compare_and_swap],
|
|
[AC_LANG_SOURCE(OPAL_SYNC_BOOL_COMPARE_AND_SWAP_TEST_SOURCE)],
|
|
[sync_bool_compare_and_swap_128_result=1],
|
|
[sync_bool_compare_and_swap_128_result=0])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_SYNC_BUILTIN_CSWAP_INT128],
|
|
[$sync_bool_compare_and_swap_128_result],
|
|
[Whether the __sync builtin atomic compare and swap supports 128-bit values])
|
|
|
|
OPAL_VAR_SCOPE_POP
|
|
])
|
|
|
|
AC_DEFUN([OPAL_CHECK_GCC_BUILTIN_CSWAP_INT128], [
|
|
OPAL_VAR_SCOPE_PUSH([atomic_compare_exchange_n_128_result atomic_compare_exchange_n_128_CFLAGS_save atomic_compare_exchange_n_128_LIBS_save])
|
|
|
|
atomic_compare_exchange_n_128_CFLAGS_save=$CFLAGS
|
|
atomic_compare_exchange_n_128_LIBS_save=$LIBS
|
|
|
|
# Do we have __sync_bool_compare_and_swap?
|
|
# Use a special macro because we need to check with a few different
|
|
# CFLAGS/LIBS.
|
|
OPAL_ASM_CHECK_ATOMIC_FUNC([__atomic_compare_exchange_n],
|
|
[AC_LANG_SOURCE(OPAL_ATOMIC_COMPARE_EXCHANGE_N_TEST_SOURCE)],
|
|
[atomic_compare_exchange_n_128_result=1],
|
|
[atomic_compare_exchange_n_128_result=0])
|
|
|
|
# If we have it and it works, check to make sure it is always lock
|
|
# free.
|
|
AS_IF([test $atomic_compare_exchange_n_128_result -eq 1],
|
|
[AC_MSG_CHECKING([if __int128 atomic compare-and-swap is always lock-free])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [if (!__atomic_always_lock_free(16, 0)) { return 1; }])],
|
|
[AC_MSG_RESULT([yes])],
|
|
[atomic_compare_exchange_n_128_result=0
|
|
# If this test fails, need to reset CFLAGS/LIBS (the
|
|
# above tests atomically set CFLAGS/LIBS or not; this
|
|
# test is running after the fact, so we have to undo
|
|
# the side-effects of setting CFLAGS/LIBS if the above
|
|
# tests passed).
|
|
CFLAGS=$atomic_compare_exchange_n_128_CFLAGS_save
|
|
LIBS=$atomic_compare_exchange_n_128_LIBS_save
|
|
AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([cannot test -- assume yes (cross compiling)])])
|
|
])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_GCC_BUILTIN_CSWAP_INT128],
|
|
[$atomic_compare_exchange_n_128_result],
|
|
[Whether the __atomic builtin atomic compare swap is both supported and lock-free on 128-bit values])
|
|
|
|
dnl If we could not find decent support for 128-bits __atomic let's
|
|
dnl try the GCC _sync
|
|
AS_IF([test $atomic_compare_exchange_n_128_result -eq 0],
|
|
[OPAL_CHECK_SYNC_BUILTIN_CSWAP_INT128])
|
|
|
|
OPAL_VAR_SCOPE_POP
|
|
])
|
|
|
|
AC_DEFUN([OPAL_CHECK_GCC_ATOMIC_BUILTINS], [
|
|
if test -z "$opal_cv_have___atomic" ; then
|
|
AC_MSG_CHECKING([for 32-bit GCC built-in atomics])
|
|
|
|
AC_TRY_LINK([
|
|
#include <stdint.h>
|
|
uint32_t tmp, old = 0;
|
|
uint64_t tmp64, old64 = 0;], [
|
|
__atomic_thread_fence(__ATOMIC_SEQ_CST);
|
|
__atomic_compare_exchange_n(&tmp, &old, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
__atomic_add_fetch(&tmp, 1, __ATOMIC_RELAXED);
|
|
__atomic_compare_exchange_n(&tmp64, &old64, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
__atomic_add_fetch(&tmp64, 1, __ATOMIC_RELAXED);],
|
|
[opal_cv_have___atomic=yes],
|
|
[opal_cv_have___atomic=no])
|
|
|
|
AC_MSG_RESULT([$opal_cv_have___atomic])
|
|
|
|
if test $opal_cv_have___atomic = "yes" ; then
|
|
AC_MSG_CHECKING([for 64-bit GCC built-in atomics])
|
|
|
|
AC_TRY_LINK([
|
|
#include <stdint.h>
|
|
uint64_t tmp64, old64 = 0;], [
|
|
__atomic_compare_exchange_n(&tmp64, &old64, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
__atomic_add_fetch(&tmp64, 1, __ATOMIC_RELAXED);],
|
|
[opal_cv_have___atomic_64=yes],
|
|
[opal_cv_have___atomic_64=no])
|
|
|
|
AC_MSG_RESULT([$opal_cv_have___atomic_64])
|
|
|
|
if test $opal_cv_have___atomic_64 = "yes" ; then
|
|
AC_MSG_CHECKING([if 64-bit GCC built-in atomics are lock-free])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [if (!__atomic_is_lock_free (8, 0)) { return 1; }])],
|
|
[AC_MSG_RESULT([yes])],
|
|
[AC_MSG_RESULT([no])
|
|
opal_cv_have___atomic_64=no],
|
|
[AC_MSG_RESULT([cannot test -- assume yes (cross compiling)])])
|
|
fi
|
|
else
|
|
opal_cv_have___atomic_64=no
|
|
fi
|
|
|
|
# Check for 128-bit support
|
|
OPAL_CHECK_GCC_BUILTIN_CSWAP_INT128
|
|
fi
|
|
])
|
|
|
|
AC_DEFUN([OPAL_CHECK_C11_CSWAP_INT128], [
|
|
OPAL_VAR_SCOPE_PUSH([atomic_compare_exchange_result atomic_compare_exchange_CFLAGS_save atomic_compare_exchange_LIBS_save])
|
|
|
|
atomic_compare_exchange_CFLAGS_save=$CFLAGS
|
|
atomic_compare_exchange_LIBS_save=$LIBS
|
|
|
|
# Do we have C11 atomics on 128-bit integers?
|
|
# Use a special macro because we need to check with a few different
|
|
# CFLAGS/LIBS.
|
|
OPAL_ASM_CHECK_ATOMIC_FUNC([atomic_compare_exchange_strong_16],
|
|
[AC_LANG_SOURCE(OPAL_ATOMIC_COMPARE_EXCHANGE_STRONG_TEST_SOURCE)],
|
|
[atomic_compare_exchange_result=1],
|
|
[atomic_compare_exchange_result=0])
|
|
|
|
# If we have it and it works, check to make sure it is always lock
|
|
# free.
|
|
AS_IF([test $atomic_compare_exchange_result -eq 1],
|
|
[AC_MSG_CHECKING([if C11 __int128 atomic compare-and-swap is always lock-free])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([#include <stdatomic.h>], [_Atomic __int128_t x; if (!atomic_is_lock_free(&x)) { return 1; }])],
|
|
[AC_MSG_RESULT([yes])],
|
|
[atomic_compare_exchange_result=0
|
|
# If this test fails, need to reset CFLAGS/LIBS (the
|
|
# above tests atomically set CFLAGS/LIBS or not; this
|
|
# test is running after the fact, so we have to undo
|
|
# the side-effects of setting CFLAGS/LIBS if the above
|
|
# tests passed).
|
|
CFLAGS=$atomic_compare_exchange_CFLAGS_save
|
|
LIBS=$atomic_compare_exchange_LIBS_save
|
|
AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([cannot test -- assume yes (cross compiling)])])
|
|
])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_C11_CSWAP_INT128],
|
|
[$atomic_compare_exchange_result],
|
|
[Whether C11 atomic compare swap is both supported and lock-free on 128-bit values])
|
|
|
|
dnl If we could not find decent support for 128-bits atomic let's
|
|
dnl try the GCC _sync
|
|
AS_IF([test $atomic_compare_exchange_result -eq 0],
|
|
[OPAL_CHECK_SYNC_BUILTIN_CSWAP_INT128])
|
|
|
|
OPAL_VAR_SCOPE_POP
|
|
])
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_TEXT
|
|
dnl
|
|
dnl Determine how to set current mode as text.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_TEXT],[
|
|
AC_MSG_CHECKING([directive for setting text section])
|
|
opal_cv_asm_text=""
|
|
if test "$opal_cv_c_compiler_vendor" = "microsoft" ; then
|
|
# text section will be brought in with the rest of
|
|
# header for MS - leave blank for now
|
|
opal_cv_asm_text=""
|
|
else
|
|
case $host in
|
|
*-aix*)
|
|
opal_cv_asm_text=[".csect .text[PR]"]
|
|
;;
|
|
*)
|
|
opal_cv_asm_text=".text"
|
|
;;
|
|
esac
|
|
fi
|
|
AC_MSG_RESULT([$opal_cv_asm_text])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_TEXT], ["$opal_cv_asm_text"],
|
|
[Assembly directive for setting text section])
|
|
OPAL_ASM_TEXT="$opal_cv_asm_text"
|
|
AC_SUBST(OPAL_ASM_TEXT)
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_GLOBAL
|
|
dnl
|
|
dnl Sets OPAL_ASM_GLOBAL to the value to prefix global values
|
|
dnl
|
|
dnl I'm sure if I don't have a test for this, there will be some
|
|
dnl dumb platform that uses something else
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_GLOBAL],[
|
|
AC_MSG_CHECKING([directive for exporting symbols])
|
|
opal_cv_asm_global=""
|
|
if test "$opal_cv_c_compiler_vendor" = "microsoft" ; then
|
|
opal_cv_asm_global="PUBLIC"
|
|
else
|
|
case $host in
|
|
*)
|
|
opal_cv_asm_global=".globl"
|
|
;;
|
|
esac
|
|
fi
|
|
AC_MSG_RESULT([$opal_cv_asm_global])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_GLOBAL], ["$opal_cv_asm_global"],
|
|
[Assembly directive for exporting symbols])
|
|
OPAL_ASM_GLOBAL="$opal_cv_asm_global"
|
|
AC_SUBST(OPAL_AS_GLOBAL)
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_LSYM
|
|
dnl
|
|
dnl Sets OPAL_ASM_LSYM to the prefix value on a symbol to make it
|
|
dnl an internal label (jump target and whatnot)
|
|
dnl
|
|
dnl We look for L .L $ L$ (in that order) for something that both
|
|
dnl assembles and does not leave a label in the output of nm. Fall
|
|
dnl back to L if nothing else seems to work :/
|
|
dnl
|
|
dnl #################################################################
|
|
|
|
# _OPAL_CHECK_ASM_LSYM([variable-to-set])
|
|
# ---------------------------------------
|
|
AC_DEFUN([_OPAL_CHECK_ASM_LSYM],[
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
|
|
$1="L"
|
|
|
|
for sym in L .L $ L$ ; do
|
|
asm_result=0
|
|
echo "configure: trying $sym" >&AC_FD_CC
|
|
OPAL_TRY_ASSEMBLE([foobar$opal_cv_asm_label_suffix
|
|
${sym}mytestlabel$opal_cv_asm_label_suffix],
|
|
[# ok, we succeeded at assembling. see if we can nm,
|
|
# throwing the results in a file
|
|
if $NM conftest.$OBJEXT > conftest.out 2>&AC_FD_CC ; then
|
|
if test "`$GREP mytestlabel conftest.out`" = "" ; then
|
|
# there was no symbol... looks promising to me
|
|
$1="$sym"
|
|
asm_result=1
|
|
elif test ["`$GREP ' [Nt] .*mytestlabel' conftest.out`"] = "" ; then
|
|
# see if we have a non-global-ish symbol
|
|
# but we should see if we can do better.
|
|
$1="$sym"
|
|
fi
|
|
else
|
|
# not so much on the NM goodness :/
|
|
echo "$NM failed. Output from NM was:" >&AC_FD_CC
|
|
cat conftest.out >&AC_FD_CC
|
|
AC_MSG_WARN([$NM could not read object file])
|
|
fi
|
|
])
|
|
if test "$asm_result" = "1" ; then
|
|
break
|
|
fi
|
|
done
|
|
rm -f conftest.out
|
|
unset asm_result sym
|
|
])
|
|
|
|
# OPAL_CHECK_ASM_LSYM()
|
|
# ---------------------
|
|
AC_DEFUN([OPAL_CHECK_ASM_LSYM],[
|
|
AC_REQUIRE([AC_PROG_NM])
|
|
|
|
AC_CACHE_CHECK([prefix for lsym labels],
|
|
[opal_cv_asm_lsym],
|
|
[_OPAL_CHECK_ASM_LSYM([opal_cv_asm_lsym])])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_LSYM], ["$opal_cv_asm_lsym"],
|
|
[Assembly prefix for lsym labels])
|
|
OPAL_ASM_LSYM="$opal_cv_asm_lsym"
|
|
AC_SUBST(OPAL_ASM_LSYM)
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_PROC
|
|
dnl
|
|
dnl Sets a cv-flag, if the compiler needs a proc/endp-definition to
|
|
dnl link with C.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_PROC],[
|
|
AC_CACHE_CHECK([if .proc/endp is needed],
|
|
[opal_cv_asm_need_proc],
|
|
[opal_cv_asm_need_proc="no"
|
|
OPAL_TRY_ASSEMBLE([
|
|
.proc mysym
|
|
mysym:
|
|
.endp mysym],
|
|
[opal_cv_asm_need_proc="yes"])
|
|
rm -f conftest.out])
|
|
|
|
if test "$opal_cv_asm_need_proc" = "yes" ; then
|
|
opal_cv_asm_proc=".proc"
|
|
opal_cv_asm_endproc=".endp"
|
|
else
|
|
opal_cv_asm_proc="#"
|
|
opal_cv_asm_endproc="#"
|
|
fi
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_GSYM
|
|
dnl
|
|
dnl Sets OPAL_ASM_GSYM to the prefix value on a symbol to make it
|
|
dnl a global linkable from C. Basically, an _ or not.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_GSYM],[
|
|
AC_CACHE_CHECK([prefix for global symbol labels],
|
|
[opal_cv_asm_gsym],
|
|
[_OPAL_CHECK_ASM_GSYM])
|
|
|
|
if test "$opal_cv_asm_gsym" = "none" ; then
|
|
AC_MSG_ERROR([Could not determine global symbol label prefix])
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_GSYM], ["$opal_cv_asm_gsym"],
|
|
[Assembly prefix for gsym labels])
|
|
OPAL_ASM_GSYM="$opal_cv_asm_gsym"
|
|
AC_SUBST(OPAL_ASM_GSYM)
|
|
|
|
])
|
|
|
|
AC_DEFUN([_OPAL_CHECK_ASM_GSYM],[
|
|
opal_cv_asm_gsym="none"
|
|
|
|
for sym in "_" "" "." ; do
|
|
asm_result=0
|
|
echo "configure: trying $sym" >&AC_FD_CC
|
|
cat > conftest_c.c <<EOF
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
void gsym_test_func(void);
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
int
|
|
main()
|
|
{
|
|
gsym_test_func();
|
|
return 0;
|
|
}
|
|
EOF
|
|
OPAL_TRY_ASSEMBLE([
|
|
$opal_cv_asm_text
|
|
$opal_cv_asm_proc ${sym}gsym_test_func
|
|
$opal_cv_asm_global ${sym}gsym_test_func
|
|
${sym}gsym_test_func${opal_cv_asm_label_suffix}
|
|
$opal_cv_asm_endproc ${sym}gsym_test_func
|
|
],
|
|
[opal_compile="$CC $CFLAGS -I. conftest_c.c -c > conftest.cmpl 2>&1"
|
|
if AC_TRY_EVAL(opal_compile) ; then
|
|
# save the warnings
|
|
cat conftest.cmpl >&AC_FD_CC
|
|
opal_link="$CC $CFLAGS conftest_c.$OBJEXT conftest.$OBJEXT -o conftest $LDFLAGS $LIBS > conftest.link 2>&1"
|
|
if AC_TRY_EVAL(opal_link) ; then
|
|
# save the warnings
|
|
cat conftest.link >&AC_FD_CC
|
|
asm_result=1
|
|
else
|
|
cat conftest.link >&AC_FD_CC
|
|
echo "configure: failed C program was: " >&AC_FD_CC
|
|
cat conftest_c.c >&AC_FD_CC
|
|
echo "configure: failed ASM program was: " >&AC_FD_CC
|
|
cat conftest.s >&AC_FD_CC
|
|
asm_result=0
|
|
fi
|
|
else
|
|
# save output and failed program
|
|
cat conftest.cmpl >&AC_FD_CC
|
|
echo "configure: failed C program was: " >&AC_FD_CC
|
|
cat conftest.c >&AC_FD_CC
|
|
asm_result=0
|
|
fi],
|
|
[asm_result=0])
|
|
if test "$asm_result" = "1" ; then
|
|
opal_cv_asm_gsym="$sym"
|
|
break
|
|
fi
|
|
done
|
|
rm -rf conftest.*
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_LABEL_SUFFIX
|
|
dnl
|
|
dnl Sets OPAL_ASM_LABEL_SUFFIX to the value to suffix for labels
|
|
dnl
|
|
dnl I'm sure if I don't have a test for this, there will be some
|
|
dnl dumb platform that uses something else
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_LABEL_SUFFIX],[
|
|
AC_MSG_CHECKING([suffix for labels])
|
|
opal_cv_asm_label_suffix=""
|
|
case $host in
|
|
*)
|
|
opal_cv_asm_label_suffix=":"
|
|
;;
|
|
esac
|
|
AC_MSG_RESULT([$opal_cv_asm_label_suffix])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_LABEL_SUFFIX], ["$opal_cv_asm_label_suffix"],
|
|
[Assembly suffix for labels])
|
|
OPAL_ASM_LABEL_SUFFIX="$opal_cv_asm_label_suffix"
|
|
AC_SUBST(OPAL_AS_LABEL_SUFFIX)
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_ALIGN_LOG
|
|
dnl
|
|
dnl Sets OPAL_ASM_ALIGN_LOG to 1 if align is specified
|
|
dnl logarithmically, 0 otherwise
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_ALIGN_LOG],[
|
|
AC_REQUIRE([AC_PROG_NM])
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
|
|
AC_CACHE_CHECK([if .align directive takes logarithmic value],
|
|
[opal_cv_asm_align_log],
|
|
[ OPAL_TRY_ASSEMBLE([ $opal_cv_asm_text
|
|
.align 4
|
|
$opal_cv_asm_global foo
|
|
.byte 1
|
|
.align 4
|
|
foo$opal_cv_asm_label_suffix
|
|
.byte 2],
|
|
[opal_asm_addr=[`$NM conftest.$OBJEXT | $GREP foo | sed -e 's/.*\([0-9a-fA-F][0-9a-fA-F]\).*foo.*/\1/'`]],
|
|
[opal_asm_addr=""])
|
|
# test for both 16 and 10 (decimal and hex notations)
|
|
echo "configure: .align test address offset is $opal_asm_addr" >&AC_FD_CC
|
|
if test "$opal_asm_addr" = "16" || test "$opal_asm_addr" = "10" ; then
|
|
opal_cv_asm_align_log="yes"
|
|
else
|
|
opal_cv_asm_align_log="no"
|
|
fi])
|
|
|
|
if test "$opal_cv_asm_align_log" = "yes" || test "$opal_cv_asm_align_log" = "1" ; then
|
|
opal_asm_align_log_result=1
|
|
else
|
|
opal_asm_align_log_result=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ALIGN_LOG],
|
|
[$asm_align_log_result],
|
|
[Assembly align directive expects logarithmic value])
|
|
|
|
unset omp_asm_addr asm_result
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_TYPE
|
|
dnl
|
|
dnl Sets OPAL_ASM_TYPE to the prefix for the function type to
|
|
dnl set a symbol's type as function (needed on ELF for shared
|
|
dnl libraries). If no .type directive is needed, sets OPAL_ASM_TYPE
|
|
dnl to an empty string
|
|
dnl
|
|
dnl We look for @ \# %
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_TYPE],[
|
|
AC_CACHE_CHECK([prefix for function in .type],
|
|
[opal_cv_asm_type],
|
|
[_OPAL_CHECK_ASM_TYPE])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_TYPE], ["$opal_cv_asm_type"],
|
|
[How to set function type in .type directive])
|
|
OPAL_ASM_TYPE="$opal_cv_asm_type"
|
|
AC_SUBST(OPAL_ASM_TYPE)
|
|
])
|
|
|
|
AC_DEFUN([_OPAL_CHECK_ASM_TYPE],[
|
|
opal_cv_asm_type=""
|
|
|
|
case "${host}" in
|
|
*-sun-solaris*)
|
|
# GCC on solaris seems to accept just about anything, not
|
|
# that what it defines actually works... So just hardwire
|
|
# to the right answer
|
|
opal_cv_asm_type="#"
|
|
;;
|
|
*)
|
|
for type in @ \# % ; do
|
|
asm_result=0
|
|
echo "configure: trying $type" >&AC_FD_CC
|
|
OPAL_TRY_ASSEMBLE([ .type mysym, ${type}function
|
|
mysym:],
|
|
[opal_cv_asm_type="${type}"
|
|
asm_result=1])
|
|
if test "$asm_result" = "1" ; then
|
|
break
|
|
fi
|
|
done
|
|
;;
|
|
esac
|
|
rm -f conftest.out
|
|
|
|
unset asm_result type
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_SIZE
|
|
dnl
|
|
dnl Sets OPAL_ASM_SIZE to 1 if we should set .size directives for
|
|
dnl each function, 0 otherwise.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_SIZE],[
|
|
AC_CACHE_CHECK([if .size is needed],
|
|
[opal_cv_asm_need_size],
|
|
[opal_cv_asm_need_size="no"
|
|
OPAL_TRY_ASSEMBLE([ .size mysym, 1],
|
|
[opal_cv_asm_need_size="yes"])
|
|
rm -f conftest.out])
|
|
|
|
if test "$opal_cv_asm_need_size" = "yes" ; then
|
|
opal_asm_size=1
|
|
else
|
|
opal_asm_size=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_SIZE], ["$opal_asm_size"],
|
|
[Do we need to give a .size directive])
|
|
OPAL_ASM_SIZE="$opal_asm_size"
|
|
AC_SUBST(OPAL_ASM_TYPE)
|
|
unset asm_result
|
|
])dnl
|
|
|
|
|
|
# OPAL_CHECK_ASM_GNU_STACKEXEC(var)
|
|
# ----------------------------------
|
|
# sets shell variable var to the things necessary to
|
|
# disable execable stacks with GAS
|
|
AC_DEFUN([OPAL_CHECK_ASM_GNU_STACKEXEC], [
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
|
|
AC_CHECK_PROG([OBJDUMP], [objdump], [objdump])
|
|
AC_CACHE_CHECK([if .note.GNU-stack is needed],
|
|
[opal_cv_asm_gnu_stack_result],
|
|
[AS_IF([test "$OBJDUMP" != ""],
|
|
[ # first, see if a simple C program has it set
|
|
cat >conftest.c <<EOF
|
|
int testfunc() {return 0; }
|
|
EOF
|
|
OPAL_LOG_COMMAND([$CC $CFLAGS -c conftest.c -o conftest.$OBJEXT],
|
|
[$OBJDUMP -x conftest.$OBJEXT | $GREP '\.note\.GNU-stack' > /dev/null && opal_cv_asm_gnu_stack_result=yes],
|
|
[OPAL_LOG_MSG([the failed program was:], 1)
|
|
OPAL_LOG_FILE([conftest.c])
|
|
opal_cv_asm_gnu_stack_result=no])
|
|
if test "$opal_cv_asm_gnu_stack_result" != "yes" ; then
|
|
opal_cv_asm_gnu_stack_result="no"
|
|
fi
|
|
rm -rf conftest.*],
|
|
[opal_cv_asm_gnu_stack_result="no"])])
|
|
if test "$opal_cv_asm_gnu_stack_result" = "yes" ; then
|
|
opal_cv_asm_gnu_stack=1
|
|
else
|
|
opal_cv_asm_gnu_stack=0
|
|
fi
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_POWERPC_REG
|
|
dnl
|
|
dnl See if the notation for specifying registers is X (most everyone)
|
|
dnl or rX (OS X)
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_POWERPC_REG],[
|
|
AC_MSG_CHECKING([if PowerPC registers have r prefix])
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
addi 1,1,0],
|
|
[opal_cv_asm_powerpc_r_reg=0],
|
|
[OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
addi r1,r1,0],
|
|
[opal_cv_asm_powerpc_r_reg=1],
|
|
[AC_MSG_ERROR([Can not determine how to use PPC registers])])])
|
|
if test "$opal_cv_asm_powerpc_r_reg" = "1" ; then
|
|
AC_MSG_RESULT([yes])
|
|
else
|
|
AC_MSG_RESULT([no])
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_POWERPC_R_REGISTERS],
|
|
[$opal_cv_asm_powerpc_r_reg],
|
|
[Whether r notation is used for ppc registers])
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_POWERPC_64BIT
|
|
dnl
|
|
dnl On some powerpc chips (the PPC970 or G5), the OS usually runs in
|
|
dnl 32 bit mode, even though the hardware can do 64bit things. If
|
|
dnl the compiler will let us, emit code for 64bit test and set type
|
|
dnl operations (on a long long).
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_POWERPC_64BIT],[
|
|
if test "$ac_cv_sizeof_long" != "4" ; then
|
|
# this function should only be called in the 32 bit case
|
|
AC_MSG_ERROR([CHECK_POWERPC_64BIT called on 64 bit platform. Internal error.])
|
|
fi
|
|
AC_MSG_CHECKING([for 64-bit PowerPC assembly support])
|
|
case $host in
|
|
*-darwin*)
|
|
ppc64_result=0
|
|
if test "$opal_cv_asm_powerpc_r_reg" = "1" ; then
|
|
ldarx_asm=" ldarx r1,r1,r1";
|
|
else
|
|
ldarx_asm=" ldarx 1,1,1";
|
|
fi
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
$ldarx_asm],
|
|
[ppc64_result=1],
|
|
[ppc64_result=0])
|
|
;;
|
|
*)
|
|
ppc64_result=0
|
|
;;
|
|
esac
|
|
|
|
if test "$ppc64_result" = "1" ; then
|
|
AC_MSG_RESULT([yes])
|
|
ifelse([$1],,:,[$1])
|
|
else
|
|
AC_MSG_RESULT([no])
|
|
ifelse([$2],,:,[$2])
|
|
fi
|
|
|
|
unset ppc64_result ldarx_asm
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_SPARCV8PLUS
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_SPARCV8PLUS],[
|
|
AC_MSG_CHECKING([if have Sparc v8+/v9 support])
|
|
sparc_result=0
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
casa [%o0] 0x80, %o1, %o2],
|
|
[sparc_result=1],
|
|
[sparc_result=0])
|
|
if test "$sparc_result" = "1" ; then
|
|
AC_MSG_RESULT([yes])
|
|
ifelse([$1],,:,[$1])
|
|
else
|
|
AC_MSG_RESULT([no])
|
|
ifelse([$2],,:,[$2])
|
|
fi
|
|
|
|
unset sparc_result
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_CMPXCHG16B
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CMPXCHG16B_TEST_SOURCE],[[
|
|
#include <stdint.h>
|
|
#include <assert.h>
|
|
|
|
union opal_counted_pointer_t {
|
|
struct {
|
|
uint64_t counter;
|
|
uint64_t item;
|
|
} data;
|
|
#if defined(HAVE___INT128) && HAVE___INT128
|
|
__int128 value;
|
|
#elif defined(HAVE_INT128_T) && HAVE_INT128_T
|
|
int128_t value;
|
|
#endif
|
|
};
|
|
typedef union opal_counted_pointer_t opal_counted_pointer_t;
|
|
|
|
int main(int argc, char* argv) {
|
|
volatile opal_counted_pointer_t a;
|
|
opal_counted_pointer_t b;
|
|
|
|
a.data.counter = 0;
|
|
a.data.item = 0x1234567890ABCDEF;
|
|
|
|
b.data.counter = a.data.counter;
|
|
b.data.item = a.data.item;
|
|
|
|
/* bozo checks */
|
|
assert(16 == sizeof(opal_counted_pointer_t));
|
|
assert(a.data.counter == b.data.counter);
|
|
assert(a.data.item == b.data.item);
|
|
/*
|
|
* the following test fails on buggy compilers
|
|
* so far, with icc -o conftest conftest.c
|
|
* - intel icc 14.0.0.080 (aka 2013sp1)
|
|
* - intel icc 14.0.1.106 (aka 2013sp1u1)
|
|
* older and more recents compilers work fine
|
|
* buggy compilers work also fine but only with -O0
|
|
*/
|
|
#if (defined(HAVE___INT128) && HAVE___INT128) || (defined(HAVE_INT128_T) && HAVE_INT128_T)
|
|
return (a.value != b.value);
|
|
#else
|
|
return 0;
|
|
#endif
|
|
}
|
|
]])
|
|
|
|
AC_DEFUN([OPAL_CHECK_CMPXCHG16B],[
|
|
OPAL_VAR_SCOPE_PUSH([cmpxchg16b_result])
|
|
|
|
OPAL_ASM_CHECK_ATOMIC_FUNC([cmpxchg16b],
|
|
[AC_LANG_PROGRAM([[unsigned char tmp[16];]],
|
|
[[__asm__ __volatile__ ("lock cmpxchg16b (%%rsi)" : : "S" (tmp) : "memory", "cc");]])],
|
|
[cmpxchg16b_result=1],
|
|
[cmpxchg16b_result=0])
|
|
# If we have it, make sure it works.
|
|
AS_IF([test $cmpxchg16b_result -eq 1],
|
|
[AC_MSG_CHECKING([if cmpxchg16b_result works])
|
|
AC_RUN_IFELSE([AC_LANG_SOURCE(OPAL_CMPXCHG16B_TEST_SOURCE)],
|
|
[AC_MSG_RESULT([yes])],
|
|
[cmpxchg16b_result=0
|
|
AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([cannot test -- assume yes (cross compiling)])])
|
|
])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_CMPXCHG16B], [$cmpxchg16b_result],
|
|
[Whether the processor supports the cmpxchg16b instruction])
|
|
OPAL_VAR_SCOPE_POP
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_INLINE_GCC
|
|
dnl
|
|
dnl Check if the compiler is capable of doing GCC-style inline
|
|
dnl assembly. Some compilers emit a warning and ignore the inline
|
|
dnl assembly (xlc on OS X) and compile without error. Therefore,
|
|
dnl the test attempts to run the emitted code to check that the
|
|
dnl assembly is actually run. To run this test, one argument to
|
|
dnl the macro must be an assembly instruction in gcc format to move
|
|
dnl the value 0 into the register containing the variable ret.
|
|
dnl For PowerPC, this would be:
|
|
dnl
|
|
dnl "li %0,0" : "=&r"(ret)
|
|
dnl
|
|
dnl For testing ia32 assembly, the assembly instruction xaddl is
|
|
dnl tested. The xaddl instruction is used by some of the atomic
|
|
dnl implementations so it makes sense to test for it. In addition,
|
|
dnl some compilers (i.e. earlier versions of Sun Studio 12) do not
|
|
dnl necessarily handle xaddl properly, so that needs to be detected
|
|
dnl during configure time.
|
|
dnl
|
|
dnl DEFINE OPAL_GCC_INLINE_ASSEMBLY to 0 or 1 depending on GCC
|
|
dnl support
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_INLINE_C_GCC],[
|
|
assembly="$1"
|
|
asm_result="unknown"
|
|
|
|
AC_MSG_CHECKING([if $CC supports GCC inline assembly])
|
|
|
|
if test ! "$assembly" = "" ; then
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([AC_INCLUDES_DEFAULT],[[
|
|
int ret = 1;
|
|
int negone = -1;
|
|
__asm__ __volatile__ ($assembly);
|
|
return ret;
|
|
]])],
|
|
[asm_result="yes"], [asm_result="no"],
|
|
[asm_result="unknown"])
|
|
else
|
|
assembly="test skipped - assuming no"
|
|
fi
|
|
|
|
# if we're cross compiling, just try to compile and figure good enough
|
|
if test "$asm_result" = "unknown" ; then
|
|
AC_LINK_IFELSE([AC_LANG_PROGRAM([AC_INCLUDES_DEFAULT],[[
|
|
int ret = 1;
|
|
int negone = -1;
|
|
__asm__ __volatile__ ($assembly);
|
|
return ret;
|
|
]])],
|
|
[asm_result="yes"], [asm_result="no"])
|
|
fi
|
|
|
|
AC_MSG_RESULT([$asm_result])
|
|
|
|
if test "$asm_result" = "yes" ; then
|
|
OPAL_C_GCC_INLINE_ASSEMBLY=1
|
|
opal_cv_asm_inline_supported="yes"
|
|
else
|
|
OPAL_C_GCC_INLINE_ASSEMBLY=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_C_GCC_INLINE_ASSEMBLY],
|
|
[$OPAL_C_GCC_INLINE_ASSEMBLY],
|
|
[Whether C compiler supports GCC style inline assembly])
|
|
|
|
unset OPAL_C_GCC_INLINE_ASSEMBLY assembly asm_result
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CONFIG_ASM
|
|
dnl
|
|
dnl DEFINE OPAL_ASSEMBLY_ARCH to something in sys/architecture.h
|
|
dnl DEFINE OPAL_ASSEMBLY_FORMAT to string containing correct
|
|
dnl format for assembly (not user friendly)
|
|
dnl SUBST OPAL_ASSEMBLY_FORMAT to string containing correct
|
|
dnl format for assembly (not user friendly)
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CONFIG_ASM],[
|
|
AC_REQUIRE([OPAL_SETUP_CC])
|
|
AC_REQUIRE([AM_PROG_AS])
|
|
|
|
AC_ARG_ENABLE([c11-atomics],[AC_HELP_STRING([--enable-c11-atomics],
|
|
[Enable use of C11 atomics if available (default: enabled)])])
|
|
|
|
AC_ARG_ENABLE([builtin-atomics],
|
|
[AC_HELP_STRING([--enable-builtin-atomics],
|
|
[Enable use of GCC built-in atomics (default: autodetect)])])
|
|
|
|
OPAL_CHECK_C11_CSWAP_INT128
|
|
opal_cv_asm_builtin="BUILTIN_NO"
|
|
OPAL_CHECK_GCC_ATOMIC_BUILTINS
|
|
|
|
if test "x$enable_c11_atomics" != "xno" && test "$opal_cv_c11_supported" = "yes" ; then
|
|
opal_cv_asm_builtin="BUILTIN_C11"
|
|
OPAL_CHECK_C11_CSWAP_INT128
|
|
elif test "x$enable_c11_atomics" = "xyes"; then
|
|
AC_MSG_WARN([C11 atomics were requested but are not supported])
|
|
AC_MSG_ERROR([Cannot continue])
|
|
elif test "$enable_builtin_atomics" = "yes" ; then
|
|
if test $opal_cv_have___atomic = "yes" ; then
|
|
opal_cv_asm_builtin="BUILTIN_GCC"
|
|
else
|
|
AC_MSG_WARN([GCC built-in atomics requested but not found.])
|
|
AC_MSG_ERROR([Cannot continue])
|
|
fi
|
|
fi
|
|
|
|
OPAL_CHECK_ASM_PROC
|
|
OPAL_CHECK_ASM_TEXT
|
|
OPAL_CHECK_ASM_GLOBAL
|
|
OPAL_CHECK_ASM_GNU_STACKEXEC
|
|
OPAL_CHECK_ASM_LABEL_SUFFIX
|
|
OPAL_CHECK_ASM_GSYM
|
|
OPAL_CHECK_ASM_LSYM
|
|
OPAL_CHECK_ASM_TYPE
|
|
OPAL_CHECK_ASM_SIZE
|
|
OPAL_CHECK_ASM_ALIGN_LOG
|
|
|
|
# find our architecture for purposes of assembly stuff
|
|
opal_cv_asm_arch="UNSUPPORTED"
|
|
OPAL_GCC_INLINE_ASSIGN=""
|
|
if test "$opal_cv_have___atomic_64" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
else
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
fi
|
|
|
|
case "${host}" in
|
|
x86_64-*x32)
|
|
opal_cv_asm_arch="X86_64"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_GCC_INLINE_ASSIGN='"xaddl %1,%0" : "=m"(ret), "+r"(negone) : "m"(ret)'
|
|
;;
|
|
i?86-*|x86_64*|amd64*)
|
|
if test "$ac_cv_sizeof_long" = "4" ; then
|
|
opal_cv_asm_arch="IA32"
|
|
else
|
|
opal_cv_asm_arch="X86_64"
|
|
fi
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_GCC_INLINE_ASSIGN='"xaddl %1,%0" : "=m"(ret), "+r"(negone) : "m"(ret)'
|
|
OPAL_CHECK_CMPXCHG16B
|
|
;;
|
|
|
|
aarch64*)
|
|
opal_cv_asm_arch="ARM64"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_ASM_ARM_VERSION=8
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
armv7*|arm-*-linux-gnueabihf)
|
|
opal_cv_asm_arch="ARM"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_ASM_ARM_VERSION=7
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
armv6*)
|
|
opal_cv_asm_arch="ARM"
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
OPAL_ASM_ARM_VERSION=6
|
|
CCASFLAGS="$CCASFLAGS -march=armv7-a"
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
powerpc-*|powerpc64-*|powerpcle-*|powerpc64le-*|rs6000-*|ppc-*)
|
|
OPAL_CHECK_POWERPC_REG
|
|
if test "$ac_cv_sizeof_long" = "4" ; then
|
|
opal_cv_asm_arch="POWERPC32"
|
|
|
|
# Note that on some platforms (Apple G5), even if we are
|
|
# compiling in 32 bit mode (and therefore should assume
|
|
# sizeof(long) == 4), we can use the 64 bit test and set
|
|
# operations.
|
|
OPAL_CHECK_POWERPC_64BIT(OPAL_ASM_SUPPORT_64BIT=1)
|
|
elif test "$ac_cv_sizeof_long" = "8" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
opal_cv_asm_arch="POWERPC64"
|
|
else
|
|
AC_MSG_ERROR([Could not determine PowerPC word size: $ac_cv_sizeof_long])
|
|
fi
|
|
OPAL_GCC_INLINE_ASSIGN='"1: li %0,0" : "=&r"(ret)'
|
|
;;
|
|
sparc*-*)
|
|
# SPARC v9 (and above) are the only ones with 64bit support
|
|
# if compiling 32 bit, see if we are v9 (aka v8plus) or
|
|
# earlier (casa is v8+/v9).
|
|
if test "$ac_cv_sizeof_long" = "4" ; then
|
|
have_v8plus=0
|
|
OPAL_CHECK_SPARCV8PLUS([have_v8plus=1])
|
|
if test "$have_v8plus" = "0" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
opal_cv_asm_arch="SPARC"
|
|
AC_MSG_WARN([Sparc v8 target is not supported in this release of Open MPI.])
|
|
AC_MSG_WARN([You must specify the target architecture v8plus to compile])
|
|
AC_MSG_WARN([Open MPI in 32 bit mode on Sparc processors (see the README).])
|
|
AC_MSG_ERROR([Can not continue.])
|
|
else
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
opal_cv_asm_arch="SPARCV9_32"
|
|
fi
|
|
|
|
elif test "$ac_cv_sizeof_long" = "8" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
opal_cv_asm_arch="SPARCV9_64"
|
|
else
|
|
AC_MSG_ERROR([Could not determine Sparc word size: $ac_cv_sizeof_long])
|
|
fi
|
|
OPAL_GCC_INLINE_ASSIGN='"mov 0,%0" : "=&r"(ret)'
|
|
;;
|
|
|
|
*)
|
|
if test $opal_cv_have___atomic = "yes" ; then
|
|
opal_cv_asm_builtin="BUILTIN_GCC"
|
|
else
|
|
AC_MSG_ERROR([No atomic primitives available for $host])
|
|
fi
|
|
;;
|
|
esac
|
|
|
|
if ! test -z "$OPAL_ASM_ARM_VERSION" ; then
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ARM_VERSION], [$OPAL_ASM_ARM_VERSION],
|
|
[What ARM assembly version to use])
|
|
fi
|
|
|
|
if test "$opal_cv_asm_builtin" = "BUILTIN_GCC" ; then
|
|
AC_DEFINE([OPAL_C_GCC_INLINE_ASSEMBLY], [1],
|
|
[Whether C compiler supports GCC style inline assembly])
|
|
else
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_SUPPORT_64BIT],
|
|
[$OPAL_ASM_SUPPORT_64BIT],
|
|
[Whether we can do 64bit assembly operations or not. Should not be used outside of the assembly header files])
|
|
AC_SUBST([OPAL_ASM_SUPPORT_64BIT])
|
|
|
|
opal_cv_asm_inline_supported="no"
|
|
# now that we know our architecture, try to inline assemble
|
|
OPAL_CHECK_INLINE_C_GCC([$OPAL_GCC_INLINE_ASSIGN])
|
|
|
|
# format:
|
|
# config_file-text-global-label_suffix-gsym-lsym-type-size-align_log-ppc_r_reg-64_bit-gnu_stack
|
|
asm_format="${opal_asm_arch_config}"
|
|
asm_format="${asm_format}-${opal_cv_asm_text}-${opal_cv_asm_global}"
|
|
asm_format="${asm_format}-${opal_cv_asm_label_suffix}-${opal_cv_asm_gsym}"
|
|
asm_format="${asm_format}-${opal_cv_asm_lsym}"
|
|
asm_format="${asm_format}-${opal_cv_asm_type}-${opal_asm_size}"
|
|
asm_format="${asm_format}-${opal_asm_align_log_result}"
|
|
if test "$opal_cv_asm_arch" = "POWERPC32" || test "$opal_cv_asm_arch" = "POWERPC64" ; then
|
|
asm_format="${asm_format}-${opal_cv_asm_powerpc_r_reg}"
|
|
else
|
|
asm_format="${asm_format}-1"
|
|
fi
|
|
asm_format="${asm_format}-${OPAL_ASM_SUPPORT_64BIT}"
|
|
opal_cv_asm_format="${asm_format}-${opal_cv_asm_gnu_stack}"
|
|
# For the Makefile, need to escape the $ as $$. Don't display
|
|
# this version, but make sure the Makefile gives the right thing
|
|
# when regenerating the files because the base has been touched.
|
|
OPAL_ASSEMBLY_FORMAT=`echo "$opal_cv_asm_format" | sed -e 's/\\\$/\\\$\\\$/'`
|
|
|
|
AC_MSG_CHECKING([for assembly format])
|
|
AC_MSG_RESULT([$opal_cv_asm_format])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_FORMAT], ["$OPAL_ASSEMBLY_FORMAT"],
|
|
[Format of assembly file])
|
|
AC_SUBST([OPAL_ASSEMBLY_FORMAT])
|
|
fi # if opal_cv_asm_builtin = BUILTIN_GCC
|
|
|
|
result="OPAL_$opal_cv_asm_arch"
|
|
OPAL_ASSEMBLY_ARCH="$opal_cv_asm_arch"
|
|
AC_MSG_CHECKING([for assembly architecture])
|
|
AC_MSG_RESULT([$opal_cv_asm_arch])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_ARCH], [$result],
|
|
[Architecture type of assembly to use for atomic operations and CMA])
|
|
AC_SUBST([OPAL_ASSEMBLY_ARCH])
|
|
|
|
# Check for RDTSCP support
|
|
result=0
|
|
AS_IF([test "$opal_cv_asm_arch" = "OPAL_X86_64" || test "$opal_cv_asm_arch" = "OPAL_IA32"],
|
|
[AC_MSG_CHECKING([for RDTSCP assembly support])
|
|
AC_LANG_PUSH([C])
|
|
AC_TRY_RUN([[
|
|
int main(int argc, char* argv[])
|
|
{
|
|
unsigned int rax, rdx;
|
|
__asm__ __volatile__ ("rdtscp\n": "=a" (rax), "=d" (rdx):: "%rax", "%rdx");
|
|
return 0;
|
|
}
|
|
]],
|
|
[result=1
|
|
AC_MSG_RESULT([yes])],
|
|
[AC_MSG_RESULT([no])],
|
|
[#cross compile not supported
|
|
AC_MSG_RESULT(["no (cross compiling)"])])
|
|
AC_LANG_POP([C])])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_SUPPORTS_RDTSCP], [$result],
|
|
[Whether we have support for RDTSCP instruction])
|
|
|
|
result="OPAL_$opal_cv_asm_builtin"
|
|
OPAL_ASSEMBLY_BUILTIN="$opal_cv_asm_builtin"
|
|
AC_MSG_CHECKING([for builtin atomics])
|
|
AC_MSG_RESULT([$opal_cv_asm_builtin])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_BUILTIN], [$result],
|
|
[Whether to use builtin atomics])
|
|
AC_SUBST([OPAL_ASSEMBLY_BUILTIN])
|
|
|
|
OPAL_ASM_FIND_FILE
|
|
|
|
unset result asm_format
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_ASM_FIND_FILE
|
|
dnl
|
|
dnl
|
|
dnl do all the evil mojo to provide a working assembly file
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_ASM_FIND_FILE], [
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
AC_REQUIRE([AC_PROG_FGREP])
|
|
|
|
if test "$opal_cv_asm_arch" != "WINDOWS" && test "$opal_cv_asm_builtin" != "BUILTIN_GCC" && test "$opal_cv_asm_builtin" != "BUILTIN_OSX" && test "$opal_cv_asm_inline_arch" = "no" ; then
|
|
AC_MSG_ERROR([no atomic support available. exiting])
|
|
else
|
|
# On windows with VC++, atomics are done with compiler primitives
|
|
opal_cv_asm_file=""
|
|
fi
|
|
])dnl
|