e77874bbaf
test for both 32 and 64 bits. clang only support 32 bits builtin atomics when -m32 is used Thanks Paul Hargrove for reporting this. Signed-off-by: Gilles Gouaillardet <gilles@rist.or.jp>
1318 строки
46 KiB
Plaintext
1318 строки
46 KiB
Plaintext
dnl
|
|
dnl Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
|
|
dnl University Research and Technology
|
|
dnl Corporation. All rights reserved.
|
|
dnl Copyright (c) 2004-2015 The University of Tennessee and The University
|
|
dnl of Tennessee Research Foundation. All rights
|
|
dnl reserved.
|
|
dnl Copyright (c) 2004-2006 High Performance Computing Center Stuttgart,
|
|
dnl University of Stuttgart. All rights reserved.
|
|
dnl Copyright (c) 2004-2005 The Regents of the University of California.
|
|
dnl All rights reserved.
|
|
dnl Copyright (c) 2008-2015 Cisco Systems, Inc. All rights reserved.
|
|
dnl Copyright (c) 2010 Oracle and/or its affiliates. All rights reserved.
|
|
dnl Copyright (c) 2015-2017 Research Organization for Information Science
|
|
dnl and Technology (RIST). All rights reserved.
|
|
dnl Copyright (c) 2014-2017 Los Alamos National Security, LLC. All rights
|
|
dnl reserved.
|
|
dnl Copyright (c) 2017 Amazon.com, Inc. or its affiliates. All Rights
|
|
dnl reserved.
|
|
dnl $COPYRIGHT$
|
|
dnl
|
|
dnl Additional copyrights may follow
|
|
dnl
|
|
dnl $HEADER$
|
|
dnl
|
|
|
|
|
|
AC_DEFUN([OPAL_CHECK_SYNC_BUILTIN_CSWAP_INT128], [
|
|
|
|
OPAL_VAR_SCOPE_PUSH([sync_bool_compare_and_swap_128_result CFLAGS_save])
|
|
|
|
AC_ARG_ENABLE([cross-cmpset128],[AC_HELP_STRING([--enable-cross-cmpset128],
|
|
[enable the use of the __sync builtin atomic compare-and-swap 128 when cross compiling])])
|
|
|
|
sync_bool_compare_and_swap_128_result=0
|
|
|
|
if test ! "$enable_cross_cmpset128" = "yes" ; then
|
|
AC_MSG_CHECKING([for processor support of __sync builtin atomic compare-and-swap on 128-bit values])
|
|
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [__int128 x = 0; __sync_bool_compare_and_swap (&x, 0, 1);])],
|
|
[AC_MSG_RESULT([yes])
|
|
sync_bool_compare_and_swap_128_result=1],
|
|
[AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([no (cross compiling)])])
|
|
|
|
if test $sync_bool_compare_and_swap_128_result = 0 ; then
|
|
CFLAGS_save=$CFLAGS
|
|
CFLAGS="$CFLAGS -mcx16"
|
|
|
|
AC_MSG_CHECKING([for __sync builtin atomic compare-and-swap on 128-bit values with -mcx16 flag])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [__int128 x = 0; __sync_bool_compare_and_swap (&x, 0, 1);])],
|
|
[AC_MSG_RESULT([yes])
|
|
sync_bool_compare_and_swap_128_result=1
|
|
CFLAGS_save="$CFLAGS"],
|
|
[AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([no (cross compiling)])])
|
|
|
|
CFLAGS=$CFLAGS_save
|
|
fi
|
|
else
|
|
AC_MSG_CHECKING([for compiler support of __sync builtin atomic compare-and-swap on 128-bit values])
|
|
|
|
# Check if the compiler supports the __sync builtin
|
|
AC_TRY_LINK([], [__int128 x = 0; __sync_bool_compare_and_swap (&x, 0, 1);],
|
|
[AC_MSG_RESULT([yes])
|
|
sync_bool_compare_and_swap_128_result=1],
|
|
[AC_MSG_RESULT([no])])
|
|
|
|
if test $sync_bool_compare_and_swap_128_result = 0 ; then
|
|
CFLAGS_save=$CFLAGS
|
|
CFLAGS="$CFLAGS -mcx16"
|
|
|
|
AC_MSG_CHECKING([for __sync builtin atomic compare-and-swap on 128-bit values with -mcx16 flag])
|
|
AC_TRY_LINK([], [__int128 x = 0; __sync_bool_compare_and_swap (&x, 0, 1);],
|
|
[AC_MSG_RESULT([yes])
|
|
sync_bool_compare_and_swap_128_result=1
|
|
CFLAGS_save="$CFLAGS"],
|
|
[AC_MSG_RESULT([no])])
|
|
|
|
CFLAGS=$CFLAGS_save
|
|
fi
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_SYNC_BUILTIN_CSWAP_INT128], [$sync_bool_compare_and_swap_128_result],
|
|
[Whether the __sync builtin atomic compare and swap supports 128-bit values])
|
|
|
|
OPAL_VAR_SCOPE_POP
|
|
])
|
|
|
|
AC_DEFUN([OPAL_CHECK_SYNC_BUILTINS], [
|
|
AC_MSG_CHECKING([for __sync builtin atomics])
|
|
|
|
AC_TRY_LINK([long tmp;], [__sync_synchronize();
|
|
__sync_bool_compare_and_swap(&tmp, 0, 1);
|
|
__sync_add_and_fetch(&tmp, 1);],
|
|
[AC_MSG_RESULT([yes])
|
|
$1],
|
|
[AC_MSG_RESULT([no])
|
|
$2])
|
|
|
|
AC_MSG_CHECKING([for 64-bit __sync builtin atomics])
|
|
|
|
AC_TRY_LINK([
|
|
#include <stdint.h>
|
|
uint64_t tmp;], [
|
|
__sync_bool_compare_and_swap(&tmp, 0, 1);
|
|
__sync_add_and_fetch(&tmp, 1);],
|
|
[AC_MSG_RESULT([yes])
|
|
opal_asm_sync_have_64bit=1],
|
|
[AC_MSG_RESULT([no])
|
|
opal_asm_sync_have_64bit=0])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_SYNC_HAVE_64BIT],[$opal_asm_sync_have_64bit],
|
|
[Whether 64-bit is supported by the __sync builtin atomics])
|
|
|
|
# Check for 128-bit support
|
|
OPAL_CHECK_SYNC_BUILTIN_CSWAP_INT128
|
|
])
|
|
|
|
|
|
AC_DEFUN([OPAL_CHECK_GCC_BUILTIN_CSWAP_INT128], [
|
|
|
|
OPAL_VAR_SCOPE_PUSH([atomic_compare_exchange_n_128_result CFLAGS_save])
|
|
|
|
AC_ARG_ENABLE([cross-cmpset128],[AC_HELP_STRING([--enable-cross-cmpset128],
|
|
[enable the use of the __sync builtin atomic compare-and-swap 128 when cross compiling])])
|
|
|
|
atomic_compare_exchange_n_128_result=0
|
|
|
|
if test ! "$enable_cross_cmpset128" = "yes" ; then
|
|
AC_MSG_CHECKING([for processor support of __atomic builtin atomic compare-and-swap on 128-bit values])
|
|
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [__int128 x = 0, y = 0; __atomic_compare_exchange_n (&x, &y, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);])],
|
|
[AC_MSG_RESULT([yes])
|
|
atomic_compare_exchange_n_128_result=1],
|
|
[AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([no (cross compiling)])])
|
|
|
|
if test $atomic_compare_exchange_n_128_result = 0 ; then
|
|
CFLAGS_save=$CFLAGS
|
|
CFLAGS="$CFLAGS -mcx16"
|
|
|
|
AC_MSG_CHECKING([for __atomic builtin atomic compare-and-swap on 128-bit values with -mcx16 flag])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [__int128 x = 0, y = 0; __atomic_compare_exchange_n (&x, &y, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);])],
|
|
[AC_MSG_RESULT([yes])
|
|
atomic_compare_exchange_n_128_result=1
|
|
CFLAGS_save="$CFLAGS"],
|
|
[AC_MSG_RESULT([no])],
|
|
[AC_MSG_RESULT([no (cross compiling)])])
|
|
|
|
CFLAGS=$CFLAGS_save
|
|
fi
|
|
|
|
if test $atomic_compare_exchange_n_128_result = 1 ; then
|
|
AC_MSG_CHECKING([if __int128 atomic compare-and-swap is always lock-free])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([], [if (!__atomic_always_lock_free(16, 0)) { return 1; }])],
|
|
[AC_MSG_RESULT([yes])],
|
|
[AC_MSG_RESULT([no])
|
|
OPAL_CHECK_SYNC_BUILTIN_CSWAP_INT128
|
|
atomic_compare_exchange_n_128_result=0],
|
|
[AC_MSG_RESULT([no (cross compiling)])])
|
|
fi
|
|
else
|
|
AC_MSG_CHECKING([for compiler support of __atomic builtin atomic compare-and-swap on 128-bit values])
|
|
|
|
# Check if the compiler supports the __atomic builtin
|
|
AC_TRY_LINK([], [__int128 x = 0, y = 0; __atomic_compare_exchange_n (&x, &y, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);],
|
|
[AC_MSG_RESULT([yes])
|
|
atomic_compare_exchange_n_128_result=1],
|
|
[AC_MSG_RESULT([no])])
|
|
|
|
if test $atomic_compare_exchange_n_128_result = 0 ; then
|
|
CFLAGS_save=$CFLAGS
|
|
CFLAGS="$CFLAGS -mcx16"
|
|
|
|
AC_MSG_CHECKING([for __atomic builtin atomic compare-and-swap on 128-bit values with -mcx16 flag])
|
|
AC_TRY_LINK([], [__int128 x = 0, y = 0; __atomic_compare_exchange_n (&x, &y, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);],
|
|
[AC_MSG_RESULT([yes])
|
|
atomic_compare_exchange_n_128_result=1
|
|
CFLAGS_save="$CFLAGS"],
|
|
[AC_MSG_RESULT([no])])
|
|
|
|
CFLAGS=$CFLAGS_save
|
|
fi
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_GCC_BUILTIN_CSWAP_INT128], [$atomic_compare_exchange_n_128_result],
|
|
[Whether the __atomic builtin atomic compare and swap is lock-free on 128-bit values])
|
|
|
|
OPAL_VAR_SCOPE_POP
|
|
])
|
|
|
|
AC_DEFUN([OPAL_CHECK_GCC_ATOMIC_BUILTINS], [
|
|
AC_MSG_CHECKING([for __atomic builtin atomics])
|
|
|
|
AC_TRY_LINK([
|
|
#include <stdint.h>
|
|
uint32_t tmp, old = 0;
|
|
uint64_t tmp64, old64 = 0;], [
|
|
__atomic_thread_fence(__ATOMIC_SEQ_CST);
|
|
__atomic_compare_exchange_n(&tmp, &old, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
__atomic_add_fetch(&tmp, 1, __ATOMIC_RELAXED);
|
|
__atomic_compare_exchange_n(&tmp64, &old64, 1, 0, __ATOMIC_RELAXED, __ATOMIC_RELAXED);
|
|
__atomic_add_fetch(&tmp64, 1, __ATOMIC_RELAXED);],
|
|
[AC_MSG_RESULT([yes])
|
|
$1],
|
|
[AC_MSG_RESULT([no])
|
|
$2])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_SYNC_HAVE_64BIT],[$opal_asm_sync_have_64bit],
|
|
[Whether 64-bit is supported by the __sync builtin atomics])
|
|
|
|
# Check for 128-bit support
|
|
OPAL_CHECK_GCC_BUILTIN_CSWAP_INT128
|
|
])
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_TEXT
|
|
dnl
|
|
dnl Determine how to set current mode as text.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_TEXT],[
|
|
AC_MSG_CHECKING([directive for setting text section])
|
|
opal_cv_asm_text=""
|
|
if test "$opal_cv_c_compiler_vendor" = "microsoft" ; then
|
|
# text section will be brought in with the rest of
|
|
# header for MS - leave blank for now
|
|
opal_cv_asm_text=""
|
|
else
|
|
case $host in
|
|
*-aix*)
|
|
opal_cv_asm_text=[".csect .text[PR]"]
|
|
;;
|
|
*)
|
|
opal_cv_asm_text=".text"
|
|
;;
|
|
esac
|
|
fi
|
|
AC_MSG_RESULT([$opal_cv_asm_text])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_TEXT], ["$opal_cv_asm_text"],
|
|
[Assembly directive for setting text section])
|
|
OPAL_ASM_TEXT="$opal_cv_asm_text"
|
|
AC_SUBST(OPAL_ASM_TEXT)
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_GLOBAL
|
|
dnl
|
|
dnl Sets OPAL_ASM_GLOBAL to the value to prefix global values
|
|
dnl
|
|
dnl I'm sure if I don't have a test for this, there will be some
|
|
dnl dumb platform that uses something else
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_GLOBAL],[
|
|
AC_MSG_CHECKING([directive for exporting symbols])
|
|
opal_cv_asm_global=""
|
|
if test "$opal_cv_c_compiler_vendor" = "microsoft" ; then
|
|
opal_cv_asm_global="PUBLIC"
|
|
else
|
|
case $host in
|
|
*)
|
|
opal_cv_asm_global=".globl"
|
|
;;
|
|
esac
|
|
fi
|
|
AC_MSG_RESULT([$opal_cv_asm_global])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_GLOBAL], ["$opal_cv_asm_global"],
|
|
[Assembly directive for exporting symbols])
|
|
OPAL_ASM_GLOBAL="$opal_cv_asm_global"
|
|
AC_SUBST(OPAL_AS_GLOBAL)
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_LSYM
|
|
dnl
|
|
dnl Sets OPAL_ASM_LSYM to the prefix value on a symbol to make it
|
|
dnl an internal label (jump target and whatnot)
|
|
dnl
|
|
dnl We look for L .L $ L$ (in that order) for something that both
|
|
dnl assembles and does not leave a label in the output of nm. Fall
|
|
dnl back to L if nothing else seems to work :/
|
|
dnl
|
|
dnl #################################################################
|
|
|
|
# _OPAL_CHECK_ASM_LSYM([variable-to-set])
|
|
# ---------------------------------------
|
|
AC_DEFUN([_OPAL_CHECK_ASM_LSYM],[
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
|
|
$1="L"
|
|
|
|
for sym in L .L $ L$ ; do
|
|
asm_result=0
|
|
echo "configure: trying $sym" >&AC_FD_CC
|
|
OPAL_TRY_ASSEMBLE([foobar$opal_cv_asm_label_suffix
|
|
${sym}mytestlabel$opal_cv_asm_label_suffix],
|
|
[# ok, we succeeded at assembling. see if we can nm,
|
|
# throwing the results in a file
|
|
if $NM conftest.$OBJEXT > conftest.out 2>&AC_FD_CC ; then
|
|
if test "`$GREP mytestlabel conftest.out`" = "" ; then
|
|
# there was no symbol... looks promising to me
|
|
$1="$sym"
|
|
asm_result=1
|
|
elif test ["`$GREP ' [Nt] .*mytestlabel' conftest.out`"] = "" ; then
|
|
# see if we have a non-global-ish symbol
|
|
# but we should see if we can do better.
|
|
$1="$sym"
|
|
fi
|
|
else
|
|
# not so much on the NM goodness :/
|
|
echo "$NM failed. Output from NM was:" >&AC_FD_CC
|
|
cat conftest.out >&AC_FD_CC
|
|
AC_MSG_WARN([$NM could not read object file])
|
|
fi
|
|
])
|
|
if test "$asm_result" = "1" ; then
|
|
break
|
|
fi
|
|
done
|
|
rm -f conftest.out
|
|
unset asm_result sym
|
|
])
|
|
|
|
# OPAL_CHECK_ASM_LSYM()
|
|
# ---------------------
|
|
AC_DEFUN([OPAL_CHECK_ASM_LSYM],[
|
|
AC_REQUIRE([AC_PROG_NM])
|
|
|
|
AC_CACHE_CHECK([prefix for lsym labels],
|
|
[opal_cv_asm_lsym],
|
|
[_OPAL_CHECK_ASM_LSYM([opal_cv_asm_lsym])])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_LSYM], ["$opal_cv_asm_lsym"],
|
|
[Assembly prefix for lsym labels])
|
|
OPAL_ASM_LSYM="$opal_cv_asm_lsym"
|
|
AC_SUBST(OPAL_ASM_LSYM)
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_PROC
|
|
dnl
|
|
dnl Sets a cv-flag, if the compiler needs a proc/endp-definition to
|
|
dnl link with C.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_PROC],[
|
|
AC_CACHE_CHECK([if .proc/endp is needed],
|
|
[opal_cv_asm_need_proc],
|
|
[opal_cv_asm_need_proc="no"
|
|
OPAL_TRY_ASSEMBLE([
|
|
.proc mysym
|
|
mysym:
|
|
.endp mysym],
|
|
[opal_cv_asm_need_proc="yes"])
|
|
rm -f conftest.out])
|
|
|
|
if test "$opal_cv_asm_need_proc" = "yes" ; then
|
|
opal_cv_asm_proc=".proc"
|
|
opal_cv_asm_endproc=".endp"
|
|
else
|
|
opal_cv_asm_proc="#"
|
|
opal_cv_asm_endproc="#"
|
|
fi
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_GSYM
|
|
dnl
|
|
dnl Sets OPAL_ASM_GSYM to the prefix value on a symbol to make it
|
|
dnl a global linkable from C. Basically, an _ or not.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_GSYM],[
|
|
AC_CACHE_CHECK([prefix for global symbol labels],
|
|
[opal_cv_asm_gsym],
|
|
[_OPAL_CHECK_ASM_GSYM])
|
|
|
|
if test "$opal_cv_asm_gsym" = "none" ; then
|
|
AC_MSG_ERROR([Could not determine global symbol label prefix])
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_GSYM], ["$opal_cv_asm_gsym"],
|
|
[Assembly prefix for gsym labels])
|
|
OPAL_ASM_GSYM="$opal_cv_asm_gsym"
|
|
AC_SUBST(OPAL_ASM_GSYM)
|
|
|
|
])
|
|
|
|
AC_DEFUN([_OPAL_CHECK_ASM_GSYM],[
|
|
opal_cv_asm_gsym="none"
|
|
|
|
for sym in "_" "" "." ; do
|
|
asm_result=0
|
|
echo "configure: trying $sym" >&AC_FD_CC
|
|
cat > conftest_c.c <<EOF
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
void gsym_test_func(void);
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
int
|
|
main()
|
|
{
|
|
gsym_test_func();
|
|
return 0;
|
|
}
|
|
EOF
|
|
OPAL_TRY_ASSEMBLE([
|
|
$opal_cv_asm_text
|
|
$opal_cv_asm_proc ${sym}gsym_test_func
|
|
$opal_cv_asm_global ${sym}gsym_test_func
|
|
${sym}gsym_test_func${opal_cv_asm_label_suffix}
|
|
$opal_cv_asm_endproc ${sym}gsym_test_func
|
|
],
|
|
[opal_compile="$CC $CFLAGS -I. conftest_c.c -c > conftest.cmpl 2>&1"
|
|
if AC_TRY_EVAL(opal_compile) ; then
|
|
# save the warnings
|
|
cat conftest.cmpl >&AC_FD_CC
|
|
opal_link="$CC $CFLAGS conftest_c.$OBJEXT conftest.$OBJEXT -o conftest $LDFLAGS $LIBS > conftest.link 2>&1"
|
|
if AC_TRY_EVAL(opal_link) ; then
|
|
# save the warnings
|
|
cat conftest.link >&AC_FD_CC
|
|
asm_result=1
|
|
else
|
|
cat conftest.link >&AC_FD_CC
|
|
echo "configure: failed C program was: " >&AC_FD_CC
|
|
cat conftest_c.c >&AC_FD_CC
|
|
echo "configure: failed ASM program was: " >&AC_FD_CC
|
|
cat conftest.s >&AC_FD_CC
|
|
asm_result=0
|
|
fi
|
|
else
|
|
# save output and failed program
|
|
cat conftest.cmpl >&AC_FD_CC
|
|
echo "configure: failed C program was: " >&AC_FD_CC
|
|
cat conftest.c >&AC_FD_CC
|
|
asm_result=0
|
|
fi],
|
|
[asm_result=0])
|
|
if test "$asm_result" = "1" ; then
|
|
opal_cv_asm_gsym="$sym"
|
|
break
|
|
fi
|
|
done
|
|
rm -rf conftest.*
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_LABEL_SUFFIX
|
|
dnl
|
|
dnl Sets OPAL_ASM_LABEL_SUFFIX to the value to suffix for labels
|
|
dnl
|
|
dnl I'm sure if I don't have a test for this, there will be some
|
|
dnl dumb platform that uses something else
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_LABEL_SUFFIX],[
|
|
AC_MSG_CHECKING([suffix for labels])
|
|
opal_cv_asm_label_suffix=""
|
|
case $host in
|
|
*)
|
|
opal_cv_asm_label_suffix=":"
|
|
;;
|
|
esac
|
|
AC_MSG_RESULT([$opal_cv_asm_label_suffix])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_LABEL_SUFFIX], ["$opal_cv_asm_label_suffix"],
|
|
[Assembly suffix for labels])
|
|
OPAL_ASM_LABEL_SUFFIX="$opal_cv_asm_label_suffix"
|
|
AC_SUBST(OPAL_AS_LABEL_SUFFIX)
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_ALIGN_LOG
|
|
dnl
|
|
dnl Sets OPAL_ASM_ALIGN_LOG to 1 if align is specified
|
|
dnl logarithmically, 0 otherwise
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_ALIGN_LOG],[
|
|
AC_REQUIRE([AC_PROG_NM])
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
|
|
AC_CACHE_CHECK([if .align directive takes logarithmic value],
|
|
[opal_cv_asm_align_log],
|
|
[ OPAL_TRY_ASSEMBLE([ $opal_cv_asm_text
|
|
.align 4
|
|
$opal_cv_asm_global foo
|
|
.byte 1
|
|
.align 4
|
|
foo$opal_cv_asm_label_suffix
|
|
.byte 2],
|
|
[opal_asm_addr=[`$NM conftest.$OBJEXT | $GREP foo | sed -e 's/.*\([0-9a-fA-F][0-9a-fA-F]\).*foo.*/\1/'`]],
|
|
[opal_asm_addr=""])
|
|
# test for both 16 and 10 (decimal and hex notations)
|
|
echo "configure: .align test address offset is $opal_asm_addr" >&AC_FD_CC
|
|
if test "$opal_asm_addr" = "16" || test "$opal_asm_addr" = "10" ; then
|
|
opal_cv_asm_align_log="yes"
|
|
else
|
|
opal_cv_asm_align_log="no"
|
|
fi])
|
|
|
|
if test "$opal_cv_asm_align_log" = "yes" || test "$opal_cv_asm_align_log" = "1" ; then
|
|
opal_asm_align_log_result=1
|
|
else
|
|
opal_asm_align_log_result=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ALIGN_LOG],
|
|
[$asm_align_log_result],
|
|
[Assembly align directive expects logarithmic value])
|
|
|
|
unset omp_asm_addr asm_result
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_TYPE
|
|
dnl
|
|
dnl Sets OPAL_ASM_TYPE to the prefix for the function type to
|
|
dnl set a symbol's type as function (needed on ELF for shared
|
|
dnl libaries). If no .type directive is needed, sets OPAL_ASM_TYPE
|
|
dnl to an empty string
|
|
dnl
|
|
dnl We look for @ \# %
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_TYPE],[
|
|
AC_CACHE_CHECK([prefix for function in .type],
|
|
[opal_cv_asm_type],
|
|
[_OPAL_CHECK_ASM_TYPE])
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_TYPE], ["$opal_cv_asm_type"],
|
|
[How to set function type in .type directive])
|
|
OPAL_ASM_TYPE="$opal_cv_asm_type"
|
|
AC_SUBST(OPAL_ASM_TYPE)
|
|
])
|
|
|
|
AC_DEFUN([_OPAL_CHECK_ASM_TYPE],[
|
|
opal_cv_asm_type=""
|
|
|
|
case "${host}" in
|
|
*-sun-solaris*)
|
|
# GCC on solaris seems to accept just about anything, not
|
|
# that what it defines actually works... So just hardwire
|
|
# to the right answer
|
|
opal_cv_asm_type="#"
|
|
;;
|
|
*)
|
|
for type in @ \# % ; do
|
|
asm_result=0
|
|
echo "configure: trying $type" >&AC_FD_CC
|
|
OPAL_TRY_ASSEMBLE([ .type mysym, ${type}function
|
|
mysym:],
|
|
[opal_cv_asm_type="${type}"
|
|
asm_result=1])
|
|
if test "$asm_result" = "1" ; then
|
|
break
|
|
fi
|
|
done
|
|
;;
|
|
esac
|
|
rm -f conftest.out
|
|
|
|
unset asm_result type
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_ASM_SIZE
|
|
dnl
|
|
dnl Sets OPAL_ASM_SIZE to 1 if we should set .size directives for
|
|
dnl each function, 0 otherwise.
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_ASM_SIZE],[
|
|
AC_CACHE_CHECK([if .size is needed],
|
|
[opal_cv_asm_need_size],
|
|
[opal_cv_asm_need_size="no"
|
|
OPAL_TRY_ASSEMBLE([ .size mysym, 1],
|
|
[opal_cv_asm_need_size="yes"])
|
|
rm -f conftest.out])
|
|
|
|
if test "$opal_cv_asm_need_size" = "yes" ; then
|
|
opal_asm_size=1
|
|
else
|
|
opal_asm_size=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_SIZE], ["$opal_asm_size"],
|
|
[Do we need to give a .size directive])
|
|
OPAL_ASM_SIZE="$opal_asm_size"
|
|
AC_SUBST(OPAL_ASM_TYPE)
|
|
unset asm_result
|
|
])dnl
|
|
|
|
|
|
# OPAL_CHECK_ASM_GNU_STACKEXEC(var)
|
|
# ----------------------------------
|
|
# sets shell variable var to the things necessary to
|
|
# disable execable stacks with GAS
|
|
AC_DEFUN([OPAL_CHECK_ASM_GNU_STACKEXEC], [
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
|
|
AC_CHECK_PROG([OBJDUMP], [objdump], [objdump])
|
|
AC_CACHE_CHECK([if .note.GNU-stack is needed],
|
|
[opal_cv_asm_gnu_stack_result],
|
|
[AS_IF([test "$OBJDUMP" != ""],
|
|
[ # first, see if a simple C program has it set
|
|
cat >conftest.c <<EOF
|
|
int testfunc() {return 0; }
|
|
EOF
|
|
OPAL_LOG_COMMAND([$CC $CFLAGS -c conftest.c -o conftest.$OBJEXT],
|
|
[$OBJDUMP -x conftest.$OBJEXT | $GREP '\.note\.GNU-stack' > /dev/null && opal_cv_asm_gnu_stack_result=yes],
|
|
[OPAL_LOG_MSG([the failed program was:], 1)
|
|
OPAL_LOG_FILE([conftest.c])
|
|
opal_cv_asm_gnu_stack_result=no])
|
|
if test "$opal_cv_asm_gnu_stack_result" != "yes" ; then
|
|
opal_cv_asm_gnu_stack_result="no"
|
|
fi
|
|
rm -rf conftest.*],
|
|
[opal_cv_asm_gnu_stack_result="no"])])
|
|
if test "$opal_cv_asm_gnu_stack_result" = "yes" ; then
|
|
opal_cv_asm_gnu_stack=1
|
|
else
|
|
opal_cv_asm_gnu_stack=0
|
|
fi
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_POWERPC_REG
|
|
dnl
|
|
dnl See if the notation for specifying registers is X (most everyone)
|
|
dnl or rX (OS X)
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_POWERPC_REG],[
|
|
AC_MSG_CHECKING([if PowerPC registers have r prefix])
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
addi 1,1,0],
|
|
[opal_cv_asm_powerpc_r_reg=0],
|
|
[OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
addi r1,r1,0],
|
|
[opal_cv_asm_powerpc_r_reg=1],
|
|
[AC_MSG_ERROR([Can not determine how to use PPC registers])])])
|
|
if test "$opal_cv_asm_powerpc_r_reg" = "1" ; then
|
|
AC_MSG_RESULT([yes])
|
|
else
|
|
AC_MSG_RESULT([no])
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_POWERPC_R_REGISTERS],
|
|
[$opal_cv_asm_powerpc_r_reg],
|
|
[Whether r notation is used for ppc registers])
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_POWERPC_64BIT
|
|
dnl
|
|
dnl On some powerpc chips (the PPC970 or G5), the OS usually runs in
|
|
dnl 32 bit mode, even though the hardware can do 64bit things. If
|
|
dnl the compiler will let us, emit code for 64bit test and set type
|
|
dnl operations (on a long long).
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_POWERPC_64BIT],[
|
|
if test "$ac_cv_sizeof_long" != "4" ; then
|
|
# this function should only be called in the 32 bit case
|
|
AC_MSG_ERROR([CHECK_POWERPC_64BIT called on 64 bit platform. Internal error.])
|
|
fi
|
|
AC_MSG_CHECKING([for 64-bit PowerPC assembly support])
|
|
case $host in
|
|
*-darwin*)
|
|
ppc64_result=0
|
|
if test "$opal_cv_asm_powerpc_r_reg" = "1" ; then
|
|
ldarx_asm=" ldarx r1,r1,r1";
|
|
else
|
|
ldarx_asm=" ldarx 1,1,1";
|
|
fi
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
$ldarx_asm],
|
|
[ppc64_result=1],
|
|
[ppc64_result=0])
|
|
;;
|
|
*)
|
|
ppc64_result=0
|
|
;;
|
|
esac
|
|
|
|
if test "$ppc64_result" = "1" ; then
|
|
AC_MSG_RESULT([yes])
|
|
ifelse([$1],,:,[$1])
|
|
else
|
|
AC_MSG_RESULT([no])
|
|
ifelse([$2],,:,[$2])
|
|
fi
|
|
|
|
unset ppc64_result ldarx_asm
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_SPARCV8PLUS
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_SPARCV8PLUS],[
|
|
AC_MSG_CHECKING([if have Sparc v8+/v9 support])
|
|
sparc_result=0
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
casa [%o0] 0x80, %o1, %o2],
|
|
[sparc_result=1],
|
|
[sparc_result=0])
|
|
if test "$sparc_result" = "1" ; then
|
|
AC_MSG_RESULT([yes])
|
|
ifelse([$1],,:,[$1])
|
|
else
|
|
AC_MSG_RESULT([no])
|
|
ifelse([$2],,:,[$2])
|
|
fi
|
|
|
|
unset sparc_result
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_CMPXCHG16B
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_CMPXCHG16B],[
|
|
OPAL_VAR_SCOPE_PUSH([cmpxchg16b_result])
|
|
|
|
AC_ARG_ENABLE([cross-cmpxchg16b],[AC_HELP_STRING([--enable-cross-cmpxchg16b],
|
|
[enable the use of the cmpxchg16b instruction when cross compiling])])
|
|
|
|
if test ! "$enable_cross_cmpxchg16b" = "yes" ; then
|
|
AC_MSG_CHECKING([if processor supports x86_64 16-byte compare-and-exchange])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([[unsigned char tmp[16];]],[[
|
|
__asm__ __volatile__ ("lock cmpxchg16b (%%rsi)" : : "S" (tmp) : "memory", "cc");]])],
|
|
[AC_MSG_RESULT([yes])
|
|
cmpxchg16b_result=1],
|
|
[AC_MSG_RESULT([no])
|
|
cmpxchg16b_result=0],
|
|
[AC_MSG_RESULT([no (cross-compiling)])
|
|
cmpxchg16b_result=0])
|
|
else
|
|
AC_MSG_CHECKING([if assembler supports x86_64 16-byte compare-and-exchange])
|
|
|
|
OPAL_TRY_ASSEMBLE([$opal_cv_asm_text
|
|
cmpxchg16b 0],
|
|
[AC_MSG_RESULT([yes])
|
|
cmpxchg16b_result=1],
|
|
[AC_MSG_RESULT([no])
|
|
cmpxchg16b_result=0])
|
|
fi
|
|
if test "$cmpxchg16b_result" = 1; then
|
|
AC_MSG_CHECKING([if compiler correctly handles volatile 128bits])
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([#include <stdint.h>
|
|
#include <assert.h>
|
|
|
|
union opal_counted_pointer_t {
|
|
struct {
|
|
uint64_t counter;
|
|
uint64_t item;
|
|
} data;
|
|
#if defined(HAVE___INT128) && HAVE___INT128
|
|
__int128 value;
|
|
#elif defined(HAVE_INT128_T) && HAVE_INT128_T
|
|
int128_t value;
|
|
#endif
|
|
};
|
|
typedef union opal_counted_pointer_t opal_counted_pointer_t;],
|
|
[volatile opal_counted_pointer_t a;
|
|
opal_counted_pointer_t b;
|
|
|
|
a.data.counter = 0;
|
|
a.data.item = 0x1234567890ABCDEF;
|
|
|
|
b.data.counter = a.data.counter;
|
|
b.data.item = a.data.item;
|
|
|
|
/* bozo checks */
|
|
assert(16 == sizeof(opal_counted_pointer_t));
|
|
assert(a.data.counter == b.data.counter);
|
|
assert(a.data.item == b.data.item);
|
|
/*
|
|
* the following test fails on buggy compilers
|
|
* so far, with icc -o conftest conftest.c
|
|
* - intel icc 14.0.0.080 (aka 2013sp1)
|
|
* - intel icc 14.0.1.106 (aka 2013sp1u1)
|
|
* older and more recents compilers work fine
|
|
* buggy compilers work also fine but only with -O0
|
|
*/
|
|
#if (defined(HAVE___INT128) && HAVE___INT128) || (defined(HAVE_INT128_T) && HAVE_INT128_T)
|
|
return (a.value != b.value);
|
|
#else
|
|
return 0;
|
|
#endif])],
|
|
[AC_MSG_RESULT([yes])],
|
|
[AC_MSG_RESULT([no])
|
|
cmpxchg16b_result=0],
|
|
[AC_MSG_RESULT([untested, assuming ok])])
|
|
fi
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_CMPXCHG16B], [$cmpxchg16b_result],
|
|
[Whether the processor supports the cmpxchg16b instruction])
|
|
OPAL_VAR_SCOPE_POP
|
|
])dnl
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_INLINE_GCC
|
|
dnl
|
|
dnl Check if the compiler is capable of doing GCC-style inline
|
|
dnl assembly. Some compilers emit a warning and ignore the inline
|
|
dnl assembly (xlc on OS X) and compile without error. Therefore,
|
|
dnl the test attempts to run the emited code to check that the
|
|
dnl assembly is actually run. To run this test, one argument to
|
|
dnl the macro must be an assembly instruction in gcc format to move
|
|
dnl the value 0 into the register containing the variable ret.
|
|
dnl For PowerPC, this would be:
|
|
dnl
|
|
dnl "li %0,0" : "=&r"(ret)
|
|
dnl
|
|
dnl For testing ia32 assembly, the assembly instruction xaddl is
|
|
dnl tested. The xaddl instruction is used by some of the atomic
|
|
dnl implementations so it makes sense to test for it. In addition,
|
|
dnl some compilers (i.e. earlier versions of Sun Studio 12) do not
|
|
dnl necessarily handle xaddl properly, so that needs to be detected
|
|
dnl during configure time.
|
|
dnl
|
|
dnl DEFINE OPAL_GCC_INLINE_ASSEMBLY to 0 or 1 depending on GCC
|
|
dnl support
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_INLINE_C_GCC],[
|
|
assembly="$1"
|
|
asm_result="unknown"
|
|
|
|
AC_MSG_CHECKING([if $CC supports GCC inline assembly])
|
|
|
|
if test ! "$assembly" = "" ; then
|
|
AC_RUN_IFELSE([AC_LANG_PROGRAM([AC_INCLUDES_DEFAULT],[[
|
|
int ret = 1;
|
|
int negone = -1;
|
|
__asm__ __volatile__ ($assembly);
|
|
return ret;
|
|
]])],
|
|
[asm_result="yes"], [asm_result="no"],
|
|
[asm_result="unknown"])
|
|
else
|
|
assembly="test skipped - assuming no"
|
|
fi
|
|
|
|
# if we're cross compiling, just try to compile and figure good enough
|
|
if test "$asm_result" = "unknown" ; then
|
|
AC_LINK_IFELSE([AC_LANG_PROGRAM([AC_INCLUDES_DEFAULT],[[
|
|
int ret = 1;
|
|
int negone = -1;
|
|
__asm__ __volatile__ ($assembly);
|
|
return ret;
|
|
]])],
|
|
[asm_result="yes"], [asm_result="no"])
|
|
fi
|
|
|
|
AC_MSG_RESULT([$asm_result])
|
|
|
|
if test "$asm_result" = "yes" ; then
|
|
OPAL_C_GCC_INLINE_ASSEMBLY=1
|
|
else
|
|
OPAL_C_GCC_INLINE_ASSEMBLY=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_C_GCC_INLINE_ASSEMBLY],
|
|
[$OPAL_C_GCC_INLINE_ASSEMBLY],
|
|
[Whether C compiler supports GCC style inline assembly])
|
|
|
|
unset OPAL_C_GCC_INLINE_ASSEMBLY assembly asm_result
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_INLINE_DEC
|
|
dnl
|
|
dnl DEFINE OPAL_DEC to 0 or 1 depending on DEC
|
|
dnl support
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_INLINE_C_DEC],[
|
|
|
|
AC_MSG_CHECKING([if $CC supports DEC inline assembly])
|
|
|
|
AC_LINK_IFELSE([AC_LANG_PROGRAM([
|
|
AC_INCLUDES_DEFAULT
|
|
#include <c_asm.h>],
|
|
[[asm("");
|
|
return 0;]])],
|
|
[asm_result="yes"], [asm_result="no"])
|
|
|
|
AC_MSG_RESULT([$asm_result])
|
|
|
|
if test "$asm_result" = "yes" ; then
|
|
OPAL_C_DEC_INLINE_ASSEMBLY=1
|
|
else
|
|
OPAL_C_DEC_INLINE_ASSEMBLY=0
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_C_DEC_INLINE_ASSEMBLY],
|
|
[$OPAL_C_DEC_INLINE_ASSEMBLY],
|
|
[Whether C compiler supports DEC style inline assembly])
|
|
|
|
unset OPAL_C_DEC_INLINE_ASSEMBLY asm_result
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CHECK_INLINE_XLC
|
|
dnl
|
|
dnl DEFINE OPAL_XLC to 0 or 1 depending on XLC
|
|
dnl support
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CHECK_INLINE_C_XLC],[
|
|
|
|
AC_MSG_CHECKING([if $CC supports XLC inline assembly])
|
|
|
|
OPAL_C_XLC_INLINE_ASSEMBLY=0
|
|
asm_result="no"
|
|
if test "$CC" = "xlc" ; then
|
|
OPAL_XLC_INLINE_ASSEMBLY=1
|
|
asm_result="yes"
|
|
fi
|
|
|
|
AC_MSG_RESULT([$asm_result])
|
|
AC_DEFINE_UNQUOTED([OPAL_C_XLC_INLINE_ASSEMBLY],
|
|
[$OPAL_C_XLC_INLINE_ASSEMBLY],
|
|
[Whether C compiler supports XLC style inline assembly])
|
|
|
|
unset OPAL_C_XLC_INLINE_ASSEMBLY
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_CONFIG_ASM
|
|
dnl
|
|
dnl DEFINE OPAL_ASSEMBLY_ARCH to something in sys/architecture.h
|
|
dnl DEFINE OPAL_ASSEMBLY_FORMAT to string containing correct
|
|
dnl format for assembly (not user friendly)
|
|
dnl SUBST OPAL_ASSEMBLY_FORMAT to string containing correct
|
|
dnl format for assembly (not user friendly)
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_CONFIG_ASM],[
|
|
AC_REQUIRE([OPAL_SETUP_CC])
|
|
AC_REQUIRE([AM_PROG_AS])
|
|
|
|
AC_ARG_ENABLE([builtin-atomics],
|
|
[AC_HELP_STRING([--enable-builtin-atomics],
|
|
[Enable use of __sync builtin atomics (default: enabled)])],
|
|
[], [enable_builtin_atomics="yes"])
|
|
|
|
opal_cv_asm_builtin="BUILTIN_NO"
|
|
if test "$opal_cv_asm_builtin" = "BUILTIN_NO" && test "$enable_builtin_atomics" = "yes" ; then
|
|
OPAL_CHECK_GCC_ATOMIC_BUILTINS([opal_cv_asm_builtin="BUILTIN_GCC"], [])
|
|
fi
|
|
if test "$opal_cv_asm_builtin" = "BUILTIN_NO" && test "$enable_builtin_atomics" = "yes" ; then
|
|
OPAL_CHECK_SYNC_BUILTINS([opal_cv_asm_builtin="BUILTIN_SYNC"], [])
|
|
fi
|
|
|
|
OPAL_CHECK_ASM_PROC
|
|
OPAL_CHECK_ASM_TEXT
|
|
OPAL_CHECK_ASM_GLOBAL
|
|
OPAL_CHECK_ASM_GNU_STACKEXEC
|
|
OPAL_CHECK_ASM_LABEL_SUFFIX
|
|
OPAL_CHECK_ASM_GSYM
|
|
OPAL_CHECK_ASM_LSYM
|
|
OPAL_CHECK_ASM_TYPE
|
|
OPAL_CHECK_ASM_SIZE
|
|
OPAL_CHECK_ASM_ALIGN_LOG
|
|
|
|
# find our architecture for purposes of assembly stuff
|
|
opal_cv_asm_arch="UNSUPPORTED"
|
|
OPAL_GCC_INLINE_ASSIGN=""
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
case "${host}" in
|
|
x86_64-*x32)
|
|
opal_cv_asm_arch="X86_64"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_GCC_INLINE_ASSIGN='"xaddl %1,%0" : "=m"(ret), "+r"(negone) : "m"(ret)'
|
|
;;
|
|
i?86-*|x86_64*|amd64*)
|
|
if test "$ac_cv_sizeof_long" = "4" ; then
|
|
opal_cv_asm_arch="IA32"
|
|
else
|
|
opal_cv_asm_arch="X86_64"
|
|
fi
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_GCC_INLINE_ASSIGN='"xaddl %1,%0" : "=m"(ret), "+r"(negone) : "m"(ret)'
|
|
OPAL_CHECK_CMPXCHG16B
|
|
;;
|
|
|
|
ia64-*)
|
|
opal_cv_asm_arch="IA64"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0=r0\n;;\n" : "=&r"(ret)'
|
|
;;
|
|
aarch64*)
|
|
opal_cv_asm_arch="ARM64"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_ASM_ARM_VERSION=8
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ARM_VERSION], [$OPAL_ASM_ARM_VERSION],
|
|
[What ARM assembly version to use])
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
armv7*|arm-*-linux-gnueabihf)
|
|
opal_cv_asm_arch="ARM"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_ASM_ARM_VERSION=7
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ARM_VERSION], [$OPAL_ASM_ARM_VERSION],
|
|
[What ARM assembly version to use])
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
armv6*)
|
|
opal_cv_asm_arch="ARM"
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
OPAL_ASM_ARM_VERSION=6
|
|
CCASFLAGS="$CCASFLAGS -march=armv7-a"
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ARM_VERSION], [$OPAL_ASM_ARM_VERSION],
|
|
[What ARM assembly version to use])
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
armv5*linux*|armv4*linux*|arm-*-linux-gnueabi)
|
|
# uses Linux kernel helpers for some atomic operations
|
|
opal_cv_asm_arch="ARM"
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
OPAL_ASM_ARM_VERSION=5
|
|
CCASFLAGS="$CCASFLAGS -march=armv7-a"
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_ARM_VERSION], [$OPAL_ASM_ARM_VERSION],
|
|
[What ARM assembly version to use])
|
|
OPAL_GCC_INLINE_ASSIGN='"mov %0, #0" : "=&r"(ret)'
|
|
;;
|
|
|
|
mips-*|mips64*)
|
|
# Should really find some way to make sure that we are on
|
|
# a MIPS III machine (r4000 and later)
|
|
opal_cv_asm_arch="MIPS"
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
OPAL_GCC_INLINE_ASSIGN='"or %0,[$]0,[$]0" : "=&r"(ret)'
|
|
;;
|
|
|
|
powerpc-*|powerpc64-*|powerpcle-*|powerpc64le-*|rs6000-*|ppc-*)
|
|
OPAL_CHECK_POWERPC_REG
|
|
if test "$ac_cv_sizeof_long" = "4" ; then
|
|
opal_cv_asm_arch="POWERPC32"
|
|
|
|
# Note that on some platforms (Apple G5), even if we are
|
|
# compiling in 32 bit mode (and therefore should assume
|
|
# sizeof(long) == 4), we can use the 64 bit test and set
|
|
# operations.
|
|
OPAL_CHECK_POWERPC_64BIT(OPAL_ASM_SUPPORT_64BIT=1)
|
|
elif test "$ac_cv_sizeof_long" = "8" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
opal_cv_asm_arch="POWERPC64"
|
|
else
|
|
AC_MSG_ERROR([Could not determine PowerPC word size: $ac_cv_sizeof_long])
|
|
fi
|
|
OPAL_GCC_INLINE_ASSIGN='"1: li %0,0" : "=&r"(ret)'
|
|
;;
|
|
# There is no current difference between s390 and s390x
|
|
# But use two different defines in case some come later
|
|
# as s390 is 31bits while s390x is 64bits
|
|
s390-*)
|
|
opal_cv_asm_arch="S390"
|
|
OPAL_CHECK_SYNC_BUILTINS([opal_cv_asm_builtin="BUILTIN_SYNC"],
|
|
[AC_MSG_ERROR([No atomic primitives available for $host])])
|
|
;;
|
|
s390x-*)
|
|
opal_cv_asm_arch="S390X"
|
|
OPAL_CHECK_SYNC_BUILTINS([opal_cv_asm_builtin="BUILTIN_SYNC"],
|
|
[AC_MSG_ERROR([No atomic primitives available for $host])])
|
|
;;
|
|
sparc*-*)
|
|
# SPARC v9 (and above) are the only ones with 64bit support
|
|
# if compiling 32 bit, see if we are v9 (aka v8plus) or
|
|
# earlier (casa is v8+/v9).
|
|
if test "$ac_cv_sizeof_long" = "4" ; then
|
|
have_v8plus=0
|
|
OPAL_CHECK_SPARCV8PLUS([have_v8plus=1])
|
|
if test "$have_v8plus" = "0" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=0
|
|
opal_cv_asm_arch="SPARC"
|
|
AC_MSG_WARN([Sparc v8 target is not supported in this release of Open MPI.])
|
|
AC_MSG_WARN([You must specify the target architecture v8plus to compile])
|
|
AC_MSG_WARN([Open MPI in 32 bit mode on Sparc processors (see the README).])
|
|
AC_MSG_ERROR([Can not continue.])
|
|
else
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
opal_cv_asm_arch="SPARCV9_32"
|
|
fi
|
|
|
|
elif test "$ac_cv_sizeof_long" = "8" ; then
|
|
OPAL_ASM_SUPPORT_64BIT=1
|
|
opal_cv_asm_arch="SPARCV9_64"
|
|
else
|
|
AC_MSG_ERROR([Could not determine Sparc word size: $ac_cv_sizeof_long])
|
|
fi
|
|
OPAL_GCC_INLINE_ASSIGN='"mov 0,%0" : "=&r"(ret)'
|
|
;;
|
|
|
|
*)
|
|
OPAL_CHECK_SYNC_BUILTINS([opal_cv_asm_builtin="BUILTIN_SYNC"],
|
|
[AC_MSG_ERROR([No atomic primitives available for $host])])
|
|
;;
|
|
esac
|
|
|
|
if test "x$OPAL_ASM_SUPPORT_64BIT" = "x1" && test "$opal_cv_asm_builtin" = "BUILTIN_SYNC" &&
|
|
test "$opal_asm_sync_have_64bit" = "0" ; then
|
|
# __sync builtins exist but do not implement 64-bit support. Fall back on inline asm.
|
|
opal_cv_asm_builtin="BUILTIN_NO"
|
|
fi
|
|
|
|
if test "$opal_cv_asm_builtin" = "BUILTIN_SYNC" || test "$opal_cv_asm_builtin" = "BUILTIN_GCC" ; then
|
|
AC_DEFINE([OPAL_C_GCC_INLINE_ASSEMBLY], [1],
|
|
[Whether C compiler supports GCC style inline assembly])
|
|
else
|
|
AC_DEFINE_UNQUOTED([OPAL_ASM_SUPPORT_64BIT],
|
|
[$OPAL_ASM_SUPPORT_64BIT],
|
|
[Whether we can do 64bit assembly operations or not. Should not be used outside of the assembly header files])
|
|
AC_SUBST([OPAL_ASM_SUPPORT_64BIT])
|
|
|
|
#
|
|
# figure out if we need any special function start / stop code
|
|
#
|
|
case $host_os in
|
|
aix*)
|
|
opal_asm_arch_config="aix"
|
|
;;
|
|
*)
|
|
opal_asm_arch_config="default"
|
|
;;
|
|
esac
|
|
|
|
# now that we know our architecture, try to inline assemble
|
|
OPAL_CHECK_INLINE_C_GCC([$OPAL_GCC_INLINE_ASSIGN])
|
|
OPAL_CHECK_INLINE_C_DEC
|
|
OPAL_CHECK_INLINE_C_XLC
|
|
|
|
# format:
|
|
# config_file-text-global-label_suffix-gsym-lsym-type-size-align_log-ppc_r_reg-64_bit-gnu_stack
|
|
asm_format="${opal_asm_arch_config}"
|
|
asm_format="${asm_format}-${opal_cv_asm_text}-${opal_cv_asm_global}"
|
|
asm_format="${asm_format}-${opal_cv_asm_label_suffix}-${opal_cv_asm_gsym}"
|
|
asm_format="${asm_format}-${opal_cv_asm_lsym}"
|
|
asm_format="${asm_format}-${opal_cv_asm_type}-${opal_asm_size}"
|
|
asm_format="${asm_format}-${opal_asm_align_log_result}"
|
|
if test "$opal_cv_asm_arch" = "POWERPC32" || test "$opal_cv_asm_arch" = "POWERPC64" ; then
|
|
asm_format="${asm_format}-${opal_cv_asm_powerpc_r_reg}"
|
|
else
|
|
asm_format="${asm_format}-1"
|
|
fi
|
|
asm_format="${asm_format}-${OPAL_ASM_SUPPORT_64BIT}"
|
|
opal_cv_asm_format="${asm_format}-${opal_cv_asm_gnu_stack}"
|
|
# For the Makefile, need to escape the $ as $$. Don't display
|
|
# this version, but make sure the Makefile gives the right thing
|
|
# when regenerating the files because the base has been touched.
|
|
OPAL_ASSEMBLY_FORMAT=`echo "$opal_cv_asm_format" | sed -e 's/\\\$/\\\$\\\$/'`
|
|
|
|
AC_MSG_CHECKING([for assembly format])
|
|
AC_MSG_RESULT([$opal_cv_asm_format])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_FORMAT], ["$OPAL_ASSEMBLY_FORMAT"],
|
|
[Format of assembly file])
|
|
AC_SUBST([OPAL_ASSEMBLY_FORMAT])
|
|
fi # if opal_cv_asm_builtin = BUILTIN_SYNC
|
|
|
|
result="OPAL_$opal_cv_asm_arch"
|
|
OPAL_ASSEMBLY_ARCH="$opal_cv_asm_arch"
|
|
AC_MSG_CHECKING([for assembly architecture])
|
|
AC_MSG_RESULT([$opal_cv_asm_arch])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_ARCH], [$result],
|
|
[Architecture type of assembly to use for atomic operations and CMA])
|
|
AC_SUBST([OPAL_ASSEMBLY_ARCH])
|
|
|
|
# Check for RDTSCP support
|
|
result=0
|
|
AS_IF([test "$opal_cv_asm_arch" = "OPAL_X86_64" || test "$opal_cv_asm_arch" = "OPAL_IA32"],
|
|
[AC_MSG_CHECKING([for RDTSCP assembly support])
|
|
AC_LANG_PUSH([C])
|
|
AC_TRY_RUN([[
|
|
int main(int argc, char* argv[])
|
|
{
|
|
unsigned int rax, rdx;
|
|
__asm__ __volatile__ ("rdtscp\n": "=a" (rax), "=d" (rdx):: "%rax", "%rdx");
|
|
return 0;
|
|
}
|
|
]],
|
|
[result=1
|
|
AC_MSG_RESULT([yes])],
|
|
[AC_MSG_RESULT([no])],
|
|
[#cross compile not supported
|
|
AC_MSG_RESULT(["no (cross compiling)"])])
|
|
AC_LANG_POP([C])])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_SUPPORTS_RDTSCP], [$result],
|
|
[Whether we have support for RDTSCP instruction])
|
|
|
|
result="OPAL_$opal_cv_asm_builtin"
|
|
OPAL_ASSEMBLY_BUILTIN="$opal_cv_asm_builtin"
|
|
AC_MSG_CHECKING([for builtin atomics])
|
|
AC_MSG_RESULT([$opal_cv_asm_builtin])
|
|
AC_DEFINE_UNQUOTED([OPAL_ASSEMBLY_BUILTIN], [$result],
|
|
[Whether to use builtin atomics])
|
|
AC_SUBST([OPAL_ASSEMBLY_BUILTIN])
|
|
|
|
OPAL_ASM_FIND_FILE
|
|
|
|
unset result asm_format
|
|
])dnl
|
|
|
|
|
|
dnl #################################################################
|
|
dnl
|
|
dnl OPAL_ASM_FIND_FILE
|
|
dnl
|
|
dnl
|
|
dnl do all the evil mojo to provide a working assembly file
|
|
dnl
|
|
dnl #################################################################
|
|
AC_DEFUN([OPAL_ASM_FIND_FILE], [
|
|
AC_REQUIRE([AC_PROG_GREP])
|
|
AC_REQUIRE([AC_PROG_FGREP])
|
|
|
|
if test "$opal_cv_asm_arch" != "WINDOWS" && test "$opal_cv_asm_builtin" != "BUILTIN_SYNC" && test "$opal_cv_asm_builtin" != "BUILTIN_GCC" && test "$opal_cv_asm_builtin" != "BUILTIN_OSX" ; then
|
|
# see if we have a pre-built one already
|
|
AC_MSG_CHECKING([for pre-built assembly file])
|
|
opal_cv_asm_file=""
|
|
if $GREP "$opal_cv_asm_arch" "${OPAL_TOP_SRCDIR}/opal/asm/asm-data.txt" | $FGREP "$opal_cv_asm_format" >conftest.out 2>&1 ; then
|
|
opal_cv_asm_file="`cut -f3 conftest.out`"
|
|
if test ! "$opal_cv_asm_file" = "" ; then
|
|
opal_cv_asm_file="atomic-${opal_cv_asm_file}.s"
|
|
if test -f "${OPAL_TOP_SRCDIR}/opal/asm/generated/${opal_cv_asm_file}" ; then
|
|
AC_MSG_RESULT([yes ($opal_cv_asm_file)])
|
|
else
|
|
AC_MSG_RESULT([no ($opal_cv_asm_file not found)])
|
|
opal_cv_asm_file=""
|
|
fi
|
|
fi
|
|
else
|
|
AC_MSG_RESULT([no (not in asm-data)])
|
|
fi
|
|
rm -rf conftest.*
|
|
|
|
if test "$opal_cv_asm_file" = "" ; then
|
|
# Can we generate a file?
|
|
AC_MSG_CHECKING([whether possible to generate assembly file])
|
|
mkdir -p opal/asm/generated
|
|
opal_cv_asm_file="atomic-local.s"
|
|
opal_try='$PERL $OPAL_TOP_SRCDIR/opal/asm/generate-asm.pl $opal_cv_asm_arch "$opal_cv_asm_format" $OPAL_TOP_SRCDIR/opal/asm/base $OPAL_TOP_BUILDDIR/opal/asm/generated/$opal_cv_asm_file >conftest.out 2>&1'
|
|
if AC_TRY_EVAL(opal_try) ; then
|
|
# save the warnings
|
|
cat conftest.out >&AC_FD_CC
|
|
AC_MSG_RESULT([yes])
|
|
else
|
|
# save output
|
|
cat conftest.out >&AC_FD_CC
|
|
opal_cv_asm_file=""
|
|
AC_MSG_RESULT([failed])
|
|
AC_MSG_WARN([Could not build atomic operations assembly file.])
|
|
AC_MSG_WARN([There will be no atomic operations for this build.])
|
|
fi
|
|
fi
|
|
rm -rf conftest.*
|
|
else
|
|
# On windows with VC++, atomics are done with compiler primitives
|
|
opal_cv_asm_file=""
|
|
fi
|
|
|
|
AC_MSG_CHECKING([for atomic assembly filename])
|
|
if test "$opal_cv_asm_file" = "" ; then
|
|
AC_MSG_RESULT([none])
|
|
result=0
|
|
else
|
|
AC_MSG_RESULT([$opal_cv_asm_file])
|
|
result=1
|
|
fi
|
|
|
|
AC_DEFINE_UNQUOTED([OPAL_HAVE_ASM_FILE], [$result],
|
|
[Whether there is an atomic assembly file available])
|
|
AM_CONDITIONAL([OPAL_HAVE_ASM_FILE], [test "$result" = "1"])
|
|
|
|
OPAL_ASM_FILE=$opal_cv_asm_file
|
|
AC_SUBST(OPAL_ASM_FILE)
|
|
])dnl
|