S390: Do not set FE_INEXACT with feraiseexcept (FE_OWERFLOW|FE_UNDERFLOW).

On s390 feraiseexcept (FE_OVERFLOW|FE_UNDERFLOW) sets FE_INEXACT, too.
This patch uses z196 zarch load rounded instruction which can suppress
FE_INEXACT exception if gcc has z196 support in used configuration.
Otherwise FE_INEXACT flag is set as before. The gcc support is tested
in a new configure-check.

A comment in fsetexcptflg.c is corrected as new exceptions are not
executed with the next floating-point instruction if fpc is set with
_FPU_SETCW macro. It seems the comment was copied e.g. from
sysdeps/x86_64/fpu/fsetexcptflg.c file.

ChangeLog:

	* config.h.in (HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT):
	New undefine.
	* sysdeps/s390/configure.ac: Add test for z196 zarch support.
	* sysdeps/s390/configure: Regenerated.
	* sysdeps/s390/fpu/fraiseexcpt.c (__feraiseexcept): Use ledbra
	instruction for raising over-/underflow if z196 zarch is supported
	by default.
	* sysdeps/s390/fpu/fsetexcptflg.c (fesetexceptflag):
	Correct comment.
This commit is contained in:
Stefan Liebler 2016-08-31 14:54:55 +02:00
parent aaf3045480
commit e9b424881a
6 changed files with 113 additions and 6 deletions

View File

@ -1,3 +1,13 @@
2016-08-31 Stefan Liebler <stli@linux.vnet.ibm.com>
* config.h.in (HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT): New undefine.
* sysdeps/s390/configure.ac: Add test for z196 zarch support.
* sysdeps/s390/configure: Regenerated.
* sysdeps/s390/fpu/fraiseexcpt.c (__feraiseexcept): Use ledbra
instruction for raising over-/underflow if z196 zarch is supported
by default.
* sysdeps/s390/fpu/fsetexcptflg.c (fesetexceptflag): Correct comment.
2016-08-30 Svante Signell <svante.signell@gmail.com> 2016-08-30 Svante Signell <svante.signell@gmail.com>
* sysdeps/mach/hurd/adjtime.c (__adjtime): When OLDDELTA is NULL, make * sysdeps/mach/hurd/adjtime.c (__adjtime): When OLDDELTA is NULL, make

View File

@ -70,6 +70,9 @@
/* Define if assembler supports AVX512DQ. */ /* Define if assembler supports AVX512DQ. */
#undef HAVE_AVX512DQ_ASM_SUPPORT #undef HAVE_AVX512DQ_ASM_SUPPORT
/* Define if assembler supports z196 zarch instructions as default on S390. */
#undef HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT
/* Define if assembler supports vector instructions on S390. */ /* Define if assembler supports vector instructions on S390. */
#undef HAVE_S390_VX_ASM_SUPPORT #undef HAVE_S390_VX_ASM_SUPPORT

View File

@ -177,5 +177,41 @@ then
fi fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for S390 z196 zarch instruction support as default" >&5
$as_echo_n "checking for S390 z196 zarch instruction support as default... " >&6; }
if ${libc_cv_asm_s390_min_z196_zarch+:} false; then :
$as_echo_n "(cached) " >&6
else
cat > conftest.c <<\EOF
float testinsn (double e)
{
float d;
__asm__ ("ledbra %0,5,%1,4" : "=f" (d) : "f" (e) );
return d;
}
EOF
if { ac_try='${CC-cc} $CFLAGS $CPPFLAGS $LDFLAGS --shared conftest.c
-o conftest.o &> /dev/null'
{ { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
(eval $ac_try) 2>&5
ac_status=$?
$as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
test $ac_status = 0; }; } ;
then
libc_cv_asm_s390_min_z196_zarch=yes
else
libc_cv_asm_s390_min_z196_zarch=no
fi
rm -f conftest*
fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_asm_s390_min_z196_zarch" >&5
$as_echo "$libc_cv_asm_s390_min_z196_zarch" >&6; }
if test "$libc_cv_asm_s390_min_z196_zarch" = yes ;
then
$as_echo "#define HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT 1" >>confdefs.h
fi
test -n "$critic_missing" && as_fn_error $? " test -n "$critic_missing" && as_fn_error $? "
*** $critic_missing" "$LINENO" 5 *** $critic_missing" "$LINENO" 5

View File

@ -86,5 +86,31 @@ then
AC_DEFINE(HAVE_S390_VX_GCC_SUPPORT) AC_DEFINE(HAVE_S390_VX_GCC_SUPPORT)
fi fi
AC_CACHE_CHECK(for S390 z196 zarch instruction support as default,
libc_cv_asm_s390_min_z196_zarch, [dnl
cat > conftest.c <<\EOF
float testinsn (double e)
{
float d;
__asm__ ("ledbra %0,5,%1,4" : "=f" (d) : "f" (e) );
return d;
}
EOF
dnl
dnl test, if assembler supports S390 z196 zarch instructions as default
if AC_TRY_COMMAND([${CC-cc} $CFLAGS $CPPFLAGS $LDFLAGS --shared conftest.c
-o conftest.o &> /dev/null]) ;
then
libc_cv_asm_s390_min_z196_zarch=yes
else
libc_cv_asm_s390_min_z196_zarch=no
fi
rm -f conftest* ])
if test "$libc_cv_asm_s390_min_z196_zarch" = yes ;
then
AC_DEFINE(HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT)
fi
test -n "$critic_missing" && AC_MSG_ERROR([ test -n "$critic_missing" && AC_MSG_ERROR([
*** $critic_missing]) *** $critic_missing])

View File

@ -35,6 +35,23 @@ fexceptadd (float d, float e)
__asm__ __volatile__ ("aebr %0,%1" : : "f" (d), "f" (e) ); __asm__ __volatile__ ("aebr %0,%1" : : "f" (d), "f" (e) );
} }
#ifdef HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT
static __inline__ void
fexceptround (double e)
{
float d;
/* Load rounded from double to float with M3 = round toward 0, M4 = Suppress
IEEE-inexact exception.
In case of e=0x1p128 and the overflow-mask bit is zero, only the
IEEE-overflow flag is set. If overflow-mask bit is one, DXC field is set to
0x20 "IEEE overflow, exact".
In case of e=0x1p-150 and the underflow-mask bit is zero, only the
IEEE-underflow flag is set. If underflow-mask bit is one, DXC field is set
to 0x10 "IEEE underflow, exact".
This instruction is available with a zarch machine >= z196. */
__asm__ __volatile__ ("ledbra %0,5,%1,4" : "=f" (d) : "f" (e) );
}
#endif
int int
__feraiseexcept (int excepts) __feraiseexcept (int excepts)
@ -54,13 +71,29 @@ __feraiseexcept (int excepts)
/* Next: overflow. */ /* Next: overflow. */
if (FE_OVERFLOW & excepts) if (FE_OVERFLOW & excepts)
/* I don't think we can do the same trick as intel so we will have {
to live with inexact coming also. */ #ifdef HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT
fexceptadd (FLT_MAX, 1.0e32); fexceptround (0x1p128);
#else
/* If overflow-mask bit is zero, both IEEE-overflow and IEEE-inexact flags
are set. If overflow-mask bit is one, DXC field is set to 0x2C "IEEE
overflow, inexact and incremented". */
fexceptadd (FLT_MAX, 1.0e32);
#endif
}
/* Next: underflow. */ /* Next: underflow. */
if (FE_UNDERFLOW & excepts) if (FE_UNDERFLOW & excepts)
fexceptdiv (FLT_MIN, 3.0); {
#ifdef HAVE_S390_MIN_Z196_ZARCH_ASM_SUPPORT
fexceptround (0x1p-150);
#else
/* If underflow-mask bit is zero, both IEEE-underflow and IEEE-inexact
flags are set. If underflow-mask bit is one, DXC field is set to 0x1C
"IEEE underflow, inexact and incremented". */
fexceptdiv (FLT_MIN, 3.0);
#endif
}
/* Last: inexact. */ /* Last: inexact. */
if (FE_INEXACT & excepts) if (FE_INEXACT & excepts)

View File

@ -45,8 +45,7 @@ fesetexceptflag (const fexcept_t *flagp, int excepts)
& newexcepts; & newexcepts;
/* Store the new status word (along with the rest of the environment. /* Store the new status word (along with the rest of the environment.
Possibly new exceptions are set but they won't get executed unless Possibly new exceptions are set but they won't get executed. */
the next floating-point instruction. */
_FPU_SETCW (temp); _FPU_SETCW (temp);
/* Success. */ /* Success. */