/* Functions for tracking which floating-point exceptions have occurred.
Copyright (C) 1997-2024 Free Software Foundation, Inc.
This file is free software: you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as
published by the Free Software Foundation; either version 2.1 of the
License, or (at your option) any later version.
This file is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public License
along with this program. If not, see . */
/* Based on glibc/sysdeps//{fclrexcpt.c,fraiseexcpt.c,ftestexcept.c}
together with glibc/sysdeps//{fpu_control.h,fenv_private.h,fenv_libc.h}. */
#include
/* Specification. */
#include
#include "fenv-private.h"
_GL_UNUSED static void
generic_feraiseexcept (int exceptions)
{
/* First: invalid exception. */
if (exceptions & FE_INVALID)
{
double volatile a;
_GL_UNUSED double volatile b;
a = 0; b = a / a;
}
/* Next: division by zero. */
if (exceptions & FE_DIVBYZERO)
{
double volatile a, b;
_GL_UNUSED double volatile c;
a = 1; b = 0; c = a / b;
}
/* Next: overflow. */
if (exceptions & FE_OVERFLOW)
{
double volatile a;
_GL_UNUSED double volatile b;
a = 1e200; b = a * a;
}
/* Next: underflow. */
if (exceptions & FE_UNDERFLOW)
{
double volatile a;
_GL_UNUSED double volatile b;
a = 1e-200; b = a * a;
}
/* Last: inexact. */
if (exceptions & FE_INEXACT)
{
double volatile a, b;
_GL_UNUSED double volatile c;
a = 1; b = 3; c = a / b;
}
}
#if defined __GNUC__ || defined __clang__ || defined _MSC_VER
# if (defined __x86_64__ || defined _M_X64) || (defined __i386 || defined _M_IX86)
int
feraiseexcept (int exceptions)
{
# if defined _MSC_VER
/* Setting the exception flags only in the SSE unit (i.e. in the mxcsr
register) would not cause the hardware to trap on the exception. */
generic_feraiseexcept (exceptions);
# else
exceptions &= FE_ALL_EXCEPT;
if ((exceptions & ~(FE_INVALID | FE_DIVBYZERO)) == 0)
{
/* Like generic_feraiseexcept (exceptions). */
/* This code is probably faster than the general code below. */
/* First: invalid exception. */
if (exceptions & FE_INVALID)
{
double volatile a;
_GL_UNUSED double volatile b;
a = 0; b = a / a;
}
/* Next: division by zero. */
if (exceptions & FE_DIVBYZERO)
{
double volatile a, b;
_GL_UNUSED double volatile c;
a = 1; b = 0; c = a / b;
}
}
else
{
/* The general case. */
/* Set the bits in the 387 unit. */
x86_387_fenv_t env;
__asm__ __volatile__ ("fnstenv %0" : "=m" (*&env));
/* Note: fnstenv masks all floating-point exceptions until the fldenv
below. */
env.__status_word |= exceptions;
__asm__ __volatile__ ("fldenv %0" : : "m" (*&env));
/* A trap (if enabled) is triggered only at the next floating-point
instruction. Force it to occur here. */
__asm__ __volatile__ ("fwait");
}
# endif
return 0;
}
# elif defined __aarch64__ /* arm64 */
int
feraiseexcept (int exceptions)
{
# if 0
/* This would just set the flag bits and make fetestexcept() work as expected.
But it would not cause the hardware to trap on the exception. */
exceptions &= FE_ALL_EXCEPT;
unsigned long fpsr, orig_fpsr;
_FPU_GETFPSR (orig_fpsr);
fpsr = orig_fpsr | exceptions;
if (fpsr != orig_fpsr)
_FPU_SETFPSR (fpsr);
# else
/* This is how glibc does it.
The drawback is that when FE_OVERFLOW is raised, FE_INEXACT is raised
with it. */
generic_feraiseexcept (exceptions);
# endif
return 0;
}
# elif defined __arm__
int
feraiseexcept (int exceptions)
{
# ifdef __SOFTFP__
exceptions &= FE_ALL_EXCEPT;
if (exceptions != 0)
return -1;
# else
/* Raise exceptions represented by EXCEPTIONS. But we must raise only
one signal at a time. It is important that if the overflow/underflow
exception and the inexact exception are given at the same time,
the overflow/underflow exception follows the inexact exception. After
each exception we read from the fpscr, to force the exception to be
raised immediately. */
/* XXX Probably this should do actual floating-point operations, like in
generic_feraiseexcept, not just setting flag bits in the fpscr. */
unsigned int fpscr, orig_fpscr;
/* First: invalid exception. */
if (exceptions & FE_INVALID)
{
_FPU_GETCW (orig_fpscr);
fpscr = orig_fpscr | FE_INVALID;
if (fpscr != orig_fpscr)
{
_FPU_SETCW (fpscr);
_FPU_GETCW (fpscr);
}
}
/* Next: division by zero. */
if (exceptions & FE_DIVBYZERO)
{
_FPU_GETCW (orig_fpscr);
fpscr = orig_fpscr | FE_DIVBYZERO;
if (fpscr != orig_fpscr)
{
_FPU_SETCW (fpscr);
_FPU_GETCW (fpscr);
}
}
/* Next: overflow. */
if (exceptions & FE_OVERFLOW)
{
_FPU_GETCW (orig_fpscr);
fpscr = orig_fpscr | FE_OVERFLOW;
if (fpscr != orig_fpscr)
{
_FPU_SETCW (fpscr);
_FPU_GETCW (fpscr);
}
}
/* Next: underflow. */
if (exceptions & FE_UNDERFLOW)
{
_FPU_GETCW (orig_fpscr);
fpscr = orig_fpscr | FE_UNDERFLOW;
if (fpscr != orig_fpscr)
{
_FPU_SETCW (fpscr);
_FPU_GETCW (fpscr);
}
}
/* Last: inexact. */
if (exceptions & FE_INEXACT)
{
_FPU_GETCW (orig_fpscr);
fpscr = orig_fpscr | FE_INEXACT;
if (fpscr != orig_fpscr)
{
_FPU_SETCW (fpscr);
_FPU_GETCW (fpscr);
}
}
# endif
return 0;
}
# elif defined __alpha
/* Prefer the Linux system call when available.
See glibc/sysdeps/unix/sysv/linux/alpha/fraiseexcpt.S */
# if !defined __linux__
int
feraiseexcept (int exceptions)
{
/* This implementation cannot raise FE_INEXACT. */
generic_feraiseexcept (exceptions);
return 0;
}
# endif
# elif defined __hppa
int
feraiseexcept (int exceptions)
{
generic_feraiseexcept (exceptions);
return 0;
}
# elif defined __ia64__
int
feraiseexcept (int exceptions)
{
/* Raise exceptions represented by EXCEPTIONS. But we must raise only
one signal at a time. It is important that if the overflow/underflow
exception and the inexact exception are given at the same time,
the overflow/underflow exception precedes the inexact exception. */
generic_feraiseexcept (exceptions);
return 0;
}
# elif defined __m68k__
int
feraiseexcept (int exceptions)
{
generic_feraiseexcept (exceptions);
return 0;
}
# elif defined __mips__
int
feraiseexcept (int exceptions)
{
exceptions &= FE_ALL_EXCEPT;
/* Set also the cause bits. The setting of the cause bits is what actually
causes the hardware to trap on the exception, if the corresponding enable
bit is set as well. */
unsigned int fcsr, orig_fcsr;
_FPU_GETCW (orig_fcsr);
fcsr = orig_fcsr | ((exceptions << 10) | exceptions);
if (fcsr != orig_fcsr)
_FPU_SETCW (fcsr);
return 0;
}
# elif defined __loongarch__
int
feraiseexcept (int exceptions)
{
# if 0
/* This would just set the flag bits and make fetestexcept() work as expected.
But it would not cause the hardware to trap on the exception. */
exceptions &= FE_ALL_EXCEPT;
/* Set also the cause bits. The setting of the cause bits is what actually
causes the hardware to trap on the exception, if the corresponding enable
bit is set as well. */
unsigned int fcsr, orig_fcsr;
_FPU_GETCW (orig_fcsr);
fcsr = orig_fcsr | ((exceptions << 8) | exceptions);
if (fcsr != orig_fcsr)
_FPU_SETCW (fcsr);
# else
/* This is how glibc does it.
The drawback is that when FE_OVERFLOW is raised, FE_INEXACT is raised
with it. */
generic_feraiseexcept (exceptions);
# endif
return 0;
}
# elif defined __powerpc__
int
feraiseexcept (int exceptions)
{
exceptions &= FE_ALL_EXCEPT;
union { unsigned long long u; double f; } memenv, orig_memenv;
_FPU_GETCW_AS_DOUBLE (memenv.f);
orig_memenv = memenv;
/* Instead of setting FE_INVALID (= bit 29), we need to set one of the
individual bits: bit 10 or, if that does not work, bit 24. */
memenv.u |= (exceptions & FE_INVALID
? (exceptions & ~FE_INVALID) | (1U << 10)
: exceptions);
if (!(memenv.u == orig_memenv.u))
{
_FPU_SETCW_AS_DOUBLE (memenv.f);
if (exceptions & FE_INVALID)
{
/* Did it work? */
_FPU_GETCW_AS_DOUBLE (memenv.f);
if ((memenv.u & FE_INVALID) == 0)
{
memenv.u |= (1U << 24);
_FPU_SETCW_AS_DOUBLE (memenv.f);
}
}
}
return 0;
}
# elif defined __riscv
int
feraiseexcept (int exceptions)
{
exceptions &= FE_ALL_EXCEPT;
__asm__ __volatile__ ("csrs fflags, %0" : : "r" (exceptions));
return 0;
}
# elif defined __s390__ || defined __s390x__
int
feraiseexcept (int exceptions)
{
generic_feraiseexcept (exceptions);
return 0;
}
# elif defined __sh__
int
feraiseexcept (int exceptions)
{
# if 0
/* This would just set the flag bits and make fetestexcept() work as expected.
But it would not cause the hardware to trap on the exception. */
exceptions &= FE_ALL_EXCEPT;
unsigned int fpscr, orig_fpscr;
_FPU_GETCW (orig_fpscr);
fpscr = orig_fpscr | exceptions;
if (fpscr != orig_fpscr)
_FPU_SETCW (fpscr);
# else
/* This is how glibc does it.
The drawback is that when FE_OVERFLOW is raised, FE_INEXACT is raised
with it. */
generic_feraiseexcept (exceptions);
# endif
return 0;
}
# elif defined __sparc
int
feraiseexcept (int exceptions)
{
# if 0
/* This would just set the flag bits and make fetestexcept() work as expected.
But it would not cause the hardware to trap on the exception. */
exceptions &= FE_ALL_EXCEPT;
unsigned long fsr, orig_fsr;
_FPU_GETCW (orig_fsr);
# if FE_INEXACT == 32 /* glibc compatible FE_* values */
fsr = orig_fsr | exceptions;
# else /* Solaris compatible FE_* values */
fsr = orig_fsr | (exceptions << 5);
# endif
if (fsr != orig_fsr)
_FPU_SETCW (fsr);
# else
/* This is how glibc does it.
The drawback is that when FE_OVERFLOW is raised, FE_INEXACT is raised
with it. */
generic_feraiseexcept (exceptions);
# endif
return 0;
}
# else
# if defined __GNUC__ || defined __clang__
# warning "Unknown CPU / architecture. Please report your platform and compiler to ."
# endif
# define NEED_FALLBACK 1
# endif
#else
/* The compiler does not support __asm__ statements or equivalent
intrinsics. */
# define NEED_FALLBACK 1
#endif
#if NEED_FALLBACK
/* A fallback that should work everywhere. */
int
feraiseexcept (int exceptions)
{
generic_feraiseexcept (exceptions);
return 0;
}
#endif