newlib-cygwin/newlib/libm/math/ef_exp.c

/* ef_exp.c -- float version of e_exp.c.
 * Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com.
 */

/*
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice 
 * is preserved.
 * ====================================================
 */

#include "fdlibm.h"
#include "math_config.h"

#if __OBSOLETE_MATH
/* When __v810__ is defined, `const' is defined away for the rest of the file. */
#ifdef __v810__
#define const
#endif

/*
 * Storage class and qualifiers shared by every table below: the tables are
 * const-qualified only when compiling as standard C.
 */
#ifdef __STDC__
#define EXPF_TABLE static const float
#else
#define EXPF_TABLE static float
#endif

EXPF_TABLE one      = 1.0;
EXPF_TABLE halF[2]  = { 0.5, -0.5, };		/* +-1/2, indexed by sign bit */
EXPF_TABLE huge     = 1.0e+30;
EXPF_TABLE twom100  = 7.8886090522e-31;		/* 2**-100=0x0d800000 */

/* ln2 split into a high and a low part; index 1 holds the negated value. */
EXPF_TABLE ln2HI[2] = {
	 6.9313812256e-01,			/* 0x3f317180 */
	-6.9313812256e-01,			/* 0xbf317180 */
};
EXPF_TABLE ln2LO[2] = {
	 9.0580006145e-06,			/* 0x3717f7d1 */
	-9.0580006145e-06,			/* 0xb717f7d1 */
};
EXPF_TABLE invln2   =  1.4426950216e+00;	/* 0x3fb8aa3b */

/* Coefficients of the polynomial evaluated on the reduced argument. */
EXPF_TABLE P1 =  1.6666667163e-01;		/* 0x3e2aaaab */
EXPF_TABLE P2 = -2.7777778450e-03;		/* 0xbb360b61 */
EXPF_TABLE P3 =  6.6137559770e-05;		/* 0x388ab355 */
EXPF_TABLE P4 = -1.6533901999e-06;		/* 0xb5ddea0e */
EXPF_TABLE P5 =  4.1381369442e-08;		/* 0x3331bb4c */

#undef EXPF_TABLE

#ifdef __STDC__
	float __ieee754_expf(float x)	/* default IEEE double exp */
#else
	float __ieee754_expf(x)	/* default IEEE double exp */
	float x;
#endif
{
	float y,hi,lo,c,t;
	__int32_t k = 0,xsb,sx;
	__uint32_t hx;

	GET_FLOAT_WORD(sx,x);
	xsb = (sx>>31)&1;		/* sign bit of x */
	hx = sx & 0x7fffffff;		/* high word of |x| */

    /* filter out non-finite argument */
        if(FLT_UWORD_IS_NAN(hx))
            return x+x;	 	/* NaN */
        if(FLT_UWORD_IS_INFINITE(hx))
	    return (xsb==0)? x:0.0;		/* exp(+-inf)={inf,0} */
	if(sx > FLT_UWORD_LOG_MAX)
	    return __math_oflowf(0); /* overflow */
	if(sx < 0 && hx > FLT_UWORD_LOG_MIN)
	    return __math_uflowf(0); /* underflow */
	
    /* argument reduction */
	if(hx > 0x3eb17218) {		/* if  |x| > 0.5 ln2 */ 
	    if(hx < 0x3F851592) {	/* and |x| < 1.5 ln2 */
		hi = x-ln2HI[xsb]; lo=ln2LO[xsb]; k = 1-xsb-xsb;
	    } else {
		k  = invln2*x+halF[xsb];
		t  = k;
		hi = x - t*ln2HI[0];	/* t*ln2HI is exact here */
		lo = t*ln2LO[0];
	    }
	    x  = hi - lo;
	} 
	else if(hx < 0x34000000)  {	/* when |x|<2**-23 */
	    if(huge+x>one) return one+x;/* trigger inexact */
	}

    /* x is now in primary range */
	t  = x*x;
	c  = x - t*(P1+t*(P2+t*(P3+t*(P4+t*P5))));
	if(k==0) 	return one-((x*c)/(c-(float)2.0)-x); 
	else 		y = one-((lo-(x*c)/((float)2.0-c))-hi);
	if(k >= -125) {
	    __uint32_t hy;
	    GET_FLOAT_WORD(hy,y);
	    SET_FLOAT_WORD(y,hy+(k<<23));	/* add k to y's exponent */
	    return y;
	} else {
	    __uint32_t hy;
	    GET_FLOAT_WORD(hy,y);
	    SET_FLOAT_WORD(y,hy+((k+100)<<23));	/* add k to y's exponent */
	    return y*twom100;
	}
}
#endif /* __OBSOLETE_MATH */
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00			`/* ef_exp.c -- float version of e_exp.c.`
			`* Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com.`
			`*/`

			`/*`
			`* ====================================================`
			`* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.`
			`*`
			`* Developed at SunPro, a Sun Microsystems, Inc. business.`
			`* Permission to use, copy, modify, and distribute this`
			`* software is freely granted, provided that this notice`
			`* is preserved.`
			`* ====================================================`
			`*/`

			`#include "fdlibm.h"`
libm/math: Use __math_xflow in obsolete math code [v2] C compilers may fold const values at compile time, so expressions which try to elicit underflow/overflow by performing simple arithemetic on suitable values will not generate the required exceptions. Work around this by replacing code which does these arithmetic operations with calls to the existing __math_xflow functions that are designed to do this correctly. Signed-off-by: Keith Packard <keithp@keithp.com> ---- v2: libm/math: Pass sign to __math_xflow instead of muliplying result 2020-07-30 16:41:05 -07:00			`#include "math_config.h"`
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00
New expf, exp2f, logf, log2f and powf implementations Based on code from https://github.com/ARM-software/optimized-routines/ This patch adds a highly optimized generic implementation of expf, exp2f, logf, log2f and powf. The new functions are not only faster (6x for powf!), but are also smaller and more accurate. In order to achieve this, the algorithm uses double precision arithmetic for accuracy, avoids divisions and uses small table lookups to minimize the polynomials. Special cases are handled inline to avoid the unnecessary overhead of wrapper functions and set errno to POSIX requirements. The new functions are added under newlib/libm/common, but the old implementations are kept (in newlib/libm/math) for non-IEEE or pre-C99 systems. Targets can enable the new math code by defining __OBSOLETE_MATH_DEFAULT to 0 in newlib/libc/include/machine/ieeefp.h, users can override the default by defining __OBSOLETE_MATH. Currently the new code is enabled for AArch64 and AArch32 with VFP. Targets with a single precision FPU may still prefer the old implementation. libm.a size changes: arm: -1692 arm/thumb/v7-a/nofp: -878 arm/thumb/v7-a+fp/hard: -864 arm/thumb/v7-a+fp/softfp: -908 aarch64: -1476 2017-05-25 16:41:38 +01:00			`#if __OBSOLETE_MATH`
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00			`#ifdef __v810__`
			`#define const`
			`#endif`

			`#ifdef __STDC__`
			`static const float`
			`#else`
			`static float`
			`#endif`
			`one = 1.0,`
			`halF[2] = {0.5,-0.5,},`
			`huge = 1.0e+30,`
			`twom100 = 7.8886090522e-31, /* 2**-100=0x0d800000 */`
			`ln2HI[2] ={ 6.9313812256e-01, /* 0x3f317180 */`
			`-6.9313812256e-01,}, /* 0xbf317180 */`
			`ln2LO[2] ={ 9.0580006145e-06, /* 0x3717f7d1 */`
			`-9.0580006145e-06,}, /* 0xb717f7d1 */`
			`invln2 = 1.4426950216e+00, /* 0x3fb8aa3b */`
			`P1 = 1.6666667163e-01, /* 0x3e2aaaab */`
			`P2 = -2.7777778450e-03, /* 0xbb360b61 */`
			`P3 = 6.6137559770e-05, /* 0x388ab355 */`
			`P4 = -1.6533901999e-06, /* 0xb5ddea0e */`
			`P5 = 4.1381369442e-08; /* 0x3331bb4c */`

			`#ifdef __STDC__`
			`float __ieee754_expf(float x) /* default IEEE double exp */`
			`#else`
			`float __ieee754_expf(x) /* default IEEE double exp */`
			`float x;`
			`#endif`
			`{`
			`float y,hi,lo,c,t;`
Throughout, run newlib with -Wall -Werror option and fix bugs and compiler warnings found this way. * libc/stdio/freopen.c (_freopen_r): Fix bug setting _flags. * libc/include/stdio.h (_rename): Define when building newlib. * libc/include/sys/signal.h (_kill): Ditto. * libc/include/sys/stat.h (_mkdir): Ditto. * libc/include/sys/time.h (_gettimeofday): Ditto. * libc/include/sys/times.h (_times): Ditto. * libc/include/sys/wait.h (_wait): Ditto. * libc/locale/lmessages.c (empty): Don't define for Cygwin. * libc/locale/lmonetary.c (cnv): Ditto. * libc/locale/nl_langinfo.c (nl_langinfo): Ditto for variable s. * libc/posix/collate.c: Throughout cast to avoid compiler warning. * libc/posix/engine.c (matcher): Initialize dp to avoid compiler warning. * libc/posix/glob.c: Disable on Cygwin. Explain why. * libc/posix/regcomp.c: Fix "uninitialized" compiler warnings. (dissect): Deliberately silence gcc compiler warning. Add comment to explain why. * libc/posix/wordexp.c (wordexp): Remove num_bytes variable since result is never used. * libc/posix/popen.c (popen): Ditto for variable last. * libc/reent/mkdirr.c: Include sys/stat.h. * libc/reent/renamer.c: Include stdio.h. * libc/search/hash.c: Throughout use underscored variants of the stat function family. (init_hash): Add missing definition for the __USE_INTERNAL_STAT64 case. * libc/search/hash_bigkey.c (__big_insert): Add parenthesis to avoid compiler warning. * libc/search/hash_page.c (overflow_page): Initalize freep to NULL to avoid compiler warning. * libc/stdio/asiprintf.c (_asiprintf_r): Cast unsigned char * to char * to avoid compiler warning. (asiprintf): Ditto. * libc/stdio/asprintf.c (_asprintf_r): Ditto. (asprintf): Ditto. * libc/stdio/vasiprintf.c (_vasiprintf_r): Ditto. * libc/stdio/vasprintf.c (_vasprintf_r): Ditto. * libc/stdio/mktemp.c (_gettemp): Cast to unsigned char in call to isdigit to avoid compiler warning. 
* libc/stdio/vfprintf.c (_VFPRINTF_R): Initialize variables used for grouping to avoid compiler warning. Only define and set nseps and nrepeats if they are really used. * libc/stdio/vfwprintf.c (_VFWPRINTF_R): Ditto. Only define state if it is really used. * libc/stdio/vfscanf.c (u_char): Revert to be defined as unsigned char. (__SVFSCANF_R): Cast fmt in call to __mbtowc. * libc/stdlib/mbtowc_r.c (JIS_state_table): Disable when building Cygwin. (JIS_action_table): Ditto. * libc/stdlib/wctomb_r.c (__utf8_wctomb): Add parenthesis to avoid compiler warning. * libc/string/strcasestr.c: Deliberately silence gcc compiler warning. Add comment to explain why. * libc/time/strptime.c (strptime): Cast to unsigned char in calls to isspace to avoid compiler warning. * libm/math/e_atan2.c (__ieee754_atan2): Add parenthesis to avoid compiler warning. * libm/math/e_exp.c (__ieee754_exp): Initialize k to 0 to avoid compiler warning. Drop setting it to 0 later. * libm/math/ef_exp.c (__ieee754_expf): Ditto. * libm/math/e_pow.c (__ieee754_pow): Add braces to avoid compiler warning. * libm/math/ef_pow.c (__ieee754_powf): Ditto. * libm/math/er_lgamma.c (__ieee754_lgamma_r): Initialize nadj to 0 to avoid compiler warning. * libm/math/erf_lgamma.c (__ieee754_lgammaf_r): Ditto. * libm/math/e_rem_pio2.c (__ieee754_rem_pio2): Ditto for variable z. * libm/common/sf_round.c (roundf): Remove signbit variable since result is never used. 2012-08-08 11:04:18 +00:00			`__int32_t k = 0,xsb,sx;`
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00			`__uint32_t hx;`

* libc/include/machine/ieeefp.h: Comment about new configuration macros _FLT_LARGEST_EXPONENT_IS_NORMAL and _FLT_NO_DENORMALS. * libm/common/fdlib.h: Define new macros for testing floats. * libm/common/sf_: Use them. libm/math/ef_: Likewise. libm/math/sf_*: Likewise. 2001-04-04 13:33:01 +00:00			`GET_FLOAT_WORD(sx,x);`
			`xsb = (sx>>31)&1; /* sign bit of x */`
			`hx = sx & 0x7fffffff; /* high word of \|x\| */`
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00
			`/* filter out non-finite argument */`
* libc/include/machine/ieeefp.h: Comment about new configuration macros _FLT_LARGEST_EXPONENT_IS_NORMAL and _FLT_NO_DENORMALS. * libm/common/fdlib.h: Define new macros for testing floats. * libm/common/sf_: Use them. libm/math/ef_: Likewise. libm/math/sf_*: Likewise. 2001-04-04 13:33:01 +00:00			`if(FLT_UWORD_IS_NAN(hx))`
			`return x+x; /* NaN */`
			`if(FLT_UWORD_IS_INFINITE(hx))`
			`return (xsb==0)? x:0.0; /* exp(+-inf)={inf,0} */`
			`if(sx > FLT_UWORD_LOG_MAX)`
libm/math: Use __math_xflow in obsolete math code [v2] C compilers may fold const values at compile time, so expressions which try to elicit underflow/overflow by performing simple arithemetic on suitable values will not generate the required exceptions. Work around this by replacing code which does these arithmetic operations with calls to the existing __math_xflow functions that are designed to do this correctly. Signed-off-by: Keith Packard <keithp@keithp.com> ---- v2: libm/math: Pass sign to __math_xflow instead of muliplying result 2020-07-30 16:41:05 -07:00			`return __math_oflowf(0); /* overflow */`
* libc/include/machine/ieeefp.h: Comment about new configuration macros _FLT_LARGEST_EXPONENT_IS_NORMAL and _FLT_NO_DENORMALS. * libm/common/fdlib.h: Define new macros for testing floats. * libm/common/sf_: Use them. libm/math/ef_: Likewise. libm/math/sf_*: Likewise. 2001-04-04 13:33:01 +00:00			`if(sx < 0 && hx > FLT_UWORD_LOG_MIN)`
libm/math: ensure that expf(-huge) sets FE_UNDERFLOW exception It was calling __math_uflow(0) instead of __math_uflowf(0), which resulted in no exception being set on machines with exception support for float but not double. Signed-off-by: Keith Packard <keithp@keithp.com> 2020-08-07 22:40:21 -07:00			`return __math_uflowf(0); /* underflow */`
* libc/include/machine/ieeefp.h: Comment about new configuration macros _FLT_LARGEST_EXPONENT_IS_NORMAL and _FLT_NO_DENORMALS. * libm/common/fdlib.h: Define new macros for testing floats. * libm/common/sf_: Use them. libm/math/ef_: Likewise. libm/math/sf_*: Likewise. 2001-04-04 13:33:01 +00:00
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00			`/* argument reduction */`
			`if(hx > 0x3eb17218) { /* if \|x\| > 0.5 ln2 */`
			`if(hx < 0x3F851592) { /* and \|x\| < 1.5 ln2 */`
			`hi = x-ln2HI[xsb]; lo=ln2LO[xsb]; k = 1-xsb-xsb;`
			`} else {`
			`k = invln2*x+halF[xsb];`
			`t = k;`
			`hi = x - t*ln2HI[0]; /* t*ln2HI is exact here */`
			`lo = t*ln2LO[0];`
			`}`
			`x = hi - lo;`
			`}`
Fix error in exp in magnitude [2e-32,2e-28] While testing the exp function we noticed some errors at the specified magnitude. Within this range the exp function returns the input value +1 as an output. We chose to run a test of 1m exponentially spaced values in the ranges [-2^-27,-2^-32] and [2^-32,2^-27] which showed 7603 and 3912 results with an error of >=0.5 ULP (compared with MPFR in 128 bit) with the highest being 0.56 ULP and 0.53 ULP. It's easy to fix by changing the magnitude at which the input value +1 is returned from <2^-28 to <2^-32 and using the polynomial instead. This reduces the number of results with an error of >=0.5 ULP to 485 and 479 in above tests, all of which are exactly 0.5 ULP. As we were already checking on exp we also took a look at expf. For expf the magnitude where the input value +1 is returned can be increased from <2^-28 to <2^-23 without accuracy loss for a slight performance improvement. To ensure this was the correct value we tested all values in the ranges [-2^-17,-2^-28] and [2^-28,2^-17] (~92.3m values each). 2020-03-06 15:46:33 +01:00			`else if(hx < 0x34000000) { /* when \|x\|<2**-23 */`
import newlib-2000-02-17 snapshot 2000-02-17 19:39:52 +00:00			`if(huge+x>one) return one+x;/* trigger inexact */`
			`}`

			`/* x is now in primary range */`
			`t = x*x;`
			`c = x - t*(P1+t*(P2+t*(P3+t*(P4+t*P5))));`
			`if(k==0) return one-((x*c)/(c-(float)2.0)-x);`
			`else y = one-((lo-(x*c)/((float)2.0-c))-hi);`
			`if(k >= -125) {`
			`__uint32_t hy;`
			`GET_FLOAT_WORD(hy,y);`
			`SET_FLOAT_WORD(y,hy+(k<<23)); /* add k to y's exponent */`
			`return y;`
			`} else {`
			`__uint32_t hy;`
			`GET_FLOAT_WORD(hy,y);`
			`SET_FLOAT_WORD(y,hy+((k+100)<<23)); /* add k to y's exponent */`
			`return y*twom100;`
			`}`
			`}`
New expf, exp2f, logf, log2f and powf implementations Based on code from https://github.com/ARM-software/optimized-routines/ This patch adds a highly optimized generic implementation of expf, exp2f, logf, log2f and powf. The new functions are not only faster (6x for powf!), but are also smaller and more accurate. In order to achieve this, the algorithm uses double precision arithmetic for accuracy, avoids divisions and uses small table lookups to minimize the polynomials. Special cases are handled inline to avoid the unnecessary overhead of wrapper functions and set errno to POSIX requirements. The new functions are added under newlib/libm/common, but the old implementations are kept (in newlib/libm/math) for non-IEEE or pre-C99 systems. Targets can enable the new math code by defining __OBSOLETE_MATH_DEFAULT to 0 in newlib/libc/include/machine/ieeefp.h, users can override the default by defining __OBSOLETE_MATH. Currently the new code is enabled for AArch64 and AArch32 with VFP. Targets with a single precision FPU may still prefer the old implementation. libm.a size changes: arm: -1692 arm/thumb/v7-a/nofp: -878 arm/thumb/v7-a+fp/hard: -864 arm/thumb/v7-a+fp/softfp: -908 aarch64: -1476 2017-05-25 16:41:38 +01:00			`#endif /* __OBSOLETE_MATH */`