Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Normal
Revision Log

sf_pow.c @ 444

Last change on this file since 444 was 444, checked in by satin@…, 6 years ago
add newlib,libalmos-mkh, restructure shared_syscalls.h and mini-libc
File size: 6.7 KB

Rev	Line
[444]	1	/* Single-precision pow function.
	2	Copyright (c) 2017 ARM Ltd. All rights reserved.
	3
	4	Redistribution and use in source and binary forms, with or without
	5	modification, are permitted provided that the following conditions
	6	are met:
	7	1. Redistributions of source code must retain the above copyright
	8	notice, this list of conditions and the following disclaimer.
	9	2. Redistributions in binary form must reproduce the above copyright
	10	notice, this list of conditions and the following disclaimer in the
	11	documentation and/or other materials provided with the distribution.
	12	3. The name of the company may not be used to endorse or promote
	13	products derived from this software without specific prior written
	14	permission.
	15
	16	THIS SOFTWARE IS PROVIDED BY ARM LTD ``AS IS AND ANY EXPRESS OR IMPLIED
	17	WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
	18	MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
	19	IN NO EVENT SHALL ARM LTD BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	20	SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
	21	TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
	22	PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
	23	LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
	24	NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
	25	SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */
	26
	27	#include "fdlibm.h"
	28	#if !__OBSOLETE_MATH
	29
	30	#include <math.h>
	31	#include <stdint.h>
	32	#include "math_config.h"
	33
	34	/*
	35	POWF_LOG2_POLY_ORDER = 5
	36	EXP2F_TABLE_BITS = 5
	37
	38	ULP error: 0.82 (~ 0.5 + relerr*2^24)
	39	relerr: 1.27 * 2^-26 (Relative error ~= 128Ln2relerr_log2 + relerr_exp2)
	40	relerr_log2: 1.83 * 2^-33 (Relative error of logx.)
	41	relerr_exp2: 1.69 * 2^-34 (Relative error of exp2(ylogx).)
	42	*/
	43
	44	#define N (1 << POWF_LOG2_TABLE_BITS)
	45	#define T __powf_log2_data.tab
	46	#define A __powf_log2_data.poly
	47	#define OFF 0x3f330000
	48
	49	/* Subnormal input is normalized so ix has negative biased exponent.
	50	Output is multiplied by N (POWF_SCALE) if TOINT_INTRINICS is set. */
	51	static inline double_t
	52	log2_inline (uint32_t ix)
	53	{
	54	/* double_t for better performance on targets with FLT_EVAL_METHOD==2. */
	55	double_t z, r, r2, r4, p, q, y, y0, invc, logc;
	56	uint32_t iz, top, tmp;
	57	int k, i;
	58
	59	/* x = 2^k z; where z is in range [OFF,2*OFF] and exact.
	60	The range is split into N subintervals.
	61	The ith subinterval contains z and c is near its center. */
	62	tmp = ix - OFF;
	63	i = (tmp >> (23 - POWF_LOG2_TABLE_BITS)) % N;
	64	top = tmp & 0xff800000;
	65	iz = ix - top;
	66	k = (int32_t) top >> (23 - POWF_SCALE_BITS); /* arithmetic shift */
	67	invc = T[i].invc;
	68	logc = T[i].logc;
	69	z = (double_t) asfloat (iz);
	70
	71	/* log2(x) = log1p(z/c-1)/ln2 + log2(c) + k */
	72	r = z * invc - 1;
	73	y0 = logc + (double_t) k;
	74
	75	/* Pipelined polynomial evaluation to approximate log1p(r)/ln2. */
	76	r2 = r * r;
	77	y = A[0] * r + A[1];
	78	p = A[2] * r + A[3];
	79	r4 = r2 * r2;
	80	q = A[4] * r + y0;
	81	q = p * r2 + q;
	82	y = y * r4 + q;
	83	return y;
	84	}
	85
	86	#undef N
	87	#undef T
	88	#define N (1 << EXP2F_TABLE_BITS)
	89	#define T __exp2f_data.tab
	90	#define SIGN_BIAS (1 << (EXP2F_TABLE_BITS + 11))
	91
	92	/* The output of log2 and thus the input of exp2 is either scaled by N
	93	(in case of fast toint intrinsics) or not. The unscaled xd must be
	94	in [-1021,1023], sign_bias sets the sign of the result. */
	95	static inline double_t
	96	exp2_inline (double_t xd, unsigned long sign_bias)
	97	{
	98	uint64_t ki, ski, t;
	99	/* double_t for better performance on targets with FLT_EVAL_METHOD==2. */
	100	double_t kd, z, r, r2, y, s;
	101
	102	#if TOINT_INTRINSICS
	103	# define C __exp2f_data.poly_scaled
	104	/* Nx = k + r with r in [-1/2, 1/2] /
	105	kd = roundtoint (xd); /* k */
	106	ki = converttoint (xd);
	107	#else
	108	# define C __exp2f_data.poly
	109	# define SHIFT __exp2f_data.shift_scaled
	110	/* x = k/N + r with r in [-1/(2N), 1/(2N)] */
	111	kd = (double) (xd + SHIFT); /* Rounding to double precision is required. */
	112	ki = asuint64 (kd);
	113	kd -= SHIFT; /* k/N */
	114	#endif
	115	r = xd - kd;
	116
	117	/* exp2(x) = 2^(k/N) * 2^r ~= s * (C0r^3 + C1r^2 + C2r + 1) /
	118	t = T[ki % N];
	119	ski = ki + sign_bias;
	120	t += ski << (52 - EXP2F_TABLE_BITS);
	121	s = asdouble (t);
	122	z = C[0] * r + C[1];
	123	r2 = r * r;
	124	y = C[2] * r + 1;
	125	y = z * r2 + y;
	126	y = y * s;
	127	return y;
	128	}
	129
	130	/* Returns 0 if not int, 1 if odd int, 2 if even int. */
	131	static inline int
	132	checkint (uint32_t iy)
	133	{
	134	int e = iy >> 23 & 0xff;
	135	if (e < 0x7f)
	136	return 0;
	137	if (e > 0x7f + 23)
	138	return 2;
	139	if (iy & ((1 << (0x7f + 23 - e)) - 1))
	140	return 0;
	141	if (iy & (1 << (0x7f + 23 - e)))
	142	return 1;
	143	return 2;
	144	}
	145
	146	static inline int
	147	zeroinfnan (uint32_t ix)
	148	{
	149	return 2 * ix - 1 >= 2u * 0x7f800000 - 1;
	150	}
	151
	152	float
	153	powf (float x, float y)
	154	{
	155	unsigned long sign_bias = 0;
	156	uint32_t ix, iy;
	157
	158	ix = asuint (x);
	159	iy = asuint (y);
	160	if (__builtin_expect (ix - 0x00800000 >= 0x7f800000 - 0x00800000
	161	\|\| zeroinfnan (iy),
	162	0))
	163	{
	164	/* Either (x < 0x1p-126 or inf or nan) or (y is 0 or inf or nan). */
	165	if (__builtin_expect (zeroinfnan (iy), 0))
	166	{
	167	if (2 * iy == 0)
	168	return issignalingf_inline (x) ? x + y : 1.0f;
	169	if (ix == 0x3f800000)
	170	return issignalingf_inline (y) ? x + y : 1.0f;
	171	if (2 * ix > 2u * 0x7f800000 \|\| 2 * iy > 2u * 0x7f800000)
	172	return x + y;
	173	if (2 * ix == 2 * 0x3f800000)
	174	return 1.0f;
	175	if ((2 * ix < 2 * 0x3f800000) == !(iy & 0x80000000))
	176	return 0.0f; /* \|x\|<1 && y==inf or \|x\|>1 && y==-inf. */
	177	return y * y;
	178	}
	179	if (__builtin_expect (zeroinfnan (ix), 0))
	180	{
	181	float_t x2 = x * x;
	182	if (ix & 0x80000000 && checkint (iy) == 1)
	183	{
	184	x2 = -x2;
	185	sign_bias = 1;
	186	}
	187	#if WANT_ERRNO
	188	if (2 * ix == 0 && iy & 0x80000000)
	189	return __math_divzerof (sign_bias);
	190	#endif
	191	return iy & 0x80000000 ? 1 / x2 : x2;
	192	}
	193	/* x and y are non-zero finite. */
	194	if (ix & 0x80000000)
	195	{
	196	/* Finite x < 0. */
	197	int yint = checkint (iy);
	198	if (yint == 0)
	199	return __math_invalidf (x);
	200	if (yint == 1)
	201	sign_bias = SIGN_BIAS;
	202	ix &= 0x7fffffff;
	203	}
	204	if (ix < 0x00800000)
	205	{
	206	/* Normalize subnormal x so exponent becomes negative. */
	207	ix = asuint (x * 0x1p23f);
	208	ix &= 0x7fffffff;
	209	ix -= 23 << 23;
	210	}
	211	}
	212	double_t logx = log2_inline (ix);
	213	double_t ylogx = y * logx; /* Note: cannot overflow, y is single prec. */
	214	if (__builtin_expect ((asuint64 (ylogx) >> 47 & 0xffff)
	215	>= asuint64 (126.0 * POWF_SCALE) >> 47,
	216	0))
	217	{
	218	/* \|ylog(x)\| >= 126. /
	219	if (ylogx > 0x1.fffffffd1d571p+6 * POWF_SCALE)
	220	return __math_oflowf (sign_bias);
	221	if (ylogx <= -150.0 * POWF_SCALE)
	222	return __math_uflowf (sign_bias);
	223	#if WANT_ERRNO_UFLOW
	224	if (ylogx < -149.0 * POWF_SCALE)
	225	return __math_may_uflowf (sign_bias);
	226	#endif
	227	}
	228	return (float) exp2_inline (ylogx, sign_bias);
	229	}
	230	#endif /* !__OBSOLETE_MATH */

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: trunk/libs/newlib/src/newlib/libm/common/sf_pow.c @ 444

Download in other formats: