Blame - fusl/src/math/exp2f.c - mojo-tools

blob: e88fa6956f1b233f3a554a28a9173066929deff2 [file] [log] [blame]

Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	1	/* origin: FreeBSD /usr/src/lib/msun/src/s_exp2f.c */
				2	/*-
				3	* Copyright (c) 2005 David Schultz <das@FreeBSD.ORG>
				4	* All rights reserved.
				5	*
				6	* Redistribution and use in source and binary forms, with or without
				7	* modification, are permitted provided that the following conditions
				8	* are met:
				9	* 1. Redistributions of source code must retain the above copyright
				10	* notice, this list of conditions and the following disclaimer.
				11	* 2. Redistributions in binary form must reproduce the above copyright
				12	* notice, this list of conditions and the following disclaimer in the
				13	* documentation and/or other materials provided with the distribution.
				14	*
				15	* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
				16	* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
				17	* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
				18	* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
				19	* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
				20	* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
				21	* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
				22	* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
				23	* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
				24	* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
				25	* SUCH DAMAGE.
				26	*/
				27
				28	#include "libm.h"
				29
				30	#define TBLSIZE 16
				31
George Kulakowski	17e3b04	2016-02-18 15:59:50 -0800	[diff] [blame]	32	static const float redux = 0x1.8p23f / TBLSIZE, P1 = 0x1.62e430p-1f,
				33	P2 = 0x1.ebfbe0p-3f, P3 = 0x1.c6b348p-5f,
				34	P4 = 0x1.3b2c9cp-7f;
Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	35
				36	static const double exp2ft[TBLSIZE] = {
George Kulakowski	17e3b04	2016-02-18 15:59:50 -0800	[diff] [blame]	37	0x1.6a09e667f3bcdp-1, 0x1.7a11473eb0187p-1, 0x1.8ace5422aa0dbp-1,
				38	0x1.9c49182a3f090p-1, 0x1.ae89f995ad3adp-1, 0x1.c199bdd85529cp-1,
				39	0x1.d5818dcfba487p-1, 0x1.ea4afa2a490dap-1, 0x1.0000000000000p+0,
				40	0x1.0b5586cf9890fp+0, 0x1.172b83c7d517bp+0, 0x1.2387a6e756238p+0,
				41	0x1.306fe0a31b715p+0, 0x1.3dea64c123422p+0, 0x1.4bfdad5362a27p+0,
				42	0x1.5ab07dd485429p+0,
Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	43	};
				44
				45	/*
				46	* exp2f(x): compute the base 2 exponential of x
				47	*
				48	* Accuracy: Peak error < 0.501 ulp; location of peak: -0.030110927.
				49	*
				50	* Method: (equally-spaced tables)
				51	*
				52	* Reduce x:
				53	* x = k + y, for integer k and |y| <= 1/2.
				54	* Thus we have exp2f(x) = 2**k * exp2(y).
				55	*
				56	* Reduce y:
				57	* y = i/TBLSIZE + z for integer i near y * TBLSIZE.
				58	* Thus we have exp2(y) = exp2(i/TBLSIZE) * exp2(z),
				59	* with |z| <= 1/(2*TBLSIZE).
				60	*
				61	* We compute exp2(i/TBLSIZE) via table lookup and exp2(z) via a
				62	* degree-4 minimax polynomial with maximum error under 1.4 * 2**-33.
				63	* Using double precision for everything except the reduction makes
				64	* roundoff error insignificant and simplifies the scaling step.
				65	*
				66	* This method is due to Tang, but I do not use his suggested parameters:
				67	*
				68	* Tang, P. Table-driven Implementation of the Exponential Function
				69	* in IEEE Floating-Point Arithmetic. TOMS 15(2), 144-157 (1989).
				70	*/
George Kulakowski	17e3b04	2016-02-18 15:59:50 -0800	[diff] [blame]	71	float exp2f(float x) {
				72	double_t t, r, z;
				73	union {
				74	float f;
				75	uint32_t i;
				76	} u = {x};
				77	union {
				78	double f;
				79	uint64_t i;
				80	} uk;
				81	uint32_t ix, i0, k;
Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	82
George Kulakowski	17e3b04	2016-02-18 15:59:50 -0800	[diff] [blame]	83	/* Filter out exceptional cases. */
				84	ix = u.i & 0x7fffffff;
				85	if (ix > 0x42fc0000) { /* \|x\| > 126 */
				86	if (u.i >= 0x43000000 && u.i < 0x80000000) { /* x >= 128 */
				87	x *= 0x1p127f;
				88	return x;
				89	}
				90	if (u.i >= 0x80000000) { /* x < -126 */
				91	if (u.i >= 0xc3160000 \|\| (u.i & 0x0000ffff))
				92	FORCE_EVAL(-0x1p-149f / x);
				93	if (u.i >= 0xc3160000) /* x <= -150 */
				94	return 0;
				95	}
				96	} else if (ix <= 0x33000000) { /* \|x\| <= 0x1p-25 */
				97	return 1.0f + x;
				98	}
Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	99
George Kulakowski	17e3b04	2016-02-18 15:59:50 -0800	[diff] [blame]	100	/* Reduce x, computing z, i0, and k. */
				101	u.f = x + redux;
				102	i0 = u.i;
				103	i0 += TBLSIZE / 2;
				104	k = i0 / TBLSIZE;
				105	uk.i = (uint64_t)(0x3ff + k) << 52;
				106	i0 &= TBLSIZE - 1;
				107	u.f -= redux;
				108	z = x - u.f;
				109	/* Compute r = exp2(y) = exp2ft[i0] * p(z). */
				110	r = exp2ft[i0];
				111	t = r * z;
				112	r = r + t * (P1 + z * P2) + t * (z * z) * (P3 + z * P4);
Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	113
George Kulakowski	17e3b04	2016-02-18 15:59:50 -0800	[diff] [blame]	114	/* Scale by 2*k /
				115	return r * uk.f;
Viet-Trung Luu	96b05c1	2016-01-11 11:26:36 -0800	[diff] [blame]	116	}