blob: e88fa6956f1b233f3a554a28a9173066929deff2 [file] [log] [blame]
Viet-Trung Luu96b05c12016-01-11 11:26:36 -08001/* origin: FreeBSD /usr/src/lib/msun/src/s_exp2f.c */
2/*-
3 * Copyright (c) 2005 David Schultz <das@FreeBSD.ORG>
4 * All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 * SUCH DAMAGE.
26 */
27
28#include "libm.h"
29
/* Number of entries in the exp2ft lookup table (a power of two). */
#define TBLSIZE 16

/*
 * Adding and then subtracting redux rounds a float to the nearest
 * multiple of 1/TBLSIZE; exp2f() uses this for its argument reduction.
 */
static const float redux = 0x1.8p23f / TBLSIZE;

/*
 * Coefficients of the degree-4 polynomial that exp2f() uses for exp2(z):
 *   exp2(z) ~= 1 + P1*z + P2*z**2 + P3*z**3 + P4*z**4
 */
static const float P1 = 0x1.62e430p-1f;
static const float P2 = 0x1.ebfbe0p-3f;
static const float P3 = 0x1.c6b348p-5f;
static const float P4 = 0x1.3b2c9cp-7f;

/*
 * Table of exp2((i - TBLSIZE/2) / TBLSIZE) for i = 0 .. TBLSIZE-1,
 * i.e. entry 0 is 2**-0.5 and entry TBLSIZE/2 is exactly 1.
 */
static const double exp2ft[TBLSIZE] = {
    0x1.6a09e667f3bcdp-1, /* [ 0] */
    0x1.7a11473eb0187p-1, /* [ 1] */
    0x1.8ace5422aa0dbp-1, /* [ 2] */
    0x1.9c49182a3f090p-1, /* [ 3] */
    0x1.ae89f995ad3adp-1, /* [ 4] */
    0x1.c199bdd85529cp-1, /* [ 5] */
    0x1.d5818dcfba487p-1, /* [ 6] */
    0x1.ea4afa2a490dap-1, /* [ 7] */
    0x1.0000000000000p+0, /* [ 8] */
    0x1.0b5586cf9890fp+0, /* [ 9] */
    0x1.172b83c7d517bp+0, /* [10] */
    0x1.2387a6e756238p+0, /* [11] */
    0x1.306fe0a31b715p+0, /* [12] */
    0x1.3dea64c123422p+0, /* [13] */
    0x1.4bfdad5362a27p+0, /* [14] */
    0x1.5ab07dd485429p+0, /* [15] */
};
44
45/*
46 * exp2f(x): compute the base 2 exponential of x
47 *
48 * Accuracy: Peak error < 0.501 ulp; location of peak: -0.030110927.
49 *
50 * Method: (equally-spaced tables)
51 *
52 * Reduce x:
53 * x = k + y, for integer k and |y| <= 1/2.
54 * Thus we have exp2f(x) = 2**k * exp2(y).
55 *
56 * Reduce y:
57 * y = i/TBLSIZE + z for integer i near y * TBLSIZE.
58 * Thus we have exp2(y) = exp2(i/TBLSIZE) * exp2(z),
59 * with |z| <= 2**-(TBLSIZE+1).
60 *
61 * We compute exp2(i/TBLSIZE) via table lookup and exp2(z) via a
62 * degree-4 minimax polynomial with maximum error under 1.4 * 2**-33.
63 * Using double precision for everything except the reduction makes
64 * roundoff error insignificant and simplifies the scaling step.
65 *
66 * This method is due to Tang, but I do not use his suggested parameters:
67 *
68 * Tang, P. Table-driven Implementation of the Exponential Function
69 * in IEEE Floating-Point Arithmetic. TOMS 15(2), 144-157 (1989).
70 */
George Kulakowski17e3b042016-02-18 15:59:50 -080071float exp2f(float x) {
72 double_t t, r, z;
73 union {
74 float f;
75 uint32_t i;
76 } u = {x};
77 union {
78 double f;
79 uint64_t i;
80 } uk;
81 uint32_t ix, i0, k;
Viet-Trung Luu96b05c12016-01-11 11:26:36 -080082
George Kulakowski17e3b042016-02-18 15:59:50 -080083 /* Filter out exceptional cases. */
84 ix = u.i & 0x7fffffff;
85 if (ix > 0x42fc0000) { /* |x| > 126 */
86 if (u.i >= 0x43000000 && u.i < 0x80000000) { /* x >= 128 */
87 x *= 0x1p127f;
88 return x;
89 }
90 if (u.i >= 0x80000000) { /* x < -126 */
91 if (u.i >= 0xc3160000 || (u.i & 0x0000ffff))
92 FORCE_EVAL(-0x1p-149f / x);
93 if (u.i >= 0xc3160000) /* x <= -150 */
94 return 0;
95 }
96 } else if (ix <= 0x33000000) { /* |x| <= 0x1p-25 */
97 return 1.0f + x;
98 }
Viet-Trung Luu96b05c12016-01-11 11:26:36 -080099
George Kulakowski17e3b042016-02-18 15:59:50 -0800100 /* Reduce x, computing z, i0, and k. */
101 u.f = x + redux;
102 i0 = u.i;
103 i0 += TBLSIZE / 2;
104 k = i0 / TBLSIZE;
105 uk.i = (uint64_t)(0x3ff + k) << 52;
106 i0 &= TBLSIZE - 1;
107 u.f -= redux;
108 z = x - u.f;
109 /* Compute r = exp2(y) = exp2ft[i0] * p(z). */
110 r = exp2ft[i0];
111 t = r * z;
112 r = r + t * (P1 + z * P2) + t * (z * z) * (P3 + z * P4);
Viet-Trung Luu96b05c12016-01-11 11:26:36 -0800113
George Kulakowski17e3b042016-02-18 15:59:50 -0800114 /* Scale by 2**k */
115 return r * uk.f;
Viet-Trung Luu96b05c12016-01-11 11:26:36 -0800116}