/* origin: FreeBSD /usr/src/lib/msun/src/s_cbrtl.c */
/*-
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 * Copyright (c) 2009-2011, Bruce D. Evans, Steven G. Kargl, David Schultz.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 *
 * The argument reduction and testing for exceptional cases was
 * written by Steven G. Kargl with input from Bruce D. Evans
 * and David A. Schultz.
 */

#include "libm.h"

#if LDBL_MANT_DIG == 53 && LDBL_MAX_EXP == 1024
cbrtl(long double x)21*c9945492SAndroid Build Coastguard Worker long double cbrtl(long double x)
22*c9945492SAndroid Build Coastguard Worker {
23*c9945492SAndroid Build Coastguard Worker return cbrt(x);
24*c9945492SAndroid Build Coastguard Worker }
#elif (LDBL_MANT_DIG == 64 || LDBL_MANT_DIG == 113) && LDBL_MAX_EXP == 16384
/*
 * Integer bias added to (float bit pattern)/3 when cbrtl() forms its
 * first rough estimate of the cube root.
 */
static const unsigned B1 = 709958130; /* B1 = (127-127.0/3-0.03306235651)*2**23 */

cbrtl(long double x)28*c9945492SAndroid Build Coastguard Worker long double cbrtl(long double x)
29*c9945492SAndroid Build Coastguard Worker {
30*c9945492SAndroid Build Coastguard Worker union ldshape u = {x}, v;
31*c9945492SAndroid Build Coastguard Worker union {float f; uint32_t i;} uft;
32*c9945492SAndroid Build Coastguard Worker long double r, s, t, w;
33*c9945492SAndroid Build Coastguard Worker double_t dr, dt, dx;
34*c9945492SAndroid Build Coastguard Worker float_t ft;
35*c9945492SAndroid Build Coastguard Worker int e = u.i.se & 0x7fff;
36*c9945492SAndroid Build Coastguard Worker int sign = u.i.se & 0x8000;
37*c9945492SAndroid Build Coastguard Worker
38*c9945492SAndroid Build Coastguard Worker /*
39*c9945492SAndroid Build Coastguard Worker * If x = +-Inf, then cbrt(x) = +-Inf.
40*c9945492SAndroid Build Coastguard Worker * If x = NaN, then cbrt(x) = NaN.
41*c9945492SAndroid Build Coastguard Worker */
42*c9945492SAndroid Build Coastguard Worker if (e == 0x7fff)
43*c9945492SAndroid Build Coastguard Worker return x + x;
44*c9945492SAndroid Build Coastguard Worker if (e == 0) {
45*c9945492SAndroid Build Coastguard Worker /* Adjust subnormal numbers. */
46*c9945492SAndroid Build Coastguard Worker u.f *= 0x1p120;
47*c9945492SAndroid Build Coastguard Worker e = u.i.se & 0x7fff;
48*c9945492SAndroid Build Coastguard Worker /* If x = +-0, then cbrt(x) = +-0. */
49*c9945492SAndroid Build Coastguard Worker if (e == 0)
50*c9945492SAndroid Build Coastguard Worker return x;
51*c9945492SAndroid Build Coastguard Worker e -= 120;
52*c9945492SAndroid Build Coastguard Worker }
53*c9945492SAndroid Build Coastguard Worker e -= 0x3fff;
54*c9945492SAndroid Build Coastguard Worker u.i.se = 0x3fff;
55*c9945492SAndroid Build Coastguard Worker x = u.f;
56*c9945492SAndroid Build Coastguard Worker switch (e % 3) {
57*c9945492SAndroid Build Coastguard Worker case 1:
58*c9945492SAndroid Build Coastguard Worker case -2:
59*c9945492SAndroid Build Coastguard Worker x *= 2;
60*c9945492SAndroid Build Coastguard Worker e--;
61*c9945492SAndroid Build Coastguard Worker break;
62*c9945492SAndroid Build Coastguard Worker case 2:
63*c9945492SAndroid Build Coastguard Worker case -1:
64*c9945492SAndroid Build Coastguard Worker x *= 4;
65*c9945492SAndroid Build Coastguard Worker e -= 2;
66*c9945492SAndroid Build Coastguard Worker break;
67*c9945492SAndroid Build Coastguard Worker }
68*c9945492SAndroid Build Coastguard Worker v.f = 1.0;
69*c9945492SAndroid Build Coastguard Worker v.i.se = sign | (0x3fff + e/3);
70*c9945492SAndroid Build Coastguard Worker
71*c9945492SAndroid Build Coastguard Worker /*
72*c9945492SAndroid Build Coastguard Worker * The following is the guts of s_cbrtf, with the handling of
73*c9945492SAndroid Build Coastguard Worker * special values removed and extra care for accuracy not taken,
74*c9945492SAndroid Build Coastguard Worker * but with most of the extra accuracy not discarded.
75*c9945492SAndroid Build Coastguard Worker */
76*c9945492SAndroid Build Coastguard Worker
77*c9945492SAndroid Build Coastguard Worker /* ~5-bit estimate: */
78*c9945492SAndroid Build Coastguard Worker uft.f = x;
79*c9945492SAndroid Build Coastguard Worker uft.i = (uft.i & 0x7fffffff)/3 + B1;
80*c9945492SAndroid Build Coastguard Worker ft = uft.f;
81*c9945492SAndroid Build Coastguard Worker
82*c9945492SAndroid Build Coastguard Worker /* ~16-bit estimate: */
83*c9945492SAndroid Build Coastguard Worker dx = x;
84*c9945492SAndroid Build Coastguard Worker dt = ft;
85*c9945492SAndroid Build Coastguard Worker dr = dt * dt * dt;
86*c9945492SAndroid Build Coastguard Worker dt = dt * (dx + dx + dr) / (dx + dr + dr);
87*c9945492SAndroid Build Coastguard Worker
88*c9945492SAndroid Build Coastguard Worker /* ~47-bit estimate: */
89*c9945492SAndroid Build Coastguard Worker dr = dt * dt * dt;
90*c9945492SAndroid Build Coastguard Worker dt = dt * (dx + dx + dr) / (dx + dr + dr);
91*c9945492SAndroid Build Coastguard Worker
92*c9945492SAndroid Build Coastguard Worker #if LDBL_MANT_DIG == 64
93*c9945492SAndroid Build Coastguard Worker /*
94*c9945492SAndroid Build Coastguard Worker * dt is cbrtl(x) to ~47 bits (after x has been reduced to 1 <= x < 8).
95*c9945492SAndroid Build Coastguard Worker * Round it away from zero to 32 bits (32 so that t*t is exact, and
96*c9945492SAndroid Build Coastguard Worker * away from zero for technical reasons).
97*c9945492SAndroid Build Coastguard Worker */
98*c9945492SAndroid Build Coastguard Worker t = dt + (0x1.0p32L + 0x1.0p-31L) - 0x1.0p32;
99*c9945492SAndroid Build Coastguard Worker #elif LDBL_MANT_DIG == 113
100*c9945492SAndroid Build Coastguard Worker /*
101*c9945492SAndroid Build Coastguard Worker * Round dt away from zero to 47 bits. Since we don't trust the 47,
102*c9945492SAndroid Build Coastguard Worker * add 2 47-bit ulps instead of 1 to round up. Rounding is slow and
103*c9945492SAndroid Build Coastguard Worker * might be avoidable in this case, since on most machines dt will
104*c9945492SAndroid Build Coastguard Worker * have been evaluated in 53-bit precision and the technical reasons
105*c9945492SAndroid Build Coastguard Worker * for rounding up might not apply to either case in cbrtl() since
106*c9945492SAndroid Build Coastguard Worker * dt is much more accurate than needed.
107*c9945492SAndroid Build Coastguard Worker */
108*c9945492SAndroid Build Coastguard Worker t = dt + 0x2.0p-46 + 0x1.0p60L - 0x1.0p60;
109*c9945492SAndroid Build Coastguard Worker #endif
110*c9945492SAndroid Build Coastguard Worker
111*c9945492SAndroid Build Coastguard Worker /*
112*c9945492SAndroid Build Coastguard Worker * Final step Newton iteration to 64 or 113 bits with
113*c9945492SAndroid Build Coastguard Worker * error < 0.667 ulps
114*c9945492SAndroid Build Coastguard Worker */
115*c9945492SAndroid Build Coastguard Worker s = t*t; /* t*t is exact */
116*c9945492SAndroid Build Coastguard Worker r = x/s; /* error <= 0.5 ulps; |r| < |t| */
117*c9945492SAndroid Build Coastguard Worker w = t+t; /* t+t is exact */
118*c9945492SAndroid Build Coastguard Worker r = (r-t)/(w+r); /* r-t is exact; w+r ~= 3*t */
119*c9945492SAndroid Build Coastguard Worker t = t+t*r; /* error <= 0.5 + 0.5/3 + epsilon */
120*c9945492SAndroid Build Coastguard Worker
121*c9945492SAndroid Build Coastguard Worker t *= v.f;
122*c9945492SAndroid Build Coastguard Worker return t;
123*c9945492SAndroid Build Coastguard Worker }
#endif