#include <stdint.h>
#include <math.h>
#include "libm.h"
#include "sqrt_data.h"

/*
 * When nonzero, sqrtf() finishes by adding a tiny signed value to its
 * result (the `if (FENV_SUPPORT)` branch) to handle rounding and the
 * inexact exception.
 */
#define FENV_SUPPORT 1

/*
 * Return the upper 32 bits of the 64-bit product a*b, i.e.
 * floor(a*b / 2^32).
 *
 * The first operand is widened to 64 bits before the multiplication so
 * the full product is formed without overflow.
 */
static inline uint32_t mul32(uint32_t a, uint32_t b)
{
	return (uint64_t)a*b >> 32;
}

/* see sqrt.c for more detailed comments. */

sqrtf(float x)15*c9945492SAndroid Build Coastguard Worker float sqrtf(float x)
16*c9945492SAndroid Build Coastguard Worker {
17*c9945492SAndroid Build Coastguard Worker uint32_t ix, m, m1, m0, even, ey;
18*c9945492SAndroid Build Coastguard Worker
19*c9945492SAndroid Build Coastguard Worker ix = asuint(x);
20*c9945492SAndroid Build Coastguard Worker if (predict_false(ix - 0x00800000 >= 0x7f800000 - 0x00800000)) {
21*c9945492SAndroid Build Coastguard Worker /* x < 0x1p-126 or inf or nan. */
22*c9945492SAndroid Build Coastguard Worker if (ix * 2 == 0)
23*c9945492SAndroid Build Coastguard Worker return x;
24*c9945492SAndroid Build Coastguard Worker if (ix == 0x7f800000)
25*c9945492SAndroid Build Coastguard Worker return x;
26*c9945492SAndroid Build Coastguard Worker if (ix > 0x7f800000)
27*c9945492SAndroid Build Coastguard Worker return __math_invalidf(x);
28*c9945492SAndroid Build Coastguard Worker /* x is subnormal, normalize it. */
29*c9945492SAndroid Build Coastguard Worker ix = asuint(x * 0x1p23f);
30*c9945492SAndroid Build Coastguard Worker ix -= 23 << 23;
31*c9945492SAndroid Build Coastguard Worker }
32*c9945492SAndroid Build Coastguard Worker
33*c9945492SAndroid Build Coastguard Worker /* x = 4^e m; with int e and m in [1, 4). */
34*c9945492SAndroid Build Coastguard Worker even = ix & 0x00800000;
35*c9945492SAndroid Build Coastguard Worker m1 = (ix << 8) | 0x80000000;
36*c9945492SAndroid Build Coastguard Worker m0 = (ix << 7) & 0x7fffffff;
37*c9945492SAndroid Build Coastguard Worker m = even ? m0 : m1;
38*c9945492SAndroid Build Coastguard Worker
39*c9945492SAndroid Build Coastguard Worker /* 2^e is the exponent part of the return value. */
40*c9945492SAndroid Build Coastguard Worker ey = ix >> 1;
41*c9945492SAndroid Build Coastguard Worker ey += 0x3f800000 >> 1;
42*c9945492SAndroid Build Coastguard Worker ey &= 0x7f800000;
43*c9945492SAndroid Build Coastguard Worker
44*c9945492SAndroid Build Coastguard Worker /* compute r ~ 1/sqrt(m), s ~ sqrt(m) with 2 goldschmidt iterations. */
45*c9945492SAndroid Build Coastguard Worker static const uint32_t three = 0xc0000000;
46*c9945492SAndroid Build Coastguard Worker uint32_t r, s, d, u, i;
47*c9945492SAndroid Build Coastguard Worker i = (ix >> 17) % 128;
48*c9945492SAndroid Build Coastguard Worker r = (uint32_t)__rsqrt_tab[i] << 16;
49*c9945492SAndroid Build Coastguard Worker /* |r*sqrt(m) - 1| < 0x1p-8 */
50*c9945492SAndroid Build Coastguard Worker s = mul32(m, r);
51*c9945492SAndroid Build Coastguard Worker /* |s/sqrt(m) - 1| < 0x1p-8 */
52*c9945492SAndroid Build Coastguard Worker d = mul32(s, r);
53*c9945492SAndroid Build Coastguard Worker u = three - d;
54*c9945492SAndroid Build Coastguard Worker r = mul32(r, u) << 1;
55*c9945492SAndroid Build Coastguard Worker /* |r*sqrt(m) - 1| < 0x1.7bp-16 */
56*c9945492SAndroid Build Coastguard Worker s = mul32(s, u) << 1;
57*c9945492SAndroid Build Coastguard Worker /* |s/sqrt(m) - 1| < 0x1.7bp-16 */
58*c9945492SAndroid Build Coastguard Worker d = mul32(s, r);
59*c9945492SAndroid Build Coastguard Worker u = three - d;
60*c9945492SAndroid Build Coastguard Worker s = mul32(s, u);
61*c9945492SAndroid Build Coastguard Worker /* -0x1.03p-28 < s/sqrt(m) - 1 < 0x1.fp-31 */
62*c9945492SAndroid Build Coastguard Worker s = (s - 1)>>6;
63*c9945492SAndroid Build Coastguard Worker /* s < sqrt(m) < s + 0x1.08p-23 */
64*c9945492SAndroid Build Coastguard Worker
65*c9945492SAndroid Build Coastguard Worker /* compute nearest rounded result. */
66*c9945492SAndroid Build Coastguard Worker uint32_t d0, d1, d2;
67*c9945492SAndroid Build Coastguard Worker float y, t;
68*c9945492SAndroid Build Coastguard Worker d0 = (m << 16) - s*s;
69*c9945492SAndroid Build Coastguard Worker d1 = s - d0;
70*c9945492SAndroid Build Coastguard Worker d2 = d1 + s + 1;
71*c9945492SAndroid Build Coastguard Worker s += d1 >> 31;
72*c9945492SAndroid Build Coastguard Worker s &= 0x007fffff;
73*c9945492SAndroid Build Coastguard Worker s |= ey;
74*c9945492SAndroid Build Coastguard Worker y = asfloat(s);
75*c9945492SAndroid Build Coastguard Worker if (FENV_SUPPORT) {
76*c9945492SAndroid Build Coastguard Worker /* handle rounding and inexact exception. */
77*c9945492SAndroid Build Coastguard Worker uint32_t tiny = predict_false(d2==0) ? 0 : 0x01000000;
78*c9945492SAndroid Build Coastguard Worker tiny |= (d1^d2) & 0x80000000;
79*c9945492SAndroid Build Coastguard Worker t = asfloat(tiny);
80*c9945492SAndroid Build Coastguard Worker y = eval_as_float(y + t);
81*c9945492SAndroid Build Coastguard Worker }
82*c9945492SAndroid Build Coastguard Worker return y;
83*c9945492SAndroid Build Coastguard Worker }
84