1*7c3d14c8STreehugger Robot /* This file is distributed under the University of Illinois Open Source
2*7c3d14c8STreehugger Robot * License. See LICENSE.TXT for details.
3*7c3d14c8STreehugger Robot */
4*7c3d14c8STreehugger Robot
/* long double __gcc_qsub(long double x, long double y);
 * This file implements the PowerPC 128-bit double-double subtract operation
 * (x - y, computed as x + (-y)).
 * This implementation is shamelessly cribbed from Apple's DDRT, circa 1993(!)
 */
9*7c3d14c8STreehugger Robot
10*7c3d14c8STreehugger Robot #include "DD.h"
11*7c3d14c8STreehugger Robot
__gcc_qsub(long double x,long double y)12*7c3d14c8STreehugger Robot long double __gcc_qsub(long double x, long double y)
13*7c3d14c8STreehugger Robot {
14*7c3d14c8STreehugger Robot static const uint32_t infinityHi = UINT32_C(0x7ff00000);
15*7c3d14c8STreehugger Robot
16*7c3d14c8STreehugger Robot DD dst = { .ld = x }, src = { .ld = y };
17*7c3d14c8STreehugger Robot
18*7c3d14c8STreehugger Robot register double A = dst.s.hi, a = dst.s.lo,
19*7c3d14c8STreehugger Robot B = -src.s.hi, b = -src.s.lo;
20*7c3d14c8STreehugger Robot
21*7c3d14c8STreehugger Robot /* If both operands are zero: */
22*7c3d14c8STreehugger Robot if ((A == 0.0) && (B == 0.0)) {
23*7c3d14c8STreehugger Robot dst.s.hi = A + B;
24*7c3d14c8STreehugger Robot dst.s.lo = 0.0;
25*7c3d14c8STreehugger Robot return dst.ld;
26*7c3d14c8STreehugger Robot }
27*7c3d14c8STreehugger Robot
28*7c3d14c8STreehugger Robot /* If either operand is NaN or infinity: */
29*7c3d14c8STreehugger Robot const doublebits abits = { .d = A };
30*7c3d14c8STreehugger Robot const doublebits bbits = { .d = B };
31*7c3d14c8STreehugger Robot if ((((uint32_t)(abits.x >> 32) & infinityHi) == infinityHi) ||
32*7c3d14c8STreehugger Robot (((uint32_t)(bbits.x >> 32) & infinityHi) == infinityHi)) {
33*7c3d14c8STreehugger Robot dst.s.hi = A + B;
34*7c3d14c8STreehugger Robot dst.s.lo = 0.0;
35*7c3d14c8STreehugger Robot return dst.ld;
36*7c3d14c8STreehugger Robot }
37*7c3d14c8STreehugger Robot
38*7c3d14c8STreehugger Robot /* If the computation overflows: */
39*7c3d14c8STreehugger Robot /* This may be playing things a little bit fast and loose, but it will do for a start. */
40*7c3d14c8STreehugger Robot const double testForOverflow = A + (B + (a + b));
41*7c3d14c8STreehugger Robot const doublebits testbits = { .d = testForOverflow };
42*7c3d14c8STreehugger Robot if (((uint32_t)(testbits.x >> 32) & infinityHi) == infinityHi) {
43*7c3d14c8STreehugger Robot dst.s.hi = testForOverflow;
44*7c3d14c8STreehugger Robot dst.s.lo = 0.0;
45*7c3d14c8STreehugger Robot return dst.ld;
46*7c3d14c8STreehugger Robot }
47*7c3d14c8STreehugger Robot
48*7c3d14c8STreehugger Robot double H, h;
49*7c3d14c8STreehugger Robot double T, t;
50*7c3d14c8STreehugger Robot double W, w;
51*7c3d14c8STreehugger Robot double Y;
52*7c3d14c8STreehugger Robot
53*7c3d14c8STreehugger Robot H = B + (A - (A + B));
54*7c3d14c8STreehugger Robot T = b + (a - (a + b));
55*7c3d14c8STreehugger Robot h = A + (B - (A + B));
56*7c3d14c8STreehugger Robot t = a + (b - (a + b));
57*7c3d14c8STreehugger Robot
58*7c3d14c8STreehugger Robot if (local_fabs(A) <= local_fabs(B))
59*7c3d14c8STreehugger Robot w = (a + b) + h;
60*7c3d14c8STreehugger Robot else
61*7c3d14c8STreehugger Robot w = (a + b) + H;
62*7c3d14c8STreehugger Robot
63*7c3d14c8STreehugger Robot W = (A + B) + w;
64*7c3d14c8STreehugger Robot Y = (A + B) - W;
65*7c3d14c8STreehugger Robot Y += w;
66*7c3d14c8STreehugger Robot
67*7c3d14c8STreehugger Robot if (local_fabs(a) <= local_fabs(b))
68*7c3d14c8STreehugger Robot w = t + Y;
69*7c3d14c8STreehugger Robot else
70*7c3d14c8STreehugger Robot w = T + Y;
71*7c3d14c8STreehugger Robot
72*7c3d14c8STreehugger Robot dst.s.hi = Y = W + w;
73*7c3d14c8STreehugger Robot dst.s.lo = (W - Y) + w;
74*7c3d14c8STreehugger Robot
75*7c3d14c8STreehugger Robot return dst.ld;
76*7c3d14c8STreehugger Robot }
77