xref: /aosp_15_r20/external/arm-optimized-routines/math/cosf.c (revision 412f47f9e737e10ed5cc46ec6a8d7fa2264f8a14)
/*
 * Single-precision cos function.
 *
 * Copyright (c) 2018-2021, Arm Limited.
 * SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception
 */
7*412f47f9SXin Li 
8*412f47f9SXin Li #include <stdint.h>
9*412f47f9SXin Li #include <math.h>
10*412f47f9SXin Li #include "math_config.h"
11*412f47f9SXin Li #include "sincosf.h"
12*412f47f9SXin Li 
13*412f47f9SXin Li /* Fast cosf implementation.  Worst-case ULP is 0.5607, maximum relative
14*412f47f9SXin Li    error is 0.5303 * 2^-23.  A single-step range reduction is used for
15*412f47f9SXin Li    small values.  Large inputs have their range reduced using fast integer
16*412f47f9SXin Li    arithmetic.  */
17*412f47f9SXin Li float
cosf(float y)18*412f47f9SXin Li cosf (float y)
19*412f47f9SXin Li {
20*412f47f9SXin Li   double x = y;
21*412f47f9SXin Li   double s;
22*412f47f9SXin Li   int n;
23*412f47f9SXin Li   const sincos_t *p = &__sincosf_table[0];
24*412f47f9SXin Li 
25*412f47f9SXin Li   if (abstop12 (y) < abstop12 (pio4f))
26*412f47f9SXin Li     {
27*412f47f9SXin Li       double x2 = x * x;
28*412f47f9SXin Li 
29*412f47f9SXin Li       if (unlikely (abstop12 (y) < abstop12 (0x1p-12f)))
30*412f47f9SXin Li 	return 1.0f;
31*412f47f9SXin Li 
32*412f47f9SXin Li       return sinf_poly (x, x2, p, 1);
33*412f47f9SXin Li     }
34*412f47f9SXin Li   else if (likely (abstop12 (y) < abstop12 (120.0f)))
35*412f47f9SXin Li     {
36*412f47f9SXin Li       x = reduce_fast (x, p, &n);
37*412f47f9SXin Li 
38*412f47f9SXin Li       /* Setup the signs for sin and cos.  */
39*412f47f9SXin Li       s = p->sign[n & 3];
40*412f47f9SXin Li 
41*412f47f9SXin Li       if (n & 2)
42*412f47f9SXin Li 	p = &__sincosf_table[1];
43*412f47f9SXin Li 
44*412f47f9SXin Li       return sinf_poly (x * s, x * x, p, n ^ 1);
45*412f47f9SXin Li     }
46*412f47f9SXin Li   else if (abstop12 (y) < abstop12 (INFINITY))
47*412f47f9SXin Li     {
48*412f47f9SXin Li       uint32_t xi = asuint (y);
49*412f47f9SXin Li       int sign = xi >> 31;
50*412f47f9SXin Li 
51*412f47f9SXin Li       x = reduce_large (xi, &n);
52*412f47f9SXin Li 
53*412f47f9SXin Li       /* Setup signs for sin and cos - include original sign.  */
54*412f47f9SXin Li       s = p->sign[(n + sign) & 3];
55*412f47f9SXin Li 
56*412f47f9SXin Li       if ((n + sign) & 2)
57*412f47f9SXin Li 	p = &__sincosf_table[1];
58*412f47f9SXin Li 
59*412f47f9SXin Li       return sinf_poly (x * s, x * x, p, n ^ 1);
60*412f47f9SXin Li     }
61*412f47f9SXin Li   else
62*412f47f9SXin Li     return __math_invalidf (y);
63*412f47f9SXin Li }
64