pl/math/sinhf_2u3.c

*412f47f9SXin Li/*
*412f47f9SXin Li * Single-precision sinh(x) function.
*412f47f9SXin Li *
*412f47f9SXin Li * Copyright (c) 2022-2023, Arm Limited.
*412f47f9SXin Li * SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception
*412f47f9SXin Li */
*412f47f9SXin Li
*412f47f9SXin Li#include "math_config.h"
*412f47f9SXin Li#include "pl_sig.h"
*412f47f9SXin Li#include "pl_test.h"
*412f47f9SXin Li
/* Bit patterns of single-precision values.  They are compared against the
   integer representation of the input rather than against float values.  */

/* Mask that clears the sign bit, leaving the bits of |x|.  */
#define AbsMask 0x7fffffff
/* Bits of 0.5f.  */
#define Half 0x3f000000
/* Bits of 0x1.62e43p+6 (2^7 * ln2), the minimum value for which expm1f
   overflows.  */
#define Expm1OFlowLimit 0x42b17218
/* Bits of 0x1.65a9fap+6, the minimum positive value for which sinhf should
   overflow.  */
#define OFlowLimit 0x42b2d4fd
*412f47f9SXin Li
/* Exponential helper called by sinhf for inputs too large for expm1f.
   Only the declaration is visible here; the definition lives elsewhere.
   NOTE(review): presumably the library's single-precision exp routine -
   confirm against the build.  */
float
optr_aor_exp_f32 (float x);
*412f47f9SXin Li
*412f47f9SXin Li/* Approximation for single-precision sinh(x) using expm1.
*412f47f9SXin Li   sinh(x) = (exp(x) - exp(-x)) / 2.
*412f47f9SXin Li   The maximum error is 2.26 ULP:
*412f47f9SXin Li   sinhf(0x1.e34a9ep-4) got 0x1.e469ep-4 want 0x1.e469e4p-4.  */
*412f47f9SXin Lifloat
*412f47f9SXin Lisinhf (float x)
*412f47f9SXin Li{
*412f47f9SXin Li  uint32_t ix = asuint (x);
*412f47f9SXin Li  uint32_t iax = ix & AbsMask;
*412f47f9SXin Li  float ax = asfloat (iax);
*412f47f9SXin Li  uint32_t sign = ix & ~AbsMask;
*412f47f9SXin Li  float halfsign = asfloat (Half | sign);
*412f47f9SXin Li
*412f47f9SXin Li  if (unlikely (iax >= Expm1OFlowLimit))
*412f47f9SXin Li    {
*412f47f9SXin Li      /* Special values and overflow.  */
*412f47f9SXin Li      if (iax >= 0x7fc00001 || iax == 0x7f800000)
*412f47f9SXin Li	return x;
*412f47f9SXin Li      if (iax >= 0x7f800000)
*412f47f9SXin Li	return __math_invalidf (x);
*412f47f9SXin Li      if (iax >= OFlowLimit)
*412f47f9SXin Li	return __math_oflowf (sign);
*412f47f9SXin Li
*412f47f9SXin Li      /* expm1f overflows a little before sinhf, (~88.7 vs ~89.4). We have to
*412f47f9SXin Li	 fill this gap by using a different algorithm, in this case we use a
*412f47f9SXin Li	 double-precision exp helper. For large x sinh(x) dominated by exp(x),
*412f47f9SXin Li	 however we cannot compute exp without overflow either. We use the
*412f47f9SXin Li	 identity:
*412f47f9SXin Li	 exp(a) = (exp(a / 2)) ^ 2.
*412f47f9SXin Li	 to compute sinh(x) ~= (exp(|x| / 2)) ^ 2 / 2    for x > 0
*412f47f9SXin Li			    ~= (exp(|x| / 2)) ^ 2 / -2   for x < 0.
*412f47f9SXin Li	 Greatest error in this region is 1.89 ULP:
*412f47f9SXin Li	 sinhf(0x1.65898cp+6) got 0x1.f00aep+127  want 0x1.f00adcp+127.  */
*412f47f9SXin Li      float e = optr_aor_exp_f32 (ax / 2);
*412f47f9SXin Li      return (e * halfsign) * e;
*412f47f9SXin Li    }
*412f47f9SXin Li
*412f47f9SXin Li  /* Use expm1f to retain acceptable precision for small numbers.
*412f47f9SXin Li     Let t = e^(|x|) - 1.  */
*412f47f9SXin Li  float t = expm1f (ax);
*412f47f9SXin Li  /* Then sinh(x) = (t + t / (t + 1)) / 2   for x > 0
*412f47f9SXin Li		    (t + t / (t + 1)) / -2  for x < 0.  */
*412f47f9SXin Li  return (t + t / (t + 1)) * halfsign;
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin LiPL_SIG (S, F, 1, sinh, -10.0, 10.0)
*412f47f9SXin LiPL_TEST_ULP (sinhf, 1.76)
*412f47f9SXin LiPL_TEST_SYM_INTERVAL (sinhf, 0, 0x1.62e43p+6, 100000)
*412f47f9SXin LiPL_TEST_SYM_INTERVAL (sinhf, 0x1.62e43p+6, 0x1.65a9fap+6, 100)
*412f47f9SXin LiPL_TEST_SYM_INTERVAL (sinhf, 0x1.65a9fap+6, inf, 100)