math/test/ulp.h

/*
 * Generic functions for ULP error estimation.
 *
 * Copyright (c) 2019-2024, Arm Limited.
 * SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception
 */
*412f47f9SXin Li
/* For each different math function type,
   T(x) should add a different suffix to x.
   RT(x) should add a return type specific suffix to x.  */
*412f47f9SXin Li
*412f47f9SXin Li#ifdef NEW_RT
*412f47f9SXin Li#undef NEW_RT
*412f47f9SXin Li
# if USE_MPFR
/* Scaling exponent used to express errors in ULPs of the RT result format
   for the MPFR value x.
   - zero:     RT(emin) - 1
   - infinity: RT(emax) - RT(prec)
   - NaN:      0
   - regular:  mpfr_get_exp (x) - RT(prec), replaced by RT(emin) - 1 when it
               is below RT(emin) and capped at RT(emax) - RT(prec).
   The argument t is not used by this function.  */
static int RT(ulpscale_mpfr) (mpfr_t x, int t)
{
  if (mpfr_zero_p (x))
    return RT(emin) - 1;
  if (mpfr_inf_p (x))
    return RT(emax) - RT(prec);
  if (!mpfr_regular_p (x))
    /* NaN.  */
    return 0;

  /* TODO: pow of 2 cases.  */
  mpfr_exp_t scale = mpfr_get_exp (x) - RT(prec);
  if (scale < RT(emin))
    scale = RT(emin) - 1;
  if (scale > RT(emax) - RT(prec))
    scale = RT(emax) - RT(prec);
  return scale;
}
# endif
*412f47f9SXin Li
*412f47f9SXin Li/* Difference between exact result and closest real number that
*412f47f9SXin Li   gets rounded to got, i.e. error before rounding, for a correctly
*412f47f9SXin Li   rounded result the difference is 0.  */
*412f47f9SXin Listatic double RT (ulperr) (RT (float) got, const struct RT (ret) * p, int r,
*412f47f9SXin Li			   int ignore_zero_sign)
*412f47f9SXin Li{
*412f47f9SXin Li  RT(float) want = p->y;
*412f47f9SXin Li  RT(float) d;
*412f47f9SXin Li  double e;
*412f47f9SXin Li
*412f47f9SXin Li  if (RT(asuint) (got) == RT(asuint) (want))
*412f47f9SXin Li    return 0.0;
*412f47f9SXin Li  if (isnan (got) && isnan (want))
*412f47f9SXin Li    /* Ignore sign of NaN.  */
*412f47f9SXin Li    return RT (issignaling) (got) == RT (issignaling) (want) ? 0 : INFINITY;
*412f47f9SXin Li  if (signbit (got) != signbit (want))
*412f47f9SXin Li    {
*412f47f9SXin Li      /* Fall through to ULP calculation if ignoring sign of zero and at
*412f47f9SXin Li	 exactly one of want and got is non-zero.  */
*412f47f9SXin Li      if (ignore_zero_sign && want == got)
*412f47f9SXin Li	return 0.0;
*412f47f9SXin Li      if (!ignore_zero_sign || (want != 0 && got != 0))
*412f47f9SXin Li	return INFINITY;
*412f47f9SXin Li    }
*412f47f9SXin Li  if (!isfinite (want) || !isfinite (got))
*412f47f9SXin Li    {
*412f47f9SXin Li      if (isnan (got) != isnan (want))
*412f47f9SXin Li	return INFINITY;
*412f47f9SXin Li      if (isnan (want))
*412f47f9SXin Li	return 0;
*412f47f9SXin Li      if (isinf (got))
*412f47f9SXin Li	{
*412f47f9SXin Li	  got = RT(copysign) (RT(halfinf), got);
*412f47f9SXin Li	  want *= 0.5f;
*412f47f9SXin Li	}
*412f47f9SXin Li      if (isinf (want))
*412f47f9SXin Li	{
*412f47f9SXin Li	  want = RT(copysign) (RT(halfinf), want);
*412f47f9SXin Li	  got *= 0.5f;
*412f47f9SXin Li	}
*412f47f9SXin Li    }
*412f47f9SXin Li  if (r == FE_TONEAREST)
*412f47f9SXin Li    {
*412f47f9SXin Li      // TODO: incorrect when got vs want cross a powof2 boundary
*412f47f9SXin Li      /* error = got > want
*412f47f9SXin Li	      ? got - want - tail ulp - 0.5 ulp
*412f47f9SXin Li	      : got - want - tail ulp + 0.5 ulp.  */
*412f47f9SXin Li      d = got - want;
*412f47f9SXin Li      e = d > 0 ? -p->tail - 0.5 : -p->tail + 0.5;
*412f47f9SXin Li    }
*412f47f9SXin Li  else
*412f47f9SXin Li    {
*412f47f9SXin Li      if ((r == FE_DOWNWARD && got < want) || (r == FE_UPWARD && got > want)
*412f47f9SXin Li	  || (r == FE_TOWARDZERO && fabs (got) < fabs (want)))
*412f47f9SXin Li	got = RT(nextafter) (got, want);
*412f47f9SXin Li      d = got - want;
*412f47f9SXin Li      e = -p->tail;
*412f47f9SXin Li    }
*412f47f9SXin Li  return RT(scalbn) (d, -p->ulpexp) + e;
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Listatic int RT(isok) (RT(float) ygot, int exgot, RT(float) ywant, int exwant,
*412f47f9SXin Li		      int exmay)
*412f47f9SXin Li{
*412f47f9SXin Li  return RT(asuint) (ygot) == RT(asuint) (ywant)
*412f47f9SXin Li	 && ((exgot ^ exwant) & ~exmay) == 0;
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Listatic int RT(isok_nofenv) (RT(float) ygot, RT(float) ywant)
*412f47f9SXin Li{
*412f47f9SXin Li  return RT(asuint) (ygot) == RT(asuint) (ywant);
*412f47f9SXin Li}
*412f47f9SXin Li#endif
*412f47f9SXin Li
*412f47f9SXin Listatic inline void T (call_fenv) (const struct fun *f, struct T (args) a,
*412f47f9SXin Li				  int r, RT (float) * y, int *ex,
*412f47f9SXin Li				  const struct conf *conf)
*412f47f9SXin Li{
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (r);
*412f47f9SXin Li  feclearexcept (FE_ALL_EXCEPT);
*412f47f9SXin Li  *y = T (call) (f, a, conf);
*412f47f9SXin Li  *ex = fetestexcept (FE_ALL_EXCEPT);
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (FE_TONEAREST);
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Listatic inline void T (call_nofenv) (const struct fun *f, struct T (args) a,
*412f47f9SXin Li				    int r, RT (float) * y, int *ex,
*412f47f9SXin Li				    const struct conf *conf)
*412f47f9SXin Li{
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (r);
*412f47f9SXin Li  *y = T (call) (f, a, conf);
*412f47f9SXin Li  *ex = 0;
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (FE_TONEAREST);
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Listatic inline int T (call_long_fenv) (const struct fun *f, struct T (args) a,
*412f47f9SXin Li				      int r, struct RT (ret) * p,
*412f47f9SXin Li				      RT (float) ygot, int exgot)
*412f47f9SXin Li{
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (r);
*412f47f9SXin Li  feclearexcept (FE_ALL_EXCEPT);
*412f47f9SXin Li  volatile struct T(args) va = a; // TODO: barrier
*412f47f9SXin Li  a = va;
*412f47f9SXin Li  RT(double) yl = T(call_long) (f, a);
*412f47f9SXin Li  p->y = (RT(float)) yl;
*412f47f9SXin Li  volatile RT(float) vy = p->y; // TODO: barrier
*412f47f9SXin Li  (void) vy;
*412f47f9SXin Li  p->ex = fetestexcept (FE_ALL_EXCEPT);
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (FE_TONEAREST);
*412f47f9SXin Li  p->ex_may = FE_INEXACT;
*412f47f9SXin Li  if (RT(isok) (ygot, exgot, p->y, p->ex, p->ex_may))
*412f47f9SXin Li    return 1;
*412f47f9SXin Li  p->ulpexp = RT(ulpscale) (p->y);
*412f47f9SXin Li  if (isinf (p->y))
*412f47f9SXin Li    p->tail = RT(lscalbn) (yl - (RT(double)) 2 * RT(halfinf), -p->ulpexp);
*412f47f9SXin Li  else
*412f47f9SXin Li    p->tail = RT(lscalbn) (yl - p->y, -p->ulpexp);
*412f47f9SXin Li  if (RT(fabs) (p->y) < RT(min_normal))
*412f47f9SXin Li    {
*412f47f9SXin Li      /* TODO: subnormal result is treated as undeflow even if it's
*412f47f9SXin Li	 exact since call_long may not raise inexact correctly.  */
*412f47f9SXin Li      if (p->y != 0 || (p->ex & FE_INEXACT))
*412f47f9SXin Li	p->ex |= FE_UNDERFLOW | FE_INEXACT;
*412f47f9SXin Li    }
*412f47f9SXin Li  return 0;
*412f47f9SXin Li}
*412f47f9SXin Listatic inline int T(call_long_nofenv) (const struct fun *f, struct T(args) a,
*412f47f9SXin Li					int r, struct RT(ret) * p,
*412f47f9SXin Li					RT(float) ygot, int exgot)
*412f47f9SXin Li{
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (r);
*412f47f9SXin Li  RT(double) yl = T(call_long) (f, a);
*412f47f9SXin Li  p->y = (RT(float)) yl;
*412f47f9SXin Li  if (r != FE_TONEAREST)
*412f47f9SXin Li    fesetround (FE_TONEAREST);
*412f47f9SXin Li  if (RT(isok_nofenv) (ygot, p->y))
*412f47f9SXin Li    return 1;
*412f47f9SXin Li  p->ulpexp = RT(ulpscale) (p->y);
*412f47f9SXin Li  if (isinf (p->y))
*412f47f9SXin Li    p->tail = RT(lscalbn) (yl - (RT(double)) 2 * RT(halfinf), -p->ulpexp);
*412f47f9SXin Li  else
*412f47f9SXin Li    p->tail = RT(lscalbn) (yl - p->y, -p->ulpexp);
*412f47f9SXin Li  return 0;
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Li/* There are nan input args and all quiet.  */
*412f47f9SXin Listatic inline int T(qnanpropagation) (struct T(args) a)
*412f47f9SXin Li{
*412f47f9SXin Li  return T(reduce) (a, isnan, ||) && !T(reduce) (a, RT(issignaling), ||);
*412f47f9SXin Li}
*412f47f9SXin Listatic inline RT(float) T(sum) (struct T(args) a)
*412f47f9SXin Li{
*412f47f9SXin Li  return T(reduce) (a, , +);
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Li/* returns 1 if the got result is ok.  */
*412f47f9SXin Listatic inline int T(call_mpfr_fix) (const struct fun *f, struct T(args) a,
*412f47f9SXin Li				     int r_fenv, struct RT(ret) * p,
*412f47f9SXin Li				     RT(float) ygot, int exgot)
*412f47f9SXin Li{
*412f47f9SXin Li#if USE_MPFR
*412f47f9SXin Li  int t, t2;
*412f47f9SXin Li  mpfr_rnd_t r = rmap (r_fenv);
*412f47f9SXin Li  MPFR_DECL_INIT(my, RT(prec_mpfr));
*412f47f9SXin Li  MPFR_DECL_INIT(mr, RT(prec));
*412f47f9SXin Li  MPFR_DECL_INIT(me, RT(prec_mpfr));
*412f47f9SXin Li  mpfr_clear_flags ();
*412f47f9SXin Li  t = T(call_mpfr) (my, f, a, r);
*412f47f9SXin Li  /* Double rounding.  */
*412f47f9SXin Li  t2 = mpfr_set (mr, my, r);
*412f47f9SXin Li  if (t2)
*412f47f9SXin Li    t = t2;
*412f47f9SXin Li  mpfr_set_emin (RT(emin));
*412f47f9SXin Li  mpfr_set_emax (RT(emax));
*412f47f9SXin Li  t = mpfr_check_range (mr, t, r);
*412f47f9SXin Li  t = mpfr_subnormalize (mr, t, r);
*412f47f9SXin Li  mpfr_set_emax (MPFR_EMAX_DEFAULT);
*412f47f9SXin Li  mpfr_set_emin (MPFR_EMIN_DEFAULT);
*412f47f9SXin Li  p->y = mpfr_get_d (mr, r);
*412f47f9SXin Li  p->ex = t ? FE_INEXACT : 0;
*412f47f9SXin Li  p->ex_may = FE_INEXACT;
*412f47f9SXin Li  if (mpfr_underflow_p () && (p->ex & FE_INEXACT))
*412f47f9SXin Li    /* TODO: handle before and after rounding uflow cases.  */
*412f47f9SXin Li    p->ex |= FE_UNDERFLOW;
*412f47f9SXin Li  if (mpfr_overflow_p ())
*412f47f9SXin Li    p->ex |= FE_OVERFLOW | FE_INEXACT;
*412f47f9SXin Li  if (mpfr_divby0_p ())
*412f47f9SXin Li    p->ex |= FE_DIVBYZERO;
*412f47f9SXin Li  //if (mpfr_erangeflag_p ())
*412f47f9SXin Li  //  p->ex |= FE_INVALID;
*412f47f9SXin Li  if (!mpfr_nanflag_p () && RT(isok) (ygot, exgot, p->y, p->ex, p->ex_may))
*412f47f9SXin Li    return 1;
*412f47f9SXin Li  if (mpfr_nanflag_p () && !T(qnanpropagation) (a))
*412f47f9SXin Li    p->ex |= FE_INVALID;
*412f47f9SXin Li  p->ulpexp = RT(ulpscale_mpfr) (my, t);
*412f47f9SXin Li  if (!isfinite (p->y))
*412f47f9SXin Li    {
*412f47f9SXin Li      p->tail = 0;
*412f47f9SXin Li      if (isnan (p->y))
*412f47f9SXin Li	{
*412f47f9SXin Li	  /* If an input was nan keep its sign.  */
*412f47f9SXin Li	  p->y = T(sum) (a);
*412f47f9SXin Li	  if (!isnan (p->y))
*412f47f9SXin Li	    p->y = (p->y - p->y) / (p->y - p->y);
*412f47f9SXin Li	  return RT(isok) (ygot, exgot, p->y, p->ex, p->ex_may);
*412f47f9SXin Li	}
*412f47f9SXin Li      mpfr_set_si_2exp (mr, signbit (p->y) ? -1 : 1, 1024, MPFR_RNDN);
*412f47f9SXin Li      if (mpfr_cmpabs (my, mr) >= 0)
*412f47f9SXin Li	return RT(isok) (ygot, exgot, p->y, p->ex, p->ex_may);
*412f47f9SXin Li    }
*412f47f9SXin Li  mpfr_sub (me, my, mr, MPFR_RNDN);
*412f47f9SXin Li  mpfr_mul_2si (me, me, -p->ulpexp, MPFR_RNDN);
*412f47f9SXin Li  p->tail = mpfr_get_d (me, MPFR_RNDN);
*412f47f9SXin Li  return 0;
*412f47f9SXin Li#else
*412f47f9SXin Li  abort ();
*412f47f9SXin Li#endif
*412f47f9SXin Li}
*412f47f9SXin Li
*412f47f9SXin Listatic int T(cmp) (const struct fun *f, struct gen *gen,
*412f47f9SXin Li		     const struct conf *conf)
*412f47f9SXin Li{
*412f47f9SXin Li  double maxerr = 0;
*412f47f9SXin Li  uint64_t cnt = 0;
*412f47f9SXin Li  uint64_t cnt1 = 0;
*412f47f9SXin Li  uint64_t cnt2 = 0;
*412f47f9SXin Li  uint64_t cntfail = 0;
*412f47f9SXin Li  int r = conf->r;
*412f47f9SXin Li  int use_mpfr = conf->mpfr;
*412f47f9SXin Li  int fenv = conf->fenv;
*412f47f9SXin Li
*412f47f9SXin Li  for (;;)
*412f47f9SXin Li    {
*412f47f9SXin Li      struct RT(ret) want;
*412f47f9SXin Li      struct T(args) a = T(next) (gen);
*412f47f9SXin Li      int exgot;
*412f47f9SXin Li      int exgot2;
*412f47f9SXin Li      RT(float) ygot;
*412f47f9SXin Li      RT(float) ygot2;
*412f47f9SXin Li      int fail = 0;
*412f47f9SXin Li      if (fenv)
*412f47f9SXin Li	T (call_fenv) (f, a, r, &ygot, &exgot, conf);
*412f47f9SXin Li      else
*412f47f9SXin Li	T (call_nofenv) (f, a, r, &ygot, &exgot, conf);
*412f47f9SXin Li      if (f->twice) {
*412f47f9SXin Li	secondcall = 1;
*412f47f9SXin Li	if (fenv)
*412f47f9SXin Li	  T (call_fenv) (f, a, r, &ygot2, &exgot2, conf);
*412f47f9SXin Li	else
*412f47f9SXin Li	  T (call_nofenv) (f, a, r, &ygot2, &exgot2, conf);
*412f47f9SXin Li	secondcall = 0;
*412f47f9SXin Li	if (RT(asuint) (ygot) != RT(asuint) (ygot2))
*412f47f9SXin Li	  {
*412f47f9SXin Li	    fail = 1;
*412f47f9SXin Li	    cntfail++;
*412f47f9SXin Li	    T(printcall) (f, a);
*412f47f9SXin Li	    printf (" got %a then %a for same input\n", ygot, ygot2);
*412f47f9SXin Li	  }
*412f47f9SXin Li      }
*412f47f9SXin Li      cnt++;
*412f47f9SXin Li      int ok = use_mpfr
*412f47f9SXin Li		 ? T(call_mpfr_fix) (f, a, r, &want, ygot, exgot)
*412f47f9SXin Li		 : (fenv ? T(call_long_fenv) (f, a, r, &want, ygot, exgot)
*412f47f9SXin Li			 : T(call_long_nofenv) (f, a, r, &want, ygot, exgot));
*412f47f9SXin Li      if (!ok)
*412f47f9SXin Li	{
*412f47f9SXin Li	  int print = 0;
*412f47f9SXin Li	  double err = RT (ulperr) (ygot, &want, r, conf->ignore_zero_sign);
*412f47f9SXin Li	  double abserr = fabs (err);
*412f47f9SXin Li	  // TODO: count errors below accuracy limit.
*412f47f9SXin Li	  if (abserr > 0)
*412f47f9SXin Li	    cnt1++;
*412f47f9SXin Li	  if (abserr > 1)
*412f47f9SXin Li	    cnt2++;
*412f47f9SXin Li	  if (abserr > conf->errlim)
*412f47f9SXin Li	    {
*412f47f9SXin Li	      print = 1;
*412f47f9SXin Li	      if (!fail)
*412f47f9SXin Li		{
*412f47f9SXin Li		  fail = 1;
*412f47f9SXin Li		  cntfail++;
*412f47f9SXin Li		}
*412f47f9SXin Li	    }
*412f47f9SXin Li	  if (abserr > maxerr)
*412f47f9SXin Li	    {
*412f47f9SXin Li	      maxerr = abserr;
*412f47f9SXin Li	      if (!conf->quiet && abserr > conf->softlim)
*412f47f9SXin Li		print = 1;
*412f47f9SXin Li	    }
*412f47f9SXin Li	  if (print)
*412f47f9SXin Li	    {
*412f47f9SXin Li	      T(printcall) (f, a);
*412f47f9SXin Li	      // TODO: inf ulp handling
*412f47f9SXin Li	      printf (" got %a want %a %+g ulp err %g\n", ygot, want.y,
*412f47f9SXin Li		      want.tail, err);
*412f47f9SXin Li	    }
*412f47f9SXin Li	  int diff = fenv ? exgot ^ want.ex : 0;
*412f47f9SXin Li	  if (fenv && (diff & ~want.ex_may))
*412f47f9SXin Li	    {
*412f47f9SXin Li	      if (!fail)
*412f47f9SXin Li		{
*412f47f9SXin Li		  fail = 1;
*412f47f9SXin Li		  cntfail++;
*412f47f9SXin Li		}
*412f47f9SXin Li	      T(printcall) (f, a);
*412f47f9SXin Li	      printf (" is %a %+g ulp, got except 0x%0x", want.y, want.tail,
*412f47f9SXin Li		      exgot);
*412f47f9SXin Li	      if (diff & exgot)
*412f47f9SXin Li		printf (" wrongly set: 0x%x", diff & exgot);
*412f47f9SXin Li	      if (diff & ~exgot)
*412f47f9SXin Li		printf (" wrongly clear: 0x%x", diff & ~exgot);
*412f47f9SXin Li	      putchar ('\n');
*412f47f9SXin Li	    }
*412f47f9SXin Li	}
*412f47f9SXin Li      if (cnt >= conf->n)
*412f47f9SXin Li	break;
*412f47f9SXin Li      if (!conf->quiet && cnt % 0x100000 == 0)
*412f47f9SXin Li	printf ("progress: %6.3f%% cnt %llu cnt1 %llu cnt2 %llu cntfail %llu "
*412f47f9SXin Li		"maxerr %g\n",
*412f47f9SXin Li		100.0 * cnt / conf->n, (unsigned long long) cnt,
*412f47f9SXin Li		(unsigned long long) cnt1, (unsigned long long) cnt2,
*412f47f9SXin Li		(unsigned long long) cntfail, maxerr);
*412f47f9SXin Li    }
*412f47f9SXin Li  double cc = cnt;
*412f47f9SXin Li  if (cntfail)
*412f47f9SXin Li    printf ("FAIL ");
*412f47f9SXin Li  else
*412f47f9SXin Li    printf ("PASS ");
*412f47f9SXin Li  T(printgen) (f, gen);
*412f47f9SXin Li  printf (" round %c errlim %g maxerr %g %s cnt %llu cnt1 %llu %g%% cnt2 %llu "
*412f47f9SXin Li	  "%g%% cntfail %llu %g%%\n",
*412f47f9SXin Li	  conf->rc, conf->errlim,
*412f47f9SXin Li	  maxerr, conf->r == FE_TONEAREST ? "+0.5" : "+1.0",
*412f47f9SXin Li	  (unsigned long long) cnt,
*412f47f9SXin Li	  (unsigned long long) cnt1, 100.0 * cnt1 / cc,
*412f47f9SXin Li	  (unsigned long long) cnt2, 100.0 * cnt2 / cc,
*412f47f9SXin Li	  (unsigned long long) cntfail, 100.0 * cntfail / cc);
*412f47f9SXin Li  return !!cntfail;
*412f47f9SXin Li}