lib/builtins/fp_mul_impl.inc

//===---- lib/fp_mul_impl.inc - floating point multiplication -----*- C -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is dual licensed under the MIT and the University of Illinois Open
// Source Licenses. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements soft-float multiplication with the IEEE-754 default
// rounding (to nearest, ties to even).
//
//===----------------------------------------------------------------------===//
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot#include "fp_lib.h"
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robotstatic __inline fp_t __mulXf3__(fp_t a, fp_t b) {
*7c3d14c8STreehugger Robot    const unsigned int aExponent = toRep(a) >> significandBits & maxExponent;
*7c3d14c8STreehugger Robot    const unsigned int bExponent = toRep(b) >> significandBits & maxExponent;
*7c3d14c8STreehugger Robot    const rep_t productSign = (toRep(a) ^ toRep(b)) & signBit;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    rep_t aSignificand = toRep(a) & significandMask;
*7c3d14c8STreehugger Robot    rep_t bSignificand = toRep(b) & significandMask;
*7c3d14c8STreehugger Robot    int scale = 0;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Detect if a or b is zero, denormal, infinity, or NaN.
*7c3d14c8STreehugger Robot    if (aExponent-1U >= maxExponent-1U || bExponent-1U >= maxExponent-1U) {
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        const rep_t aAbs = toRep(a) & absMask;
*7c3d14c8STreehugger Robot        const rep_t bAbs = toRep(b) & absMask;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // NaN * anything = qNaN
*7c3d14c8STreehugger Robot        if (aAbs > infRep) return fromRep(toRep(a) | quietBit);
*7c3d14c8STreehugger Robot        // anything * NaN = qNaN
*7c3d14c8STreehugger Robot        if (bAbs > infRep) return fromRep(toRep(b) | quietBit);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        if (aAbs == infRep) {
*7c3d14c8STreehugger Robot            // infinity * non-zero = +/- infinity
*7c3d14c8STreehugger Robot            if (bAbs) return fromRep(aAbs | productSign);
*7c3d14c8STreehugger Robot            // infinity * zero = NaN
*7c3d14c8STreehugger Robot            else return fromRep(qnanRep);
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        if (bAbs == infRep) {
*7c3d14c8STreehugger Robot            //? non-zero * infinity = +/- infinity
*7c3d14c8STreehugger Robot            if (aAbs) return fromRep(bAbs | productSign);
*7c3d14c8STreehugger Robot            // zero * infinity = NaN
*7c3d14c8STreehugger Robot            else return fromRep(qnanRep);
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // zero * anything = +/- zero
*7c3d14c8STreehugger Robot        if (!aAbs) return fromRep(productSign);
*7c3d14c8STreehugger Robot        // anything * zero = +/- zero
*7c3d14c8STreehugger Robot        if (!bAbs) return fromRep(productSign);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // one or both of a or b is denormal, the other (if applicable) is a
*7c3d14c8STreehugger Robot        // normal number.  Renormalize one or both of a and b, and set scale to
*7c3d14c8STreehugger Robot        // include the necessary exponent adjustment.
*7c3d14c8STreehugger Robot        if (aAbs < implicitBit) scale += normalize(&aSignificand);
*7c3d14c8STreehugger Robot        if (bAbs < implicitBit) scale += normalize(&bSignificand);
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Or in the implicit significand bit.  (If we fell through from the
*7c3d14c8STreehugger Robot    // denormal path it was already set by normalize( ), but setting it twice
*7c3d14c8STreehugger Robot    // won't hurt anything.)
*7c3d14c8STreehugger Robot    aSignificand |= implicitBit;
*7c3d14c8STreehugger Robot    bSignificand |= implicitBit;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Get the significand of a*b.  Before multiplying the significands, shift
*7c3d14c8STreehugger Robot    // one of them left to left-align it in the field.  Thus, the product will
*7c3d14c8STreehugger Robot    // have (exponentBits + 2) integral digits, all but two of which must be
*7c3d14c8STreehugger Robot    // zero.  Normalizing this result is just a conditional left-shift by one
*7c3d14c8STreehugger Robot    // and bumping the exponent accordingly.
*7c3d14c8STreehugger Robot    rep_t productHi, productLo;
*7c3d14c8STreehugger Robot    wideMultiply(aSignificand, bSignificand << exponentBits,
*7c3d14c8STreehugger Robot                 &productHi, &productLo);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    int productExponent = aExponent + bExponent - exponentBias + scale;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Normalize the significand, adjust exponent if needed.
*7c3d14c8STreehugger Robot    if (productHi & implicitBit) productExponent++;
*7c3d14c8STreehugger Robot    else wideLeftShift(&productHi, &productLo, 1);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // If we have overflowed the type, return +/- infinity.
*7c3d14c8STreehugger Robot    if (productExponent >= maxExponent) return fromRep(infRep | productSign);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    if (productExponent <= 0) {
*7c3d14c8STreehugger Robot        // Result is denormal before rounding
*7c3d14c8STreehugger Robot        //
*7c3d14c8STreehugger Robot        // If the result is so small that it just underflows to zero, return
*7c3d14c8STreehugger Robot        // a zero of the appropriate sign.  Mathematically there is no need to
*7c3d14c8STreehugger Robot        // handle this case separately, but we make it a special case to
*7c3d14c8STreehugger Robot        // simplify the shift logic.
*7c3d14c8STreehugger Robot        const unsigned int shift = REP_C(1) - (unsigned int)productExponent;
*7c3d14c8STreehugger Robot        if (shift >= typeWidth) return fromRep(productSign);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // Otherwise, shift the significand of the result so that the round
*7c3d14c8STreehugger Robot        // bit is the high bit of productLo.
*7c3d14c8STreehugger Robot        wideRightShiftWithSticky(&productHi, &productLo, shift);
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot    else {
*7c3d14c8STreehugger Robot        // Result is normal before rounding; insert the exponent.
*7c3d14c8STreehugger Robot        productHi &= significandMask;
*7c3d14c8STreehugger Robot        productHi |= (rep_t)productExponent << significandBits;
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Insert the sign of the result:
*7c3d14c8STreehugger Robot    productHi |= productSign;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Final rounding.  The final result may overflow to infinity, or underflow
*7c3d14c8STreehugger Robot    // to zero, but those are the correct results in those cases.  We use the
*7c3d14c8STreehugger Robot    // default IEEE-754 round-to-nearest, ties-to-even rounding mode.
*7c3d14c8STreehugger Robot    if (productLo > signBit) productHi++;
*7c3d14c8STreehugger Robot    if (productLo == signBit) productHi += productHi & 1;
*7c3d14c8STreehugger Robot    return fromRep(productHi);
*7c3d14c8STreehugger Robot}