compiler-rt/lib/mulsf3.c

//===-- lib/mulsf3.c - Single-precision multiplication ------------*- C -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is dual licensed under the MIT and the University of Illinois Open
// Source Licenses. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements single-precision soft-float multiplication
// with the IEEE-754 default rounding (to nearest, ties to even).
//
//===----------------------------------------------------------------------===//

#define SINGLE_PRECISION
#include "fp_lib.h"

5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)ARM_EABI_FNALIAS(fmul, mulsf3)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)COMPILER_RT_ABI fp_t
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)__mulsf3(fp_t a, fp_t b) {
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    const unsigned int aExponent = toRep(a) >> significandBits & maxExponent;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    const unsigned int bExponent = toRep(b) >> significandBits & maxExponent;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    const rep_t productSign = (toRep(a) ^ toRep(b)) & signBit;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    rep_t aSignificand = toRep(a) & significandMask;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    rep_t bSignificand = toRep(b) & significandMask;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    int scale = 0;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Detect if a or b is zero, denormal, infinity, or NaN.
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    if (aExponent-1U >= maxExponent-1U || bExponent-1U >= maxExponent-1U) {
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        const rep_t aAbs = toRep(a) & absMask;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        const rep_t bAbs = toRep(b) & absMask;
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        // NaN * anything = qNaN
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        if (aAbs > infRep) return fromRep(toRep(a) | quietBit);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        // anything * NaN = qNaN
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        if (bAbs > infRep) return fromRep(toRep(b) | quietBit);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        if (aAbs == infRep) {
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            // infinity * non-zero = +/- infinity
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            if (bAbs) return fromRep(aAbs | productSign);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            // infinity * zero = NaN
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            else return fromRep(qnanRep);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        }
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        if (bAbs == infRep) {
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            // non-zero * infinity = +/- infinity
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            if (aAbs) return fromRep(bAbs | productSign);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            // zero * infinity = NaN
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            else return fromRep(qnanRep);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        }
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        // zero * anything = +/- zero
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        if (!aAbs) return fromRep(productSign);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        // anything * zero = +/- zero
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        if (!bAbs) return fromRep(productSign);
5821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
        // one or both of a or b is denormal, the other (if applicable) is a
        // normal number.  Renormalize one or both of a and b, and set scale to
        // include the necessary exponent adjustment.
        if (aAbs < implicitBit) scale += normalize(&aSignificand);
        if (bAbs < implicitBit) scale += normalize(&bSignificand);
    }

    // Or in the implicit significand bit.  (If we fell through from the
    // denormal path it was already set by normalize( ), but setting it twice
    // won't hurt anything.)
    aSignificand |= implicitBit;
    bSignificand |= implicitBit;

    // Get the significand of a*b.  Before multiplying the significands, shift
    // one of them left to left-align it in the field.  Thus, the product will
    // have (exponentBits + 2) integral digits, all but two of which must be
    // zero.  Normalizing this result is just a conditional left-shift by one
    // and bumping the exponent accordingly.
    rep_t productHi, productLo;
    wideMultiply(aSignificand, bSignificand << exponentBits,
                 &productHi, &productLo);

    int productExponent = aExponent + bExponent - exponentBias + scale;

    // Normalize the significand, adjust exponent if needed.
    if (productHi & implicitBit) productExponent++;
    else wideLeftShift(&productHi, &productLo, 1);

    // If we have overflowed the type, return +/- infinity.
    if (productExponent >= maxExponent) return fromRep(infRep | productSign);

    if (productExponent <= 0) {
        // Result is denormal before rounding, the exponent is zero and we
        // need to shift the significand.
        wideRightShiftWithSticky(&productHi, &productLo, 1U - (unsigned)productExponent);
    }

    else {
        // Result is normal before rounding; insert the exponent.
        productHi &= significandMask;
        productHi |= (rep_t)productExponent << significandBits;
    }

    // Insert the sign of the result:
    productHi |= productSign;

    // Final rounding.  The final result may overflow to infinity, or underflow
    // to zero, but those are the correct results in those cases.
    if (productLo > signBit) productHi++;
    if (productLo == signBit) productHi += productHi & 1;
    return fromRep(productHi);
}