lib/builtins/fp_add_impl.inc

//===----- lib/fp_add_impl.inc - floating point addition ----------*- C -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is dual licensed under the MIT and the University of Illinois Open
// Source Licenses. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements soft-float addition with the IEEE-754 default rounding
// (to nearest, ties to even).
//
//===----------------------------------------------------------------------===//
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot#include "fp_lib.h"
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robotstatic __inline fp_t __addXf3__(fp_t a, fp_t b) {
*7c3d14c8STreehugger Robot    rep_t aRep = toRep(a);
*7c3d14c8STreehugger Robot    rep_t bRep = toRep(b);
*7c3d14c8STreehugger Robot    const rep_t aAbs = aRep & absMask;
*7c3d14c8STreehugger Robot    const rep_t bAbs = bRep & absMask;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Detect if a or b is zero, infinity, or NaN.
*7c3d14c8STreehugger Robot    if (aAbs - REP_C(1) >= infRep - REP_C(1) ||
*7c3d14c8STreehugger Robot        bAbs - REP_C(1) >= infRep - REP_C(1)) {
*7c3d14c8STreehugger Robot        // NaN + anything = qNaN
*7c3d14c8STreehugger Robot        if (aAbs > infRep) return fromRep(toRep(a) | quietBit);
*7c3d14c8STreehugger Robot        // anything + NaN = qNaN
*7c3d14c8STreehugger Robot        if (bAbs > infRep) return fromRep(toRep(b) | quietBit);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        if (aAbs == infRep) {
*7c3d14c8STreehugger Robot            // +/-infinity + -/+infinity = qNaN
*7c3d14c8STreehugger Robot            if ((toRep(a) ^ toRep(b)) == signBit) return fromRep(qnanRep);
*7c3d14c8STreehugger Robot            // +/-infinity + anything remaining = +/- infinity
*7c3d14c8STreehugger Robot            else return a;
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // anything remaining + +/-infinity = +/-infinity
*7c3d14c8STreehugger Robot        if (bAbs == infRep) return b;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // zero + anything = anything
*7c3d14c8STreehugger Robot        if (!aAbs) {
*7c3d14c8STreehugger Robot            // but we need to get the sign right for zero + zero
*7c3d14c8STreehugger Robot            if (!bAbs) return fromRep(toRep(a) & toRep(b));
*7c3d14c8STreehugger Robot            else return b;
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // anything + zero = anything
*7c3d14c8STreehugger Robot        if (!bAbs) return a;
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Swap a and b if necessary so that a has the larger absolute value.
*7c3d14c8STreehugger Robot    if (bAbs > aAbs) {
*7c3d14c8STreehugger Robot        const rep_t temp = aRep;
*7c3d14c8STreehugger Robot        aRep = bRep;
*7c3d14c8STreehugger Robot        bRep = temp;
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Extract the exponent and significand from the (possibly swapped) a and b.
*7c3d14c8STreehugger Robot    int aExponent = aRep >> significandBits & maxExponent;
*7c3d14c8STreehugger Robot    int bExponent = bRep >> significandBits & maxExponent;
*7c3d14c8STreehugger Robot    rep_t aSignificand = aRep & significandMask;
*7c3d14c8STreehugger Robot    rep_t bSignificand = bRep & significandMask;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Normalize any denormals, and adjust the exponent accordingly.
*7c3d14c8STreehugger Robot    if (aExponent == 0) aExponent = normalize(&aSignificand);
*7c3d14c8STreehugger Robot    if (bExponent == 0) bExponent = normalize(&bSignificand);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // The sign of the result is the sign of the larger operand, a.  If they
*7c3d14c8STreehugger Robot    // have opposite signs, we are performing a subtraction; otherwise addition.
*7c3d14c8STreehugger Robot    const rep_t resultSign = aRep & signBit;
*7c3d14c8STreehugger Robot    const bool subtraction = (aRep ^ bRep) & signBit;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Shift the significands to give us round, guard and sticky, and or in the
*7c3d14c8STreehugger Robot    // implicit significand bit.  (If we fell through from the denormal path it
*7c3d14c8STreehugger Robot    // was already set by normalize( ), but setting it twice won't hurt
*7c3d14c8STreehugger Robot    // anything.)
*7c3d14c8STreehugger Robot    aSignificand = (aSignificand | implicitBit) << 3;
*7c3d14c8STreehugger Robot    bSignificand = (bSignificand | implicitBit) << 3;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Shift the significand of b by the difference in exponents, with a sticky
*7c3d14c8STreehugger Robot    // bottom bit to get rounding correct.
*7c3d14c8STreehugger Robot    const unsigned int align = aExponent - bExponent;
*7c3d14c8STreehugger Robot    if (align) {
*7c3d14c8STreehugger Robot        if (align < typeWidth) {
*7c3d14c8STreehugger Robot            const bool sticky = bSignificand << (typeWidth - align);
*7c3d14c8STreehugger Robot            bSignificand = bSignificand >> align | sticky;
*7c3d14c8STreehugger Robot        } else {
*7c3d14c8STreehugger Robot            bSignificand = 1; // sticky; b is known to be non-zero.
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot    if (subtraction) {
*7c3d14c8STreehugger Robot        aSignificand -= bSignificand;
*7c3d14c8STreehugger Robot        // If a == -b, return +zero.
*7c3d14c8STreehugger Robot        if (aSignificand == 0) return fromRep(0);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // If partial cancellation occured, we need to left-shift the result
*7c3d14c8STreehugger Robot        // and adjust the exponent:
*7c3d14c8STreehugger Robot        if (aSignificand < implicitBit << 3) {
*7c3d14c8STreehugger Robot            const int shift = rep_clz(aSignificand) - rep_clz(implicitBit << 3);
*7c3d14c8STreehugger Robot            aSignificand <<= shift;
*7c3d14c8STreehugger Robot            aExponent -= shift;
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot    else /* addition */ {
*7c3d14c8STreehugger Robot        aSignificand += bSignificand;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot        // If the addition carried up, we need to right-shift the result and
*7c3d14c8STreehugger Robot        // adjust the exponent:
*7c3d14c8STreehugger Robot        if (aSignificand & implicitBit << 4) {
*7c3d14c8STreehugger Robot            const bool sticky = aSignificand & 1;
*7c3d14c8STreehugger Robot            aSignificand = aSignificand >> 1 | sticky;
*7c3d14c8STreehugger Robot            aExponent += 1;
*7c3d14c8STreehugger Robot        }
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // If we have overflowed the type, return +/- infinity:
*7c3d14c8STreehugger Robot    if (aExponent >= maxExponent) return fromRep(infRep | resultSign);
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    if (aExponent <= 0) {
*7c3d14c8STreehugger Robot        // Result is denormal before rounding; the exponent is zero and we
*7c3d14c8STreehugger Robot        // need to shift the significand.
*7c3d14c8STreehugger Robot        const int shift = 1 - aExponent;
*7c3d14c8STreehugger Robot        const bool sticky = aSignificand << (typeWidth - shift);
*7c3d14c8STreehugger Robot        aSignificand = aSignificand >> shift | sticky;
*7c3d14c8STreehugger Robot        aExponent = 0;
*7c3d14c8STreehugger Robot    }
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Low three bits are round, guard, and sticky.
*7c3d14c8STreehugger Robot    const int roundGuardSticky = aSignificand & 0x7;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Shift the significand into place, and mask off the implicit bit.
*7c3d14c8STreehugger Robot    rep_t result = aSignificand >> 3 & significandMask;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Insert the exponent and sign.
*7c3d14c8STreehugger Robot    result |= (rep_t)aExponent << significandBits;
*7c3d14c8STreehugger Robot    result |= resultSign;
*7c3d14c8STreehugger Robot
*7c3d14c8STreehugger Robot    // Final rounding.  The result may overflow to infinity, but that is the
*7c3d14c8STreehugger Robot    // correct result in that case.
*7c3d14c8STreehugger Robot    if (roundGuardSticky > 0x4) result++;
*7c3d14c8STreehugger Robot    if (roundGuardSticky == 0x4) result += result & 1;
*7c3d14c8STreehugger Robot    return fromRep(result);
*7c3d14c8STreehugger Robot}