| //===-- addsf3.S - Adds two single precision floating pointer numbers-----===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file implements the __addsf3 (single precision floating pointer number |
| // addition with the IEEE-754 default rounding (to nearest, ties to even) |
| // function for the ARM Thumb1 ISA. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "../assembly.h" |
| #define significandBits 23 |
| #define typeWidth 32 |
| |
| .syntax unified |
| .text |
| .thumb |
| .p2align 2 |
| |
| DEFINE_AEABI_FUNCTION_ALIAS(__aeabi_fadd, __addsf3) |
| |
| DEFINE_COMPILERRT_THUMB_FUNCTION(__addsf3) |
| push {r4, r5, r6, r7, lr} |
| // Get the absolute value of a and b. |
| lsls r2, r0, #1 |
| lsls r3, r1, #1 |
| lsrs r2, r2, #1 // aAbs |
| beq LOCAL_LABEL(a_zero_nan_inf) |
| lsrs r3, r3, #1 // bAbs |
| beq LOCAL_LABEL(zero_nan_inf) |
| |
| // Detect if a or b is infinity or Nan. |
| lsrs r6, r2, #(significandBits) |
| lsrs r7, r3, #(significandBits) |
| cmp r6, #0xFF |
| beq LOCAL_LABEL(zero_nan_inf) |
| cmp r7, #0xFF |
| beq LOCAL_LABEL(zero_nan_inf) |
| |
| // Swap Rep and Abs so that a and aAbs has the larger absolute value. |
| cmp r2, r3 |
| bhs LOCAL_LABEL(no_swap) |
| movs r4, r0 |
| movs r5, r2 |
| movs r0, r1 |
| movs r2, r3 |
| movs r1, r4 |
| movs r3, r5 |
| LOCAL_LABEL(no_swap): |
| |
| // Get the significands and shift them to give us round, guard and sticky. |
| lsls r4, r0, #(typeWidth - significandBits) |
| lsrs r4, r4, #(typeWidth - significandBits - 3) // aSignificand << 3 |
| lsls r5, r1, #(typeWidth - significandBits) |
| lsrs r5, r5, #(typeWidth - significandBits - 3) // bSignificand << 3 |
| |
| // Get the implicitBit. |
| movs r6, #1 |
| lsls r6, r6, #(significandBits + 3) |
| |
| // Get aExponent and set implicit bit if necessary. |
| lsrs r2, r2, #(significandBits) |
| beq LOCAL_LABEL(a_done_implicit_bit) |
| orrs r4, r6 |
| LOCAL_LABEL(a_done_implicit_bit): |
| |
| // Get bExponent and set implicit bit if necessary. |
| lsrs r3, r3, #(significandBits) |
| beq LOCAL_LABEL(b_done_implicit_bit) |
| orrs r5, r6 |
| LOCAL_LABEL(b_done_implicit_bit): |
| |
| // Get the difference in exponents. |
| subs r6, r2, r3 |
| beq LOCAL_LABEL(done_align) |
| |
| // If b is denormal, then a must be normal as align > 0, and we only need to |
| // right shift bSignificand by (align - 1) bits. |
| cmp r3, #0 |
| bne 1f |
| subs r6, r6, #1 |
| 1: |
| |
| // No longer needs bExponent. r3 is dead here. |
| // Set sticky bits of b: sticky = bSignificand << (typeWidth - align). |
| movs r3, #(typeWidth) |
| subs r3, r3, r6 |
| movs r7, r5 |
| lsls r7, r3 |
| beq 1f |
| movs r7, #1 |
| 1: |
| |
| // bSignificand = bSignificand >> align | sticky; |
| lsrs r5, r6 |
| orrs r5, r7 |
| bne LOCAL_LABEL(done_align) |
| movs r5, #1 // sticky; b is known to be non-zero. |
| |
| LOCAL_LABEL(done_align): |
| // isSubtraction = (aRep ^ bRep) >> 31; |
| movs r7, r0 |
| eors r7, r1 |
| lsrs r7, #31 |
| bne LOCAL_LABEL(do_substraction) |
| |
| // Same sign, do Addition. |
| |
| // aSignificand += bSignificand; |
| adds r4, r4, r5 |
| |
| // Check carry bit. |
| movs r6, #1 |
| lsls r6, r6, #(significandBits + 3 + 1) |
| movs r7, r4 |
| ands r7, r6 |
| beq LOCAL_LABEL(form_result) |
| // If the addition carried up, we need to right-shift the result and |
| // adjust the exponent. |
| movs r7, r4 |
| movs r6, #1 |
| ands r7, r6 // sticky = aSignificand & 1; |
| lsrs r4, #1 |
| orrs r4, r7 // result Significand |
| adds r2, #1 // result Exponent |
| // If we have overflowed the type, return +/- infinity. |
| cmp r2, 0xFF |
| beq LOCAL_LABEL(ret_inf) |
| |
| LOCAL_LABEL(form_result): |
| // Shift the sign, exponent and significand into place. |
| lsrs r0, #(typeWidth - 1) |
| lsls r0, #(typeWidth - 1) // Get Sign. |
| lsls r2, #(significandBits) |
| orrs r0, r2 |
| movs r1, r4 |
| lsls r4, #(typeWidth - significandBits - 3) |
| lsrs r4, #(typeWidth - significandBits) |
| orrs r0, r4 |
| |
| // Final rounding. The result may overflow to infinity, but that is the |
| // correct result in that case. |
| // roundGuardSticky = aSignificand & 0x7; |
| movs r2, #0x7 |
| ands r1, r2 |
| // if (roundGuardSticky > 0x4) result++; |
| |
| cmp r1, #0x4 |
| blt LOCAL_LABEL(done_round) |
| beq 1f |
| adds r0, #1 |
| pop {r4, r5, r6, r7, pc} |
| 1: |
| |
| // if (roundGuardSticky == 0x4) result += result & 1; |
| movs r1, r0 |
| lsrs r1, #1 |
| bcc LOCAL_LABEL(done_round) |
| adds r0, r0, #1 |
| LOCAL_LABEL(done_round): |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(do_substraction): |
| subs r4, r4, r5 // aSignificand -= bSignificand; |
| beq LOCAL_LABEL(ret_zero) |
| movs r6, r4 |
| cmp r2, 0 |
| beq LOCAL_LABEL(form_result) // if a's exp is 0, no need to normalize. |
| // If partial cancellation occured, we need to left-shift the result |
| // and adjust the exponent: |
| lsrs r6, r6, #(significandBits + 3) |
| bne LOCAL_LABEL(form_result) |
| |
| push {r0, r1, r2, r3} |
| movs r0, r4 |
| bl SYMBOL_NAME(__clzsi2) |
| movs r5, r0 |
| pop {r0, r1, r2, r3} |
| // shift = rep_clz(aSignificand) - rep_clz(implicitBit << 3); |
| subs r5, r5, #(typeWidth - significandBits - 3 - 1) |
| // aSignificand <<= shift; aExponent -= shift; |
| lsls r4, r5 |
| subs r2, r2, r5 |
| bgt LOCAL_LABEL(form_result) |
| |
| // Do normalization if aExponent <= 0. |
| movs r6, #1 |
| subs r6, r6, r2 // 1 - aExponent; |
| movs r2, #0 // aExponent = 0; |
| movs r3, #(typeWidth) // bExponent is dead. |
| subs r3, r3, r6 |
| movs r7, r4 |
| lsls r7, r3 // stickyBit = (bool)(aSignificant << (typeWidth - align)) |
| beq 1f |
| movs r7, #1 |
| 1: |
| lsrs r4, r6 // aSignificand >> shift |
| orrs r4, r7 |
| b LOCAL_LABEL(form_result) |
| |
| LOCAL_LABEL(ret_zero): |
| movs r0, #0 |
| pop {r4, r5, r6, r7, pc} |
| |
| |
| LOCAL_LABEL(a_zero_nan_inf): |
| lsrs r3, r3, #1 |
| |
| LOCAL_LABEL(zero_nan_inf): |
| // Here r2 has aAbs, r3 has bAbs |
| movs r4, #0xFF |
| lsls r4, r4, #(significandBits) // Make +inf. |
| |
| cmp r2, r4 |
| bhi LOCAL_LABEL(a_is_nan) |
| cmp r3, r4 |
| bhi LOCAL_LABEL(b_is_nan) |
| |
| cmp r2, r4 |
| bne LOCAL_LABEL(a_is_rational) |
| // aAbs is INF. |
| eors r1, r0 // aRep ^ bRep. |
| movs r6, #1 |
| lsls r6, r6, #(typeWidth - 1) // get sign mask. |
| cmp r1, r6 // if they only differ on sign bit, it's -INF + INF |
| beq LOCAL_LABEL(a_is_nan) |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(a_is_rational): |
| cmp r3, r4 |
| bne LOCAL_LABEL(b_is_rational) |
| movs r0, r1 |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(b_is_rational): |
| // either a or b or both are zero. |
| adds r4, r2, r3 |
| beq LOCAL_LABEL(both_zero) |
| cmp r2, #0 // is absA 0 ? |
| beq LOCAL_LABEL(ret_b) |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(both_zero): |
| ands r0, r1 // +0 + -0 = +0 |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(ret_b): |
| movs r0, r1 |
| |
| LOCAL_LABEL(ret): |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(b_is_nan): |
| movs r0, r1 |
| LOCAL_LABEL(a_is_nan): |
| movs r1, #1 |
| lsls r1, r1, #(significandBits -1) // r1 is quiet bit. |
| orrs r0, r1 |
| pop {r4, r5, r6, r7, pc} |
| |
| LOCAL_LABEL(ret_inf): |
| movs r4, #0xFF |
| lsls r4, r4, #(significandBits) |
| orrs r0, r4 |
| lsrs r0, r0, #(significandBits) |
| lsls r0, r0, #(significandBits) |
| pop {r4, r5, r6, r7, pc} |
| |
| |
| END_COMPILERRT_FUNCTION(__addsf3) |
| |
| NO_EXEC_STACK_DIRECTIVE |