/*----------------------------------------------------------------------------
| Tests the two operands addressed by `aWPtr' and `bWPtr' with
| `softfloat_isNaNF128M'.  When either test succeeds, the operands are handed
| to `softfloat_propagateNaNF128M' with `zWPtr' as the destination and true is
| returned.  When neither succeeds, this function itself writes nothing
| through `zWPtr' and returns false.
*----------------------------------------------------------------------------*/
bool
 softfloat_tryPropagateNaNF128M(
     const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr )
{

    /* Guard clause: `b' is examined only when `a' did not test as a NaN. */
    if ( ! softfloat_isNaNF128M( aWPtr ) && ! softfloat_isNaNF128M( bWPtr ) ) {
        return false;
    }
    softfloat_propagateNaNF128M( aWPtr, bWPtr, zWPtr );
    return true;

}
/*----------------------------------------------------------------------------
| Rounds the 128-bit floating-point value at `aPtr' to an integral value
| according to `roundingMode' and stores the result, in the same format, at
| `zPtr'.  Both objects are accessed as arrays of four 32-bit words through
| the `indexWord' family of macros.  When `exact' is true and the stored
| result differs from the input, `softfloat_flag_inexact' is ORed into
| `softfloat_exceptionFlags'.  A NaN input (exponent field 0x7FFF with any
| fraction bit set) is forwarded to `softfloat_propagateNaNF128M'.
|
| NOTE(review): the routine zeroes words of `z' before it has finished reading
| `a', and detects inexactness by comparing `a' with `z' at the end, so it
| appears to assume that `zPtr' does not alias `aPtr' -- confirm with callers.
*----------------------------------------------------------------------------*/
void
 f128M_roundToInt(
     const float128_t *aPtr,
     uint_fast8_t roundingMode,
     bool exact,
     float128_t *zPtr
 )
{
    const uint32_t *srcW;
    uint32_t *dstW;
    uint32_t hiWord;
    int32_t biasedExp;
    uint32_t lowBits;
    bool isNeg, toUnitMag;
    uint_fast8_t roundBitPos;
    bool nearest;
    unsigned int wIdx, topIdx;
    bool discardedNonzero;
    uint32_t inWord, roundBit, outWord;
    uint_fast8_t carryOut;
    uint32_t dropMask;

    /*------------------------------------------------------------------------
    | View both operands as 32-bit word arrays and pull the exponent field out
    | of the most-significant word.
    *------------------------------------------------------------------------*/
    srcW = (const uint32_t *) aPtr;
    dstW = (uint32_t *) zPtr;
    hiWord = srcW[indexWordHi( 4 )];
    biasedExp = expF128UI96( hiWord );
    /*------------------------------------------------------------------------
    | Exponent field below 0x3FFF: the three lower result words are always
    | zero, and the upper word becomes either the input's own upper word
    | (input is a zero), a signed zero, or a signed value with exponent field
    | 0x3FFF and zero fraction.
    *------------------------------------------------------------------------*/
    if ( biasedExp < 0x3FFF ) {
        dstW[indexWord( 4, 2 )] = 0;
        dstW[indexWord( 4, 1 )] = 0;
        dstW[indexWord( 4, 0 )] = 0;
        /* `lowBits' is nonzero iff any of the three lower input words is. */
        lowBits = srcW[indexWord( 4, 2 )];
        if ( ! lowBits ) {
            lowBits = srcW[indexWord( 4, 1 )] | srcW[indexWord( 4, 0 )];
        }
        if ( lowBits || (hiWord & 0x7FFFFFFF) ) {
            /* Nonzero input: the result necessarily differs from it. */
            if ( exact ) softfloat_exceptionFlags |= softfloat_flag_inexact;
            isNeg = signF128UI96( hiWord );
            toUnitMag = false;
            switch ( roundingMode ) {
             case softfloat_round_near_even:
                /* An input whose exponent field is 0x3FFE with all fraction
                   bits clear is the tie case and stays at zero here. */
                toUnitMag =
                    (biasedExp == 0x3FFE)
                        && (fracF128UI96( hiWord ) || lowBits);
                break;
             case softfloat_round_near_maxMag:
                toUnitMag = (biasedExp == 0x3FFE);
                break;
             case softfloat_round_min:
                toUnitMag = isNeg;
                break;
             case softfloat_round_max:
                toUnitMag = ! isNeg;
                break;
             default:
                /* Every other mode yields a signed zero. */
                break;
            }
            if ( toUnitMag ) {
                hiWord = packToF128UI96( isNeg, 0x3FFF, 0 );
            } else {
                hiWord = packToF128UI96( isNeg, 0, 0 );
            }
        }
        dstW[indexWordHi( 4 )] = hiWord;
        return;
    }
    /*------------------------------------------------------------------------
    | Exponent field of 0x406F or more: NaNs are propagated; every other
    | input is copied to the result unchanged.
    *------------------------------------------------------------------------*/
    if ( 0x406F <= biasedExp ) {
        if (
            (biasedExp == 0x7FFF)
                && (fracF128UI96( hiWord )
                        || (srcW[indexWord( 4, 2 )] | srcW[indexWord( 4, 1 )]
                                | srcW[indexWord( 4, 0 )]))
        ) {
            softfloat_propagateNaNF128M( srcW, 0, dstW );
            return;
        }
        dstW[indexWord( 4, 2 )] = srcW[indexWord( 4, 2 )];
        dstW[indexWord( 4, 1 )] = srcW[indexWord( 4, 1 )];
        dstW[indexWord( 4, 0 )] = srcW[indexWord( 4, 0 )];
        dstW[indexWordHi( 4 )] = hiWord;
        return;
    }
    /*------------------------------------------------------------------------
    | General case.  `roundBitPos' is the bit position, counted from the
    | least-significant end, at which the rounding increment is applied; for
    | the two round-to-nearest modes it is one position lower.
    *------------------------------------------------------------------------*/
    nearest =
           (roundingMode == softfloat_round_near_maxMag)
        || (roundingMode == softfloat_round_near_even);
    roundBitPos = 0x406F - biasedExp;
    roundBitPos -= nearest;
    wIdx = indexWordLo( 4 );
    topIdx = indexWordHi( 4 );
    discardedNonzero = false;
    /* Zero every result word lying wholly below the rounding position,
       remembering whether any nonzero input bits were dropped. */
    inWord = srcW[wIdx];
    while ( 32 <= roundBitPos ) {
        if ( inWord ) discardedNonzero = true;
        dstW[wIdx] = 0;
        wIdx += wordIncr;
        roundBitPos -= 32;
        inWord = srcW[wIdx];
    }
    roundBit = (uint32_t) 1<<roundBitPos;
    if ( nearest ) {
        /* Add the increment one position below the kept bits, then move
           `roundBit' up to the lowest kept bit (zero if that bit lies in the
           next word). */
        outWord = inWord + roundBit;
        carryOut = (outWord < inWord);
        roundBit <<= 1;
        dropMask = roundBit - 1;
        if (
            (roundingMode == softfloat_round_near_even)
                && ! discardedNonzero && ! (outWord & dropMask)
        ) {
            /* Exact tie under near-even: clear the lowest kept bit. */
            if ( ! roundBit ) {
                /* The lowest kept bit is bit 0 of the next word. */
                dstW[wIdx] = outWord;
                wIdx += wordIncr;
                outWord = srcW[wIdx] + carryOut;
                carryOut &= ! outWord;
                dstW[wIdx] = outWord & ~1;
                goto propagateCarry;
            }
            outWord &= ~roundBit;
        }
    } else {
        dropMask = roundBit - 1;
        outWord = inWord;
        carryOut = 0;
        /* Increment the magnitude only for a directed mode pointing away
           from zero for this sign, and only if discarded bits are nonzero. */
        if (
            (roundingMode != softfloat_round_minMag)
                && (signF128UI96( hiWord )
                        ^ (roundingMode == softfloat_round_max))
                && (discardedNonzero || (inWord & dropMask))
        ) {
            outWord += roundBit;
            carryOut = (outWord < inWord);
        }
    }
    outWord &= ~dropMask;
    dstW[wIdx] = outWord;
 propagateCarry:
    /* Copy the remaining higher words, rippling the carry upward. */
    while ( wIdx != topIdx ) {
        wIdx += wordIncr;
        outWord = srcW[wIdx] + carryOut;
        dstW[wIdx] = outWord;
        carryOut &= ! outWord;
    }
    /*------------------------------------------------------------------------
    | Flag inexactness when requested and the result is not equal to the input.
    *------------------------------------------------------------------------*/
    if ( exact ) {
        if ( softfloat_compare128M( srcW, dstW ) != 0 ) {
            softfloat_exceptionFlags |= softfloat_flag_inexact;
        }
    }

}
void softfloat_mulAddF128M( const uint32_t *aWPtr, const uint32_t *bWPtr, const uint32_t *cWPtr, uint32_t *zWPtr, uint_fast8_t op ) { uint32_t uiA96; int32_t expA; uint32_t uiB96; int32_t expB; uint32_t uiC96; bool signC; int32_t expC; bool signProd, prodIsInfinite; uint32_t *ptr, uiZ96, sigA[4]; uint_fast8_t shiftCount; uint32_t sigX[5]; int32_t expProd; uint32_t sigProd[8], wordSig; bool doSub; uint_fast8_t (*addCarryMRoutinePtr)( uint_fast8_t, const uint32_t *, const uint32_t *, uint_fast8_t, uint32_t * ); int32_t expDiff; bool signZ; int32_t expZ; uint32_t *extSigPtr; uint_fast8_t carry; void (*roundPackRoutinePtr)( bool, int32_t, uint32_t *, uint32_t * ); /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ uiA96 = aWPtr[indexWordHi( 4 )]; expA = expF128UI96( uiA96 ); uiB96 = bWPtr[indexWordHi( 4 )]; expB = expF128UI96( uiB96 ); uiC96 = cWPtr[indexWordHi( 4 )]; signC = signF128UI96( uiC96 ) ^ (op == softfloat_mulAdd_subC); expC = expF128UI96( uiC96 ); signProd = signF128UI96( uiA96 ) ^ signF128UI96( uiB96 ) ^ (op == softfloat_mulAdd_subProd); /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ prodIsInfinite = false; if ( (expA == 0x7FFF) || (expB == 0x7FFF) ) { if ( softfloat_tryPropagateNaNF128M( aWPtr, bWPtr, zWPtr ) ) { goto propagateNaN_ZC; } ptr = (uint32_t *) aWPtr; if ( ! (uint32_t) (uiA96<<1) ) goto possibleInvalidProd; if ( ! (uint32_t) (uiB96<<1) ) { ptr = (uint32_t *) bWPtr; possibleInvalidProd: if ( ! 
(ptr[indexWord( 4, 2 )] | ptr[indexWord( 4, 1 )] | ptr[indexWord( 4, 0 )]) ) { goto invalid; } } prodIsInfinite = true; } if ( expC == 0x7FFF ) { if ( fracF128UI96( uiC96 ) || (cWPtr[indexWord( 4, 2 )] | cWPtr[indexWord( 4, 1 )] | cWPtr[indexWord( 4, 0 )]) ) { zWPtr[indexWordHi( 4 )] = 0; goto propagateNaN_ZC; } if ( prodIsInfinite && (signProd != signC) ) goto invalid; goto copyC; } if ( prodIsInfinite ) { uiZ96 = packToF128UI96( signProd, 0x7FFF, 0 ); goto uiZ; } /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ if ( expA ) { sigA[indexWordHi( 4 )] = fracF128UI96( uiA96 ) | 0x00010000; sigA[indexWord( 4, 2 )] = aWPtr[indexWord( 4, 2 )]; sigA[indexWord( 4, 1 )] = aWPtr[indexWord( 4, 1 )]; sigA[indexWord( 4, 0 )] = aWPtr[indexWord( 4, 0 )]; } else { expA = softfloat_shiftNormSigF128M( aWPtr, 0, sigA ); if ( expA == -128 ) goto zeroProd; } if ( expB ) { sigX[indexWordHi( 4 )] = fracF128UI96( uiB96 ) | 0x00010000; sigX[indexWord( 4, 2 )] = bWPtr[indexWord( 4, 2 )]; sigX[indexWord( 4, 1 )] = bWPtr[indexWord( 4, 1 )]; sigX[indexWord( 4, 0 )] = bWPtr[indexWord( 4, 0 )]; } else { expB = softfloat_shiftNormSigF128M( bWPtr, 0, sigX ); if ( expB == -128 ) goto zeroProd; } /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ expProd = expA + expB - 0x3FF0; softfloat_mul128MTo256M( sigA, sigX, sigProd ); /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ wordSig = fracF128UI96( uiC96 ); if ( expC ) { --expC; wordSig |= 0x00010000; } sigX[indexWordHi( 5 )] = wordSig; sigX[indexWord( 5, 3 )] = cWPtr[indexWord( 4, 2 )]; sigX[indexWord( 5, 2 )] = cWPtr[indexWord( 4, 1 )]; sigX[indexWord( 5, 1 )] = cWPtr[indexWord( 4, 0 )]; 
/*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ doSub = (signProd != signC); addCarryMRoutinePtr = doSub ? softfloat_addComplCarryM : softfloat_addCarryM; expDiff = expProd - expC; if ( expDiff <= 0 ) { /*-------------------------------------------------------------------- *--------------------------------------------------------------------*/ signZ = signC; expZ = expC; if ( sigProd[indexWord( 8, 2 )] || (sigProd[indexWord( 8, 1 )] | sigProd[indexWord( 8, 0 )]) ) { sigProd[indexWord( 8, 3 )] |= 1; } extSigPtr = &sigProd[indexMultiwordHi( 8, 5 )]; if ( expDiff ) { softfloat_shiftRightJam160M( extSigPtr, -expDiff, extSigPtr ); } carry = 0; if ( doSub ) { wordSig = extSigPtr[indexWordLo( 5 )]; extSigPtr[indexWordLo( 5 )] = -wordSig; carry = ! wordSig; } (*addCarryMRoutinePtr)( 4, &sigX[indexMultiwordHi( 5, 4 )], extSigPtr + indexMultiwordHi( 5, 4 ), carry, extSigPtr + indexMultiwordHi( 5, 4 ) ); wordSig = extSigPtr[indexWordHi( 5 )]; if ( ! expZ ) { if ( wordSig & 0x80000000 ) { signZ = ! signZ; softfloat_negX160M( extSigPtr ); wordSig = extSigPtr[indexWordHi( 5 )]; } goto checkCancellation; } if ( wordSig < 0x00010000 ) { --expZ; softfloat_add160M( extSigPtr, extSigPtr, extSigPtr ); goto roundPack; } goto extSigReady_noCancellation; } else { /*-------------------------------------------------------------------- *--------------------------------------------------------------------*/ signZ = signProd; expZ = expProd; sigX[indexWordLo( 5 )] = 0; expDiff -= 128; if ( 0 <= expDiff ) { /*---------------------------------------------------------------- *----------------------------------------------------------------*/ if ( expDiff ) softfloat_shiftRightJam160M( sigX, expDiff, sigX ); wordSig = sigX[indexWordLo( 5 )]; carry = 0; if ( doSub ) { carry = ! 
wordSig; wordSig = -wordSig; } carry = (*addCarryMRoutinePtr)( 4, &sigProd[indexMultiwordLo( 8, 4 )], &sigX[indexMultiwordHi( 5, 4 )], carry, &sigProd[indexMultiwordLo( 8, 4 )] ); sigProd[indexWord( 8, 2 )] |= wordSig; ptr = &sigProd[indexWord( 8, 4 )]; } else { /*---------------------------------------------------------------- *----------------------------------------------------------------*/ shiftCount = expDiff & 31; if ( shiftCount ) { softfloat_shortShiftRight160M( sigX, shiftCount, sigX ); } expDiff >>= 5; extSigPtr = &sigProd[indexMultiwordLo( 8, 5 )] - wordIncr + expDiff * -wordIncr; carry = (*addCarryMRoutinePtr)( 5, extSigPtr, sigX, doSub, extSigPtr ); if ( expDiff == -4 ) { /*------------------------------------------------------------ *------------------------------------------------------------*/ wordSig = sigProd[indexWordHi( 8 )]; if ( wordSig & 0x80000000 ) { signZ = ! signZ; softfloat_negX256M( sigProd ); wordSig = sigProd[indexWordHi( 8 )]; } /*------------------------------------------------------------ *------------------------------------------------------------*/ if ( wordSig ) goto expProdBigger_noWordShift; wordSig = sigProd[indexWord( 8, 6 )]; if ( 0x00040000 <= wordSig ) goto expProdBigger_noWordShift; expZ -= 32; extSigPtr = &sigProd[indexMultiwordHi( 8, 5 )] - wordIncr; for (;;) { if ( wordSig ) break; wordSig = extSigPtr[indexWord( 5, 3 )]; if ( 0x00040000 <= wordSig ) break; expZ -= 32; extSigPtr -= wordIncr; if ( extSigPtr == &sigProd[indexMultiwordLo( 8, 5 )] ) { goto checkCancellation; } } /*------------------------------------------------------------ *------------------------------------------------------------*/ ptr = extSigPtr + indexWordLo( 5 ); do { ptr -= wordIncr; if ( *ptr ) { extSigPtr[indexWordLo( 5 )] |= 1; break; } } while ( ptr != &sigProd[indexWordLo( 8 )] ); wordSig = extSigPtr[indexWordHi( 5 )]; goto extSigReady; } ptr = extSigPtr + indexWordHi( 5 ) + wordIncr; } 
/*-------------------------------------------------------------------- *--------------------------------------------------------------------*/ if ( carry != doSub ) { if ( doSub ) { do { wordSig = *ptr; *ptr = wordSig - 1; ptr += wordIncr; } while ( ! wordSig ); } else { do { wordSig = *ptr + 1; *ptr = wordSig; ptr += wordIncr; } while ( ! wordSig ); } } /*-------------------------------------------------------------------- *--------------------------------------------------------------------*/ expProdBigger_noWordShift: if ( sigProd[indexWord( 8, 2 )] || (sigProd[indexWord( 8, 1 )] | sigProd[indexWord( 8, 0 )]) ) { sigProd[indexWord( 8, 3 )] |= 1; } extSigPtr = &sigProd[indexMultiwordHi( 8, 5 )]; wordSig = extSigPtr[indexWordHi( 5 )]; } extSigReady: roundPackRoutinePtr = softfloat_normRoundPackMToF128M; if ( wordSig < 0x00010000 ) goto doRoundPack; extSigReady_noCancellation: if ( 0x00020000 <= wordSig ) { ++expZ; softfloat_shortShiftRightJam160M( extSigPtr, 1, extSigPtr ); } roundPack: roundPackRoutinePtr = softfloat_roundPackMToF128M; doRoundPack: (*roundPackRoutinePtr)( signZ, expZ, extSigPtr, zWPtr ); return; /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ invalid: softfloat_invalidF128M( zWPtr ); propagateNaN_ZC: softfloat_propagateNaNF128M( zWPtr, cWPtr, zWPtr ); return; /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ zeroProd: if ( ! (uint32_t) (uiC96<<1) && (signProd != signC) && ! cWPtr[indexWord( 4, 2 )] && ! 
(cWPtr[indexWord( 4, 1 )] | cWPtr[indexWord( 4, 0 )]) ) { goto completeCancellation; } copyC: zWPtr[indexWordHi( 4 )] = uiC96; zWPtr[indexWord( 4, 2 )] = cWPtr[indexWord( 4, 2 )]; zWPtr[indexWord( 4, 1 )] = cWPtr[indexWord( 4, 1 )]; zWPtr[indexWord( 4, 0 )] = cWPtr[indexWord( 4, 0 )]; return; /*------------------------------------------------------------------------ *------------------------------------------------------------------------*/ checkCancellation: if ( wordSig || (extSigPtr[indexWord( 5, 3 )] | extSigPtr[indexWord( 5, 2 )]) || (extSigPtr[indexWord( 5, 1 )] | extSigPtr[indexWord( 5, 0 )]) ) { goto extSigReady; } completeCancellation: uiZ96 = packToF128UI96( (softfloat_roundingMode == softfloat_round_min), 0, 0 ); uiZ: zWPtr[indexWordHi( 4 )] = uiZ96; zWPtr[indexWord( 4, 2 )] = 0; zWPtr[indexWord( 4, 1 )] = 0; zWPtr[indexWord( 4, 0 )] = 0; }