Upgrade to softfloat3e.
This should solve licensing problems as well.
This commit is contained in:
332
src/cpu/softfloat3e/f128_mulAdd.cc
Normal file
332
src/cpu/softfloat3e/f128_mulAdd.cc
Normal file
@@ -0,0 +1,332 @@
|
||||
/*============================================================================

This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic
Package, Release 3e, by John R. Hauser.

Copyright 2011, 2012, 2013, 2014 The Regents of the University of California.
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

 1. Redistributions of source code must retain the above copyright notice,
    this list of conditions, and the following disclaimer.

 2. Redistributions in binary form must reproduce the above copyright notice,
    this list of conditions, and the following disclaimer in the documentation
    and/or other materials provided with the distribution.

 3. Neither the name of the University nor the names of its contributors may
    be used to endorse or promote products derived from this software without
    specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY
EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE
DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

=============================================================================*/
|
||||
|
||||
#include <stdint.h>
|
||||
#include "internals.h"
|
||||
#include "primitives.h"
|
||||
#include "primitiveTypes.h"
|
||||
#include "softfloat.h"
|
||||
#include "specialize.h"
|
||||
|
||||
/*----------------------------------------------------------------------------
| Fused multiply-add on 128-bit floating-point values.
|
| The product a*b is formed as a 256-bit significand (sig256Z) and combined
| with 'c' before the single final rounding done by softfloat_roundPackToF128.
|
| 'op' is a bit mask:
|   softfloat_mulAdd_subC    - flips the sign applied to 'c';
|   softfloat_mulAdd_subProd - flips the sign applied to the product.
|
| Exception flags (denormal, invalid, and whatever the rounding/NaN helpers
| raise) are reported through 'status'.
*----------------------------------------------------------------------------*/
float128_t f128_mulAdd(float128_t a, float128_t b, float128_t c, uint8_t op, struct softfloat_status_t *status)
{
    bool signA;
    int32_t expA;
    struct uint128 sigA;
    bool signB;
    int32_t expB;
    struct uint128 sigB;
    bool signC;
    int32_t expC;
    struct uint128 sigC;
    bool signZ;
    uint64_t magBits;
    struct uint128 uiZ;
    struct exp32_sig128 normExpSig;
    int32_t expZ;
    uint64_t sig256Z[4];
    struct uint128 sigZ;
    int32_t shiftDist, expDiff;
    struct uint128 x128;
    uint64_t sig256C[4];
    static uint64_t zero256[4] = INIT_UINTM4(0, 0, 0, 0);
    uint64_t sigZExtra, sig256Z0;
    uint64_t uiA64, uiA0;
    uint64_t uiB64, uiB0;
    uint64_t uiC64, uiC0;

    /*------------------------------------------------------------------------
    | Raw 64-bit halves of the three operands.
    *------------------------------------------------------------------------*/
    uiA64 = a.v64;
    uiA0  = a.v0;
    uiB64 = b.v64;
    uiB0  = b.v0;
    uiC64 = c.v64;
    uiC0  = c.v0;
    /*------------------------------------------------------------------------
    | Split each operand into sign, exponent and fraction.  The requested
    | negations from 'op' are folded into signC and signZ here, so every later
    | use of those two variables already reflects them.
    *------------------------------------------------------------------------*/
    signA = signF128UI64(uiA64);
    expA  = expF128UI64(uiA64);
    sigA.v64 = fracF128UI64(uiA64);
    sigA.v0  = uiA0;
    signB = signF128UI64(uiB64);
    expB  = expF128UI64(uiB64);
    sigB.v64 = fracF128UI64(uiB64);
    sigB.v0  = uiB0;
    signC = signF128UI64(uiC64) ^ ((op & softfloat_mulAdd_subC) != 0);
    expC  = expF128UI64(uiC64);
    sigC.v64 = fracF128UI64(uiC64);
    sigC.v0  = uiC0;
    signZ = signA ^ signB ^ ((op & softfloat_mulAdd_subProd) != 0);
    /*------------------------------------------------------------------------
    | Operands with the maximum exponent (0x7FFF): NaN when the fraction is
    | nonzero, infinity otherwise.
    *------------------------------------------------------------------------*/
    if (expA == 0x7FFF) {
        if ((sigA.v64 | sigA.v0) || ((expB == 0x7FFF) && (sigB.v64 | sigB.v0))) {
            goto propagateNaN_ABC;
        }
        /* magBits is zero exactly when the other factor is zero. */
        magBits = expB | sigB.v64 | sigB.v0;
        goto infProdArg;
    }
    if (expB == 0x7FFF) {
        if (sigB.v64 | sigB.v0) goto propagateNaN_ABC;
        magBits = expA | sigA.v64 | sigA.v0;
        goto infProdArg;
    }
    if (expC == 0x7FFF) {
        if (sigC.v64 | sigC.v0) {
            uiZ.v64 = 0;
            uiZ.v0  = 0;
            goto propagateNaN_ZC;
        }
        /* c is infinite and the product is finite: the result is the
           (possibly negated) addend.  Pack with signC rather than copying
           uiC64 so that softfloat_mulAdd_subC is honoured. */
        uiZ.v64 = packToF128UI64(signC, 0x7FFF, 0);
        uiZ.v0  = uiC0;
        return uiZ;
    }
    /*------------------------------------------------------------------------
    | Zero factors short-circuit to zeroProd; subnormal factors raise the
    | denormal flag and are normalized.
    *------------------------------------------------------------------------*/
    if (! expA) {
        if (! (sigA.v64 | sigA.v0)) goto zeroProd;
        softfloat_raiseFlags(status, softfloat_flag_denormal);
        normExpSig = softfloat_normSubnormalF128Sig(sigA.v64, sigA.v0);
        expA = normExpSig.exp;
        sigA = normExpSig.sig;
    }
    if (! expB) {
        if (! (sigB.v64 | sigB.v0)) goto zeroProd;
        softfloat_raiseFlags(status, softfloat_flag_denormal);
        normExpSig = softfloat_normSubnormalF128Sig(sigB.v64, sigB.v0);
        expB = normExpSig.exp;
        sigB = normExpSig.sig;
    }
    /*------------------------------------------------------------------------
    | Form the 256-bit product of the two significands (hidden bit inserted).
    | sigZ mirrors the upper 128 bits of sig256Z.
    *------------------------------------------------------------------------*/
    expZ = expA + expB - 0x3FFE;
    sigA.v64 |= UINT64_C(0x0001000000000000);
    sigB.v64 |= UINT64_C(0x0001000000000000);
    sigA = softfloat_shortShiftLeft128(sigA.v64, sigA.v0, 8);
    sigB = softfloat_shortShiftLeft128(sigB.v64, sigB.v0, 15);
    softfloat_mul128To256M(sigA.v64, sigA.v0, sigB.v64, sigB.v0, sig256Z);
    sigZ.v64 = sig256Z[indexWord(4, 3)];
    sigZ.v0  = sig256Z[indexWord(4, 2)];
    shiftDist = 0;
    if (! (sigZ.v64 & UINT64_C(0x0100000000000000))) {
        /* Product's leading bit is one position low: remember a pending
           one-bit left shift (shiftDist == -1). */
        --expZ;
        shiftDist = -1;
    }
    if (! expC) {
        if (! (sigC.v64 | sigC.v0)) {
            /* c is zero: round the product directly. */
            shiftDist += 8;
            goto sigZ;
        }
        softfloat_raiseFlags(status, softfloat_flag_denormal);
        normExpSig = softfloat_normSubnormalF128Sig(sigC.v64, sigC.v0);
        expC = normExpSig.exp;
        sigC = normExpSig.sig;
    }
    sigC.v64 |= UINT64_C(0x0001000000000000);
    sigC = softfloat_shortShiftLeft128(sigC.v64, sigC.v0, 8);
    /*------------------------------------------------------------------------
    | Align the product and the addend on the larger exponent.
    *------------------------------------------------------------------------*/
    expDiff = expZ - expC;
    if (expDiff < 0) {
        expZ = expC;
        if ((signZ == signC) || (expDiff < -1)) {
            shiftDist -= expDiff;
            if (shiftDist) {
                sigZ = softfloat_shiftRightJam128(sigZ.v64, sigZ.v0, shiftDist);
            }
        } else {
            if (! shiftDist) {
                /* Shift the full 256-bit product right by one bit. */
                x128 = softfloat_shortShiftRight128(sig256Z[indexWord(4, 1)], sig256Z[indexWord(4, 0)], 1);
                sig256Z[indexWord(4, 1)] = (sigZ.v0<<63) | x128.v64;
                sig256Z[indexWord(4, 0)] = x128.v0;
                sigZ = softfloat_shortShiftRight128(sigZ.v64, sigZ.v0, 1);
                sig256Z[indexWord(4, 3)] = sigZ.v64;
                sig256Z[indexWord(4, 2)] = sigZ.v0;
            }
        }
    } else {
        /* Apply the pending one-bit left shift by doubling the product. */
        if (shiftDist) softfloat_add256M(sig256Z, sig256Z, sig256Z);
        if (! expDiff) {
            sigZ.v64 = sig256Z[indexWord(4, 3)];
            sigZ.v0  = sig256Z[indexWord(4, 2)];
        } else {
            sig256C[indexWord(4, 3)] = sigC.v64;
            sig256C[indexWord(4, 2)] = sigC.v0;
            sig256C[indexWord(4, 1)] = 0;
            sig256C[indexWord(4, 0)] = 0;
            softfloat_shiftRightJam256M(sig256C, expDiff, sig256C);
        }
    }
    /*------------------------------------------------------------------------
    | Combine the aligned significands.
    *------------------------------------------------------------------------*/
    shiftDist = 8;
    if (signZ == signC) {
        /*--------------------------------------------------------------------
        | Same effective sign: magnitudes add.
        *--------------------------------------------------------------------*/
        if (expDiff <= 0) {
            sigZ = softfloat_add128(sigC.v64, sigC.v0, sigZ.v64, sigZ.v0);
        } else {
            softfloat_add256M(sig256Z, sig256C, sig256Z);
            sigZ.v64 = sig256Z[indexWord(4, 3)];
            sigZ.v0  = sig256Z[indexWord(4, 2)];
        }
        if (sigZ.v64 & UINT64_C(0x0200000000000000)) {
            /* Carry out of the sum: one extra bit to shift out. */
            ++expZ;
            shiftDist = 9;
        }
    } else {
        /*--------------------------------------------------------------------
        | Opposite effective signs: magnitudes subtract.
        *--------------------------------------------------------------------*/
        if (expDiff < 0) {
            signZ = signC;
            if (expDiff < -1) {
                sigZ = softfloat_sub128(sigC.v64, sigC.v0, sigZ.v64, sigZ.v0);
                sigZExtra = sig256Z[indexWord(4, 1)] | sig256Z[indexWord(4, 0)];
                if (sigZExtra) {
                    /* Borrow for the nonzero low half of the product. */
                    sigZ = softfloat_sub128(sigZ.v64, sigZ.v0, 0, 1);
                }
                if (! (sigZ.v64 & UINT64_C(0x0100000000000000))) {
                    --expZ;
                    shiftDist = 7;
                }
                goto shiftRightRoundPack;
            } else {
                sig256C[indexWord(4, 3)] = sigC.v64;
                sig256C[indexWord(4, 2)] = sigC.v0;
                sig256C[indexWord(4, 1)] = 0;
                sig256C[indexWord(4, 0)] = 0;
                softfloat_sub256M(sig256C, sig256Z, sig256Z);
            }
        } else if (! expDiff) {
            sigZ = softfloat_sub128(sigZ.v64, sigZ.v0, sigC.v64, sigC.v0);
            if (! (sigZ.v64 | sigZ.v0) && ! sig256Z[indexWord(4, 1)] && ! sig256Z[indexWord(4, 0)]) {
                goto completeCancellation;
            }
            sig256Z[indexWord(4, 3)] = sigZ.v64;
            sig256Z[indexWord(4, 2)] = sigZ.v0;
            if (sigZ.v64 & UINT64_C(0x8000000000000000)) {
                /* Difference went negative: flip the sign and negate. */
                signZ = ! signZ;
                softfloat_sub256M(zero256, sig256Z, sig256Z);
            }
        } else {
            softfloat_sub256M(sig256Z, sig256C, sig256Z);
            if (1 < expDiff) {
                sigZ.v64 = sig256Z[indexWord(4, 3)];
                sigZ.v0  = sig256Z[indexWord(4, 2)];
                if (! (sigZ.v64 & UINT64_C(0x0100000000000000))) {
                    --expZ;
                    shiftDist = 7;
                }
                goto sigZ;
            }
        }
        /*--------------------------------------------------------------------
        | Possible heavy cancellation: renormalize the 256-bit difference,
        | first by whole 64-bit words, then by the remaining bit count.
        *--------------------------------------------------------------------*/
        sigZ.v64  = sig256Z[indexWord(4, 3)];
        sigZ.v0   = sig256Z[indexWord(4, 2)];
        sigZExtra = sig256Z[indexWord(4, 1)];
        sig256Z0  = sig256Z[indexWord(4, 0)];
        if (sigZ.v64) {
            if (sig256Z0) sigZExtra |= 1;
        } else {
            expZ -= 64;
            sigZ.v64  = sigZ.v0;
            sigZ.v0   = sigZExtra;
            sigZExtra = sig256Z0;
            if (! sigZ.v64) {
                expZ -= 64;
                sigZ.v64  = sigZ.v0;
                sigZ.v0   = sigZExtra;
                sigZExtra = 0;
                if (! sigZ.v64) {
                    expZ -= 64;
                    sigZ.v64 = sigZ.v0;
                    sigZ.v0  = 0;
                }
            }
        }
        shiftDist = softfloat_countLeadingZeros64(sigZ.v64);
        expZ += 7 - shiftDist;
        shiftDist = 15 - shiftDist;
        if (0 < shiftDist) goto shiftRightRoundPack;
        if (shiftDist) {
            shiftDist = -shiftDist;
            sigZ = softfloat_shortShiftLeft128(sigZ.v64, sigZ.v0, shiftDist);
            x128 = softfloat_shortShiftLeft128(0, sigZExtra, shiftDist);
            sigZ.v0 |= x128.v64;
            sigZExtra = x128.v0;
        }
        goto roundPack;
    }
 sigZ:
    /* Collapse the low 128 bits of the product into a sticky indicator. */
    sigZExtra = sig256Z[indexWord(4, 1)] | sig256Z[indexWord(4, 0)];
 shiftRightRoundPack:
    sigZExtra = (uint64_t) (sigZ.v0<<(64 - shiftDist)) | (sigZExtra != 0);
    sigZ = softfloat_shortShiftRight128(sigZ.v64, sigZ.v0, shiftDist);
 roundPack:
    return softfloat_roundPackToF128(signZ, expZ - 1, sigZ.v64, sigZ.v0, sigZExtra, status);
    /*------------------------------------------------------------------------
    | a or b is a NaN.
    *------------------------------------------------------------------------*/
 propagateNaN_ABC:
    uiZ = softfloat_propagateNaNF128UI(uiA64, uiA0, uiB64, uiB0, status);
    goto propagateNaN_ZC;
    /*------------------------------------------------------------------------
    | a or b is infinite and neither is a NaN.
    *------------------------------------------------------------------------*/
 infProdArg:
    if ((sigC.v64 | sigC.v0) && expC == 0x7FFF) {
        /* c is a NaN.  uiZ has not been assigned on this path, so give it a
           defined non-NaN value before it is handed to the NaN propagation
           helper, exactly as the other NaN-c path above does. */
        uiZ.v64 = 0;
        uiZ.v0  = 0;
        goto propagateNaN_ZC;
    }
    if (magBits) {
        uiZ.v64 = packToF128UI64(signZ, 0x7FFF, 0);
        uiZ.v0  = 0;
        if (expC != 0x7FFF) return uiZ;
        if (signZ == signC) return uiZ;
    }
    /* infinity * 0, or infinities of opposite sign: invalid operation. */
    softfloat_raiseFlags(status, softfloat_flag_invalid);
    uiZ.v64 = defaultNaNF128UI64;
    uiZ.v0  = defaultNaNF128UI0;
 propagateNaN_ZC:
    uiZ = softfloat_propagateNaNF128UI(uiZ.v64, uiZ.v0, uiC64, uiC0, status);
    return uiZ;
    /*------------------------------------------------------------------------
    | The product is exactly zero: the result is the (possibly negated) addend,
    | except that zeros of opposite sign cancel to a rounding-mode-dependent
    | zero.
    *------------------------------------------------------------------------*/
 zeroProd:
    /* sigC.v64 still holds the raw fraction here; repack with signC so that
       softfloat_mulAdd_subC is honoured. */
    uiZ.v64 = packToF128UI64(signC, expC, sigC.v64);
    uiZ.v0  = uiC0;
    if (! (expC | sigC.v64 | sigC.v0) && (signZ != signC)) {
 completeCancellation:
        uiZ.v64 = packToF128UI64((softfloat_getRoundingMode(status) == softfloat_round_min), 0, 0);
        uiZ.v0  = 0;
    }
    return uiZ;
}
|
||||
Reference in New Issue
Block a user