Merge pull request #2694 from Subv/vfp_vsub_ftz

Dyncom/VFP: Perform flush-to-zero on the second operand of vsub before sending it to vadd.
This commit is contained in:
Merry 2017-05-22 00:50:52 +01:00 committed by GitHub
commit 188d63fdb6
1 changed files with 12 additions and 2 deletions

View File

@ -1049,12 +1049,22 @@ static u32 vfp_single_fadd(ARMul_State* state, int sd, int sn, s32 m, u32 fpscr)
static u32 vfp_single_fsub(ARMul_State* state, int sd, int sn, s32 m, u32 fpscr) { static u32 vfp_single_fsub(ARMul_State* state, int sd, int sn, s32 m, u32 fpscr) {
LOG_TRACE(Core_ARM11, "s%u = %08x", sn, sd); LOG_TRACE(Core_ARM11, "s%u = %08x", sn, sd);
/* /*
* Subtraction is addition with one sign inverted. * Subtraction is addition with one sign inverted. Unpack the second operand to perform FTZ if
* necessary, we can't let fadd do this because a denormal in m might get flushed to +0 in FTZ
* mode, and the resulting sign of 0 OP +0 differs between fadd and fsub. We do not need to do
* this for n because +0 OP 0 is always +0 for both fadd and fsub.
*/ */
struct vfp_single vsm;
u32 exceptions = vfp_single_unpack(&vsm, m, fpscr);
if (exceptions & FPSCR_IDC) {
// The value was flushed to zero, re-pack it.
m = vfp_single_pack(&vsm);
}
if (m != 0x7FC00000) // Only negate if m isn't NaN. if (m != 0x7FC00000) // Only negate if m isn't NaN.
m = vfp_single_packed_negate(m); m = vfp_single_packed_negate(m);
return vfp_single_fadd(state, sd, sn, m, fpscr); return vfp_single_fadd(state, sd, sn, m, fpscr) | exceptions;
} }
/* /*