x86jit: Correctly handle NaNs in vfpxd sat clamps.

May be a small performance jit, but we've seen games with bugs because of NaNs recently, so better to be safe.
2024-11-23 21:39:52 +00:00 · 2014-05-16 00:55:34 -07:00 · 2014-05-16 00:55:34 -07:00 · ccc5458a84
commit ccc5458a84
parent 69b0b622be
1 changed files with 23 additions and 4 deletions
--- a/Core/MIPS/x86/CompVFPU.cpp
+++ b/Core/MIPS/x86/CompVFPU.cpp
@ -165,14 +165,33 @@ void Jit::ApplyPrefixD(const u8 *vregs, VectorSize sz) {
 		if (sat == 1)
 		{
 			fpr.MapRegV(vregs[i], MAP_DIRTY);
-			MAXSS(fpr.VX(vregs[i]), M(&zero));
-			MINSS(fpr.VX(vregs[i]), M(&one));
+
+			// Zero out XMM0 if it was <= +0.0f (but skip NAN.)
+			MOVSS(R(XMM0), fpr.VX(vregs[i]));
+			CMPLESS(XMM0, M(&zero));
+			ANDNPS(XMM0, fpr.V(vregs[i]));
+
+			// Retain a NAN in XMM0 (must be second operand.)
+			MOVSS(fpr.VX(vregs[i]), M(&one));
+			MINSS(fpr.VX(vregs[i]), R(XMM0));
 		}
 		else if (sat == 3)
 		{
 			fpr.MapRegV(vregs[i], MAP_DIRTY);
-			MAXSS(fpr.VX(vregs[i]), M(&minus_one));
-			MINSS(fpr.VX(vregs[i]), M(&one));
+
+			// Check for < -1.0f, but careful of NANs.
+			MOVSS(XMM1, M(&minus_one));
+			MOVSS(R(XMM0), fpr.VX(vregs[i]));
+			CMPLESS(XMM0, R(XMM1));
+			// If it was NOT less, the three ops below do nothing.
+			// Otherwise, they replace the value with -1.0f.
+			ANDPS(XMM1, R(XMM0));
+			ANDNPS(XMM0, fpr.V(vregs[i]));
+			ORPS(XMM0, R(XMM1));
+
+			// Retain a NAN in XMM0 (must be second operand.)
+			MOVSS(fpr.VX(vregs[i]), M(&one));
+			MINSS(fpr.VX(vregs[i]), R(XMM0));
 		}
 	}
 }