[JIT] Properly mask NaNs in vctsxs

2018-03-03 13:56:30 -06:00 · 2018-03-03 13:56:30 -06:00 · 1c1fdb4ccd
parent a9d2a50082
commit 1c1fdb4ccd
1 changed files with 12 additions and 9 deletions
--- a/src/xenia/cpu/backend/x64/x64_sequences.cc
+++ b/src/xenia/cpu/backend/x64/x64_sequences.cc
@ -1634,18 +1634,21 @@ struct VECTOR_CONVERT_F2I
      // saturate values > UINT_MAX
      e.vpor(i.dest, i.dest, e.xmm0);
    } else {
-      Xmm src1 = e.xmm2;
+      // xmm2 = NaN mask
-      e.vmovdqa(src1, i.src1);  // Duplicate src1.
+      e.vcmpunordps(e.xmm2, i.src1, i.src1);
-      e.vcvttps2dq(i.dest, i.src1);
+      // convert packed floats to packed dwords
      e.vcvttps2dq(e.xmm0, i.src1);
-      // if dest is indeterminate and i.src1 >= 0 (i.e. !(i.src1 & 0x80000000))
+      // (high bit) xmm1 = dest is indeterminate and i.src1 >= 0
-      //   i.dest = 0x7FFFFFFF
+      e.vpcmpeqd(e.xmm1, e.xmm0, e.GetXmmConstPtr(XMMIntMin));
-      e.vpcmpeqd(e.xmm0, i.dest, e.GetXmmConstPtr(XMMIntMin));
+      e.vpandn(e.xmm1, i.src1, e.xmm1);
      e.vpandn(e.xmm0, src1, e.xmm0);
-      // (high bit of xmm0 = is ind. && i.src1 >= 0)
+      // saturate positive values
-      e.vblendvps(i.dest, i.dest, e.GetXmmConstPtr(XMMIntMax), e.xmm0);
+      e.vblendvps(i.dest, e.xmm0, e.GetXmmConstPtr(XMMIntMax), e.xmm1);
      // mask NaNs
      e.vpandn(i.dest, e.xmm2, i.dest);
    }
  }
 };