mirror of https://github.com/PCSX2/pcsx2.git
<cotton>for april fools i can put on my next commit that microVU is finished and doubles fps
<cotton>but i guess i shouldn't do that on the svn :D <cotton>or maybe i can >.> <.< >.> git-svn-id: http://pcsx2.googlecode.com/svn/trunk@878 96395faa-99c1-11dd-bbfe-3dabce05a288
This commit is contained in:
parent
1e4f48437f
commit
a547ef4cea
|
@ -25,11 +25,20 @@
|
|||
|
||||
#define testZero(xmmReg, xmmTemp, gprTemp) { \
|
||||
SSE_XORPS_XMM_to_XMM(xmmTemp, xmmTemp); /* Clear xmmTemp (make it 0) */ \
|
||||
SSE_CMPEQPS_XMM_to_XMM(xmmTemp, xmmReg); /* Set all F's if each vector is zero */ \
|
||||
SSE_CMPEQPS_XMM_to_XMM(xmmTemp, xmmReg); /* Set all F's if zero */ \
|
||||
SSE_MOVMSKPS_XMM_to_R32(gprTemp, xmmTemp); /* Move the sign bits */ \
|
||||
TEST32ItoR(gprTemp, 1); /* Test "Is Zero" bit */ \
|
||||
}
|
||||
|
||||
#define testNeg(xmmReg, gprTemp, aJump) { \
|
||||
SSE_MOVMSKPS_XMM_to_R32(gprTemp, xmmReg); \
|
||||
TEST32ItoR(gprTemp, 1); /* Check sign bit */ \
|
||||
aJump = JZ8(0); /* Skip if positive */ \
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0x410); /* Set Invalid Flags */ \
|
||||
SSE_ANDPS_M128_to_XMM(xmmReg, (uptr)mVU_absclip); /* Abs(xmmReg) */ \
|
||||
x86SetJ8(aJump); \
|
||||
}
|
||||
|
||||
microVUf(void) mVU_DIV() {
|
||||
microVU* mVU = mVUx;
|
||||
if (!recPass) { mVUanalyzeFDIV<vuIndex>(_Fs_, _Fsf_, _Ft_, _Ftf_); }
|
||||
|
@ -69,17 +78,11 @@ microVUf(void) mVU_SQRT() {
|
|||
microVU* mVU = mVUx;
|
||||
if (!recPass) { mVUanalyzeFDIV<vuIndex>(0, 0, _Ft_, _Ftf_); }
|
||||
else {
|
||||
u8* ajmp;
|
||||
u8 *ajmp;
|
||||
getReg5(xmmFt, _Ft_, _Ftf_);
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0); // Clear I/D flags
|
||||
|
||||
/* Check for negative sqrt */
|
||||
SSE_MOVMSKPS_XMM_to_R32(gprT1, xmmFt);
|
||||
AND32ItoR(gprT1, 1); //Check sign
|
||||
ajmp = JZ8(0); //Skip if none are
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0x410); // Invalid Flag - Negative number sqrt
|
||||
SSE_ANDPS_M128_to_XMM(xmmFt, (uptr)mVU_absclip); // Do a cardinal sqrt
|
||||
x86SetJ8(ajmp);
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0); // Clear I/D flags
|
||||
testNeg(xmmFt, gprT1, ajmp); // Check for negative sqrt
|
||||
|
||||
if (CHECK_VU_OVERFLOW) SSE_MINSS_XMM_to_XMM(xmmFt, xmmMax); // Clamp infinities (only need to do positive clamp since xmmFt is positive)
|
||||
SSE_SQRTSS_XMM_to_XMM(xmmFt, xmmFt);
|
||||
|
@ -92,39 +95,33 @@ microVUf(void) mVU_RSQRT() {
|
|||
microVU* mVU = mVUx;
|
||||
if (!recPass) { mVUanalyzeFDIV<vuIndex>(_Fs_, _Fsf_, _Ft_, _Ftf_); }
|
||||
else {
|
||||
u8 *ajmp8, *bjmp8, *cjmp8, *djmp8;
|
||||
u8 *ajmp, *bjmp, *cjmp, *djmp;
|
||||
getReg5(xmmFs, _Fs_, _Fsf_);
|
||||
getReg5(xmmFt, _Ft_, _Ftf_);
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0); // Clear I/D flags
|
||||
|
||||
/* Check for negative divide */
|
||||
SSE_MOVMSKPS_XMM_to_R32(gprT1, xmmT1);
|
||||
AND32ItoR(gprT1, 1); //Check sign
|
||||
ajmp8 = JZ8(0); //Skip if none are
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0x410); // Invalid Flag - Negative number sqrt
|
||||
SSE_ANDPS_M128_to_XMM(xmmFt, (uptr)mVU_absclip); // Do a cardinal sqrt
|
||||
x86SetJ8(ajmp8);
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0); // Clear I/D flags
|
||||
testNeg(xmmFt, gprT1, ajmp); // Check for negative sqrt
|
||||
|
||||
SSE_SQRTSS_XMM_to_XMM(xmmFt, xmmFt);
|
||||
testZero(xmmFt, xmmT1, gprT1); // Test if Ft is zero
|
||||
ajmp8 = JZ8(0); // Skip if not zero
|
||||
ajmp = JZ8(0); // Skip if not zero
|
||||
|
||||
testZero(xmmFs, xmmT1, gprT1); // Test if Fs is zero
|
||||
bjmp8 = JZ8(0); // Skip if none are
|
||||
bjmp = JZ8(0); // Skip if none are
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0x410); // Set invalid flag (0/0)
|
||||
cjmp8 = JMP8(0);
|
||||
x86SetJ8(bjmp8);
|
||||
cjmp = JMP8(0);
|
||||
x86SetJ8(bjmp);
|
||||
MOV32ItoM((uptr)&mVU->divFlag, 0x820); // Zero divide flag (only when not 0/0)
|
||||
x86SetJ8(cjmp8);
|
||||
x86SetJ8(cjmp);
|
||||
|
||||
SSE_ANDPS_M128_to_XMM(xmmFs, (uptr)mVU_signbit);
|
||||
SSE_ORPS_XMM_to_XMM(xmmFs, xmmMax); // xmmFs = +/-Max
|
||||
|
||||
djmp8 = JMP8(0);
|
||||
x86SetJ8(ajmp8);
|
||||
djmp = JMP8(0);
|
||||
x86SetJ8(ajmp);
|
||||
SSE_DIVSS_XMM_to_XMM(xmmFs, xmmFt);
|
||||
mVUclamp1<vuIndex>(xmmFs, xmmFt, 8);
|
||||
x86SetJ8(djmp8);
|
||||
x86SetJ8(djmp);
|
||||
|
||||
mVUunpack_xyzw<vuIndex>(xmmFs, xmmFs, 0);
|
||||
mVUmergeRegs<vuIndex>(xmmPQ, xmmFs, writeQ ? 4 : 8);
|
||||
|
@ -184,7 +181,7 @@ microVUf(void) mVU_EATANxy() {
|
|||
SSE2_PSHUFD_XMM_to_XMM(xmmPQ, xmmPQ, writeP ? 0x27 : 0xC6); // Flip xmmPQ to get Valid P instance
|
||||
|
||||
SSE_MOVSS_XMM_to_XMM(xmmPQ, xmmFs);
|
||||
SSE_SUBSS_M32_to_XMM(xmmFs, (uptr)mVU_one);
|
||||
SSE_SUBSS_XMM_to_XMM(xmmFs, xmmFt); // y-x, not y-1? ><
|
||||
SSE_ADDSS_XMM_to_XMM(xmmFt, xmmPQ);
|
||||
SSE_DIVSS_XMM_to_XMM(xmmFs, xmmFt);
|
||||
|
||||
|
|
Loading…
Reference in New Issue