mirror of https://github.com/PCSX2/pcsx2.git
mostly some VU changes.
git-svn-id: http://pcsx2-playground.googlecode.com/svn/trunk@109 a6443dda-0b58-4228-96e9-037be469359c
This commit is contained in:
parent
e147a43668
commit
3af97aacd5
|
@ -811,7 +811,7 @@ static void (*recComOpM32_to_XMM[] )(x86SSERegType, uptr) = {
|
||||||
int recCommutativeOp(int info, int regd, int op)
|
int recCommutativeOp(int info, int regd, int op)
|
||||||
{
|
{
|
||||||
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
||||||
if (t0reg == -1) {SysPrintf("FPU: CommutativeOp Allocation Error!\n");}
|
//if (t0reg == -1) {SysPrintf("FPU: CommutativeOp Allocation Error!\n");}
|
||||||
|
|
||||||
switch(info & (PROCESS_EE_S|PROCESS_EE_T) ) {
|
switch(info & (PROCESS_EE_S|PROCESS_EE_T) ) {
|
||||||
case PROCESS_EE_S:
|
case PROCESS_EE_S:
|
||||||
|
@ -882,7 +882,7 @@ void recSUBhelper(int regd, int regt)
|
||||||
void recSUBop(int info, int regd)
|
void recSUBop(int info, int regd)
|
||||||
{
|
{
|
||||||
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
||||||
if (t0reg == -1) {SysPrintf("FPU: SUB Allocation Error!\n");}
|
//if (t0reg == -1) {SysPrintf("FPU: SUB Allocation Error!\n");}
|
||||||
|
|
||||||
//AND32ItoM((uptr)&fpuRegs.fprc[31], ~(FPUflagO|FPUflagU)); // Clear O and U flags
|
//AND32ItoM((uptr)&fpuRegs.fprc[31], ~(FPUflagO|FPUflagU)); // Clear O and U flags
|
||||||
|
|
||||||
|
@ -954,7 +954,7 @@ void recDIVhelper1(int regd, int regt)
|
||||||
u32 *ajmp32, *bjmp32;
|
u32 *ajmp32, *bjmp32;
|
||||||
int t1reg = _allocTempXMMreg(XMMT_FPS, -1);
|
int t1reg = _allocTempXMMreg(XMMT_FPS, -1);
|
||||||
int tempReg = _allocX86reg(-1, X86TYPE_TEMP, 0, 0);
|
int tempReg = _allocX86reg(-1, X86TYPE_TEMP, 0, 0);
|
||||||
if (t1reg == -1) {SysPrintf("FPU: DIV Allocation Error!\n");}
|
//if (t1reg == -1) {SysPrintf("FPU: DIV Allocation Error!\n");}
|
||||||
if (tempReg == -1) {SysPrintf("FPU: DIV Allocation Error!\n"); tempReg = EAX;}
|
if (tempReg == -1) {SysPrintf("FPU: DIV Allocation Error!\n"); tempReg = EAX;}
|
||||||
|
|
||||||
AND32ItoM((uptr)&fpuRegs.fprc[31], ~(FPUflagI|FPUflagD)); // Clear I and D flags
|
AND32ItoM((uptr)&fpuRegs.fprc[31], ~(FPUflagI|FPUflagD)); // Clear I and D flags
|
||||||
|
@ -1009,7 +1009,7 @@ void recDIVhelper2(int regd, int regt)
|
||||||
void recDIV_S_xmm(int info)
|
void recDIV_S_xmm(int info)
|
||||||
{
|
{
|
||||||
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
||||||
if (t0reg == -1) {SysPrintf("FPU: DIV Allocation Error!\n");}
|
//if (t0reg == -1) {SysPrintf("FPU: DIV Allocation Error!\n");}
|
||||||
|
|
||||||
switch(info & (PROCESS_EE_S|PROCESS_EE_T) ) {
|
switch(info & (PROCESS_EE_S|PROCESS_EE_T) ) {
|
||||||
case PROCESS_EE_S:
|
case PROCESS_EE_S:
|
||||||
|
@ -1141,7 +1141,7 @@ void recRSQRThelper1(int regd, int t0reg)
|
||||||
u32 *pjmp32;
|
u32 *pjmp32;
|
||||||
int t1reg = _allocTempXMMreg(XMMT_FPS, -1);
|
int t1reg = _allocTempXMMreg(XMMT_FPS, -1);
|
||||||
int tempReg = _allocX86reg(-1, X86TYPE_TEMP, 0, 0);
|
int tempReg = _allocX86reg(-1, X86TYPE_TEMP, 0, 0);
|
||||||
if (t1reg == -1) {SysPrintf("FPU: RSQRT Allocation Error!\n");}
|
//if (t1reg == -1) {SysPrintf("FPU: RSQRT Allocation Error!\n");}
|
||||||
if (tempReg == -1) {SysPrintf("FPU: RSQRT Allocation Error!\n"); tempReg = EAX;}
|
if (tempReg == -1) {SysPrintf("FPU: RSQRT Allocation Error!\n"); tempReg = EAX;}
|
||||||
|
|
||||||
AND32ItoM((uptr)&fpuRegs.fprc[31], ~(FPUflagI|FPUflagD)); // Clear I and D flags
|
AND32ItoM((uptr)&fpuRegs.fprc[31], ~(FPUflagI|FPUflagD)); // Clear I and D flags
|
||||||
|
@ -1198,7 +1198,7 @@ void recRSQRThelper2(int regd, int t0reg)
|
||||||
void recRSQRT_S_xmm(int info)
|
void recRSQRT_S_xmm(int info)
|
||||||
{
|
{
|
||||||
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
int t0reg = _allocTempXMMreg(XMMT_FPS, -1);
|
||||||
if (t0reg == -1) {SysPrintf("FPU: RSQRT Allocation Error!\n");}
|
//if (t0reg == -1) {SysPrintf("FPU: RSQRT Allocation Error!\n");}
|
||||||
//SysPrintf("FPU: RSQRT\n");
|
//SysPrintf("FPU: RSQRT\n");
|
||||||
|
|
||||||
switch(info & (PROCESS_EE_S|PROCESS_EE_T) ) {
|
switch(info & (PROCESS_EE_S|PROCESS_EE_T) ) {
|
||||||
|
|
|
@ -1291,6 +1291,26 @@ static vFloat vFloats2[16] = { //regTemp is modified
|
||||||
vFloat8, vFloat9, vFloat10, vFloat11b,
|
vFloat8, vFloat9, vFloat10, vFloat11b,
|
||||||
vFloat12, vFloat13b, vFloat14b, vFloat15 };
|
vFloat12, vFloat13b, vFloat14b, vFloat15 };
|
||||||
|
|
||||||
|
|
||||||
|
PCSX2_ALIGNED16(u64 vuFloatData[2]);
|
||||||
|
PCSX2_ALIGNED16(u64 vuFloatData2[2]);
|
||||||
|
// Makes NaN == 0; Very Slow - Use only for debugging
|
||||||
|
void vuFloatExtra( int regd, int XYZW) {
|
||||||
|
int t1reg = (regd == 0) ? (regd + 1) : (regd - 1);
|
||||||
|
int t2reg = (regd <= 1) ? (regd + 2) : (regd - 2);
|
||||||
|
SSE_MOVAPS_XMM_to_M128( (uptr)vuFloatData, t1reg );
|
||||||
|
SSE_MOVAPS_XMM_to_M128( (uptr)vuFloatData2, t2reg );
|
||||||
|
|
||||||
|
SSE_XORPS_XMM_to_XMM(t1reg, t1reg);
|
||||||
|
SSE_CMPORDPS_XMM_to_XMM(t1reg, regd);
|
||||||
|
SSE_MOVAPS_XMM_to_XMM(t2reg, regd);
|
||||||
|
SSE_ANDPS_XMM_to_XMM(t2reg, t1reg);
|
||||||
|
VU_MERGE_REGS_CUSTOM(regd, t2reg, XYZW);
|
||||||
|
|
||||||
|
SSE_MOVAPS_M128_to_XMM( t1reg, (uptr)vuFloatData );
|
||||||
|
SSE_MOVAPS_M128_to_XMM( t2reg, (uptr)vuFloatData2 );
|
||||||
|
}
|
||||||
|
|
||||||
// Clamps infinities to max/min non-infinity number (doesn't use any temp regs)
|
// Clamps infinities to max/min non-infinity number (doesn't use any temp regs)
|
||||||
void vuFloat( int info, int regd, int XYZW) {
|
void vuFloat( int info, int regd, int XYZW) {
|
||||||
if( CHECK_OVERFLOW ) {
|
if( CHECK_OVERFLOW ) {
|
||||||
|
@ -1302,6 +1322,7 @@ void vuFloat( int info, int regd, int XYZW) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
}*/
|
}*/
|
||||||
|
//vuFloatExtra(regd, XYZW);
|
||||||
vFloats1[XYZW](regd, regd);
|
vFloats1[XYZW](regd, regd);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -1309,6 +1330,7 @@ void vuFloat( int info, int regd, int XYZW) {
|
||||||
// Clamps infinities to max/min non-infinity number (uses a temp reg)
|
// Clamps infinities to max/min non-infinity number (uses a temp reg)
|
||||||
void vuFloat2(int regd, int regTemp, int XYZW) {
|
void vuFloat2(int regd, int regTemp, int XYZW) {
|
||||||
if( CHECK_OVERFLOW ) {
|
if( CHECK_OVERFLOW ) {
|
||||||
|
//vuFloatExtra(regd, XYZW);
|
||||||
vFloats2[XYZW](regd, regTemp);
|
vFloats2[XYZW](regd, regTemp);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2533,9 +2555,7 @@ void recVUMI_MUL_xyzw_toD(VURegs *VU, int xyzw, int regd, int info)
|
||||||
SSE_XORPS_XMM_to_XMM(EEREC_TEMP, EEREC_TEMP);
|
SSE_XORPS_XMM_to_XMM(EEREC_TEMP, EEREC_TEMP);
|
||||||
VU_MERGE_REGS(regd, EEREC_TEMP);
|
VU_MERGE_REGS(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else {
|
else SSE_XORPS_XMM_to_XMM(regd, regd);
|
||||||
SSE_XORPS_XMM_to_XMM(regd, regd);
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
assert(xyzw==3);
|
assert(xyzw==3);
|
||||||
|
@ -2661,25 +2681,30 @@ void recVUMI_MADD_toD(VURegs *VU, int regd, int info)
|
||||||
if( regd == EEREC_ACC ) {
|
if( regd == EEREC_ACC ) {
|
||||||
SSE_MOVSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MOVSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else if (regd == EEREC_T) {
|
else if (regd == EEREC_T) {
|
||||||
SSE_MULSS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULSS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else if (regd == EEREC_S) {
|
else if (regd == EEREC_S) {
|
||||||
SSE_MULSS_XMM_to_XMM(regd, EEREC_T);
|
SSE_MULSS_XMM_to_XMM(regd, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
SSE_MOVSS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MOVSS_XMM_to_XMM(regd, EEREC_S);
|
||||||
SSE_MULSS_XMM_to_XMM(regd, EEREC_T);
|
SSE_MULSS_XMM_to_XMM(regd, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if (_X_Y_Z_W != 0xf) {
|
else if (_X_Y_Z_W != 0xf) {
|
||||||
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(EEREC_TEMP, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(EEREC_TEMP, EEREC_ACC);
|
||||||
|
|
||||||
VU_MERGE_REGS(regd, EEREC_TEMP);
|
VU_MERGE_REGS(regd, EEREC_TEMP);
|
||||||
|
@ -2688,19 +2713,23 @@ void recVUMI_MADD_toD(VURegs *VU, int regd, int info)
|
||||||
if( regd == EEREC_ACC ) {
|
if( regd == EEREC_ACC ) {
|
||||||
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else if (regd == EEREC_T) {
|
else if (regd == EEREC_T) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else if (regd == EEREC_S) {
|
else if (regd == EEREC_S) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
SSE_MOVAPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MOVAPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2726,16 +2755,19 @@ void recVUMI_MADD_iq_toD(VURegs *VU, uptr addr, int regd, int info)
|
||||||
assert( EEREC_TEMP < XMMREGS );
|
assert( EEREC_TEMP < XMMREGS );
|
||||||
SSE_MOVSS_M32_to_XMM(EEREC_TEMP, addr);
|
SSE_MOVSS_M32_to_XMM(EEREC_TEMP, addr);
|
||||||
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_S ) {
|
else if( regd == EEREC_S ) {
|
||||||
SSE_MULSS_M32_to_XMM(regd, addr);
|
SSE_MULSS_M32_to_XMM(regd, addr);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
SSE_MOVSS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MOVSS_XMM_to_XMM(regd, EEREC_S);
|
||||||
SSE_MULSS_M32_to_XMM(regd, addr);
|
SSE_MULSS_M32_to_XMM(regd, addr);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2758,6 +2790,7 @@ void recVUMI_MADD_iq_toD(VURegs *VU, uptr addr, int regd, int info)
|
||||||
|
|
||||||
if (_X_Y_Z_W != 0xf) {
|
if (_X_Y_Z_W != 0xf) {
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(EEREC_TEMP, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(EEREC_TEMP, EEREC_ACC);
|
||||||
|
|
||||||
VU_MERGE_REGS(regd, EEREC_TEMP);
|
VU_MERGE_REGS(regd, EEREC_TEMP);
|
||||||
|
@ -2765,20 +2798,24 @@ void recVUMI_MADD_iq_toD(VURegs *VU, uptr addr, int regd, int info)
|
||||||
else {
|
else {
|
||||||
if( regd == EEREC_ACC ) {
|
if( regd == EEREC_ACC ) {
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_S ) {
|
else if( regd == EEREC_S ) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_TEMP ) {
|
else if( regd == EEREC_TEMP ) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
SSE_MOVSS_M32_to_XMM(regd, addr);
|
SSE_MOVSS_M32_to_XMM(regd, addr);
|
||||||
SSE_SHUFPS_XMM_to_XMM(regd, regd, 0x00);
|
SSE_SHUFPS_XMM_to_XMM(regd, regd, 0x00);
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2841,19 +2878,23 @@ void recVUMI_MADD_xyzw_toD(VURegs *VU, int xyzw, int regd, int info)
|
||||||
|
|
||||||
if( regd == EEREC_ACC ) {
|
if( regd == EEREC_ACC ) {
|
||||||
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_S ) {
|
else if( regd == EEREC_S ) {
|
||||||
SSE_MULSS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_MULSS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_TEMP ) {
|
else if( regd == EEREC_TEMP ) {
|
||||||
SSE_MULSS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULSS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
SSE_MOVSS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_MOVSS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULSS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, 8); }
|
||||||
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDSS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2863,6 +2904,7 @@ void recVUMI_MADD_xyzw_toD(VURegs *VU, int xyzw, int regd, int info)
|
||||||
|
|
||||||
if (_X_Y_Z_W != 0xf) {
|
if (_X_Y_Z_W != 0xf) {
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(EEREC_TEMP, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(EEREC_TEMP, EEREC_ACC);
|
||||||
|
|
||||||
VU_MERGE_REGS(regd, EEREC_TEMP);
|
VU_MERGE_REGS(regd, EEREC_TEMP);
|
||||||
|
@ -2870,19 +2912,23 @@ void recVUMI_MADD_xyzw_toD(VURegs *VU, int xyzw, int regd, int info)
|
||||||
else {
|
else {
|
||||||
if( regd == EEREC_ACC ) {
|
if( regd == EEREC_ACC ) {
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_S ) {
|
else if( regd == EEREC_S ) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_TEMP ) {
|
else if( regd == EEREC_TEMP ) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
_unpackVF_xyzw(regd, EEREC_T, xyzw);
|
_unpackVF_xyzw(regd, EEREC_T, xyzw);
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_ADDPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2987,6 +3033,7 @@ void recVUMI_MSUB_toD(VURegs *VU, int regd, int info)
|
||||||
|
|
||||||
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
|
|
||||||
if( t1reg >= 0 ) {
|
if( t1reg >= 0 ) {
|
||||||
SSE_MOVAPS_XMM_to_XMM(t1reg, EEREC_ACC);
|
SSE_MOVAPS_XMM_to_XMM(t1reg, EEREC_ACC);
|
||||||
|
@ -3005,18 +3052,21 @@ void recVUMI_MSUB_toD(VURegs *VU, int regd, int info)
|
||||||
if( regd == EEREC_S ) {
|
if( regd == EEREC_S ) {
|
||||||
assert( regd != EEREC_ACC );
|
assert( regd != EEREC_ACC );
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_T ) {
|
else if( regd == EEREC_T ) {
|
||||||
assert( regd != EEREC_ACC );
|
assert( regd != EEREC_ACC );
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_TEMP ) {
|
else if( regd == EEREC_TEMP ) {
|
||||||
SSE_MOVAPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MOVAPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
||||||
}
|
}
|
||||||
|
@ -3024,6 +3074,7 @@ void recVUMI_MSUB_toD(VURegs *VU, int regd, int info)
|
||||||
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MOVAPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
if( regd != EEREC_ACC ) SSE_MOVAPS_XMM_to_XMM(regd, EEREC_ACC);
|
if( regd != EEREC_ACC ) SSE_MOVAPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_T);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -3041,6 +3092,7 @@ void recVUMI_MSUB_temp_toD(VURegs *VU, int regd, int info)
|
||||||
int t1reg = _vuGetTempXMMreg(info);
|
int t1reg = _vuGetTempXMMreg(info);
|
||||||
|
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
|
|
||||||
if( t1reg >= 0 ) {
|
if( t1reg >= 0 ) {
|
||||||
SSE_MOVAPS_XMM_to_XMM(t1reg, EEREC_ACC);
|
SSE_MOVAPS_XMM_to_XMM(t1reg, EEREC_ACC);
|
||||||
|
@ -3063,21 +3115,25 @@ void recVUMI_MSUB_temp_toD(VURegs *VU, int regd, int info)
|
||||||
else {
|
else {
|
||||||
if( regd == EEREC_ACC ) {
|
if( regd == EEREC_ACC ) {
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_S ) {
|
else if( regd == EEREC_S ) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
||||||
}
|
}
|
||||||
else if( regd == EEREC_TEMP ) {
|
else if( regd == EEREC_TEMP ) {
|
||||||
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(regd, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, regd, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
SSE_XORPS_M128_to_XMM(regd, (uptr)&const_clip[4]);
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
if( regd != EEREC_ACC ) SSE_MOVAPS_XMM_to_XMM(regd, EEREC_ACC);
|
if( regd != EEREC_ACC ) SSE_MOVAPS_XMM_to_XMM(regd, EEREC_ACC);
|
||||||
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
SSE_MULPS_XMM_to_XMM(EEREC_TEMP, EEREC_S);
|
||||||
|
if (CHECK_EXTRA_OVERFLOW) { vuFloat( info, EEREC_TEMP, _X_Y_Z_W); }
|
||||||
SSE_SUBPS_XMM_to_XMM(regd, EEREC_TEMP);
|
SSE_SUBPS_XMM_to_XMM(regd, EEREC_TEMP);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue