Jit64: Simplify dcbz.

This commit is contained in:
degasus 2016-08-23 22:52:34 +02:00
parent ef0dcfe558
commit 2925a5b219
1 changed files with 24 additions and 30 deletions

View File

@ -368,43 +368,37 @@ void Jit64::dcbz(UGeckoInstruction inst)
MOV(32, R(RSCRATCH), gpr.R(b)); MOV(32, R(RSCRATCH), gpr.R(b));
if (a) if (a)
ADD(32, R(RSCRATCH), gpr.R(a)); ADD(32, R(RSCRATCH), gpr.R(a));
AND(32, R(RSCRATCH), Imm32(~31));
if (!UReg_MSR(MSR).DR) if (UReg_MSR(MSR).DR)
{ {
// If address translation is turned off, just call the general-case code. // Perform lookup to see if we can use fast path.
AND(32, R(RSCRATCH), Imm32(~31)); MOV(32, R(RSCRATCH2), R(RSCRATCH));
MOV(32, M(&PC), Imm32(jit->js.compilerPC)); SHR(32, R(RSCRATCH2), Imm8(PowerPC::BAT_INDEX_SHIFT));
BitSet32 registersInUse = CallerSavedRegistersInUse(); TEST(32, MScaled(RSCRATCH2, SCALE_4, (u32)(u64)PowerPC::dbat_table), Imm32(2));
ABI_PushRegistersAndAdjustStack(registersInUse, 0); FixupBranch slow = J_CC(CC_Z, true);
ABI_CallFunctionR((void*)&PowerPC::ClearCacheLine, RSCRATCH);
ABI_PopRegistersAndAdjustStack(registersInUse, 0); // Fast path: compute full address, then zero out 32 bytes of memory.
return; PXOR(XMM0, R(XMM0));
MOVAPS(MComplex(RMEM, RSCRATCH, SCALE_1, 0), XMM0);
MOVAPS(MComplex(RMEM, RSCRATCH, SCALE_1, 16), XMM0);
// Slow path: call the general-case code.
SwitchToFarCode();
SetJumpTarget(slow);
} }
// Perform lookup to see if we can use fast path.
MOV(32, R(RSCRATCH2), R(RSCRATCH));
SHR(32, R(RSCRATCH), Imm8(PowerPC::BAT_INDEX_SHIFT));
TEST(32, MScaled(RSCRATCH, SCALE_4, (u32)(u64)PowerPC::dbat_table), Imm32(2));
FixupBranch slow = J_CC(CC_Z, true);
// Fast path: compute full address, then zero out 32 bytes of memory.
AND(32, R(RSCRATCH2), Imm8(~31));
PXOR(XMM0, R(XMM0));
MOVAPS(MComplex(RMEM, RSCRATCH2, SCALE_1, 0), XMM0);
MOVAPS(MComplex(RMEM, RSCRATCH2, SCALE_1, 16), XMM0);
// Slow path: mask the address, then call the general-case code.
SwitchToFarCode();
SetJumpTarget(slow);
AND(32, R(RSCRATCH2), Imm32(~31));
MOV(32, M(&PC), Imm32(jit->js.compilerPC)); MOV(32, M(&PC), Imm32(jit->js.compilerPC));
BitSet32 registersInUse = CallerSavedRegistersInUse(); BitSet32 registersInUse = CallerSavedRegistersInUse();
ABI_PushRegistersAndAdjustStack(registersInUse, 0); ABI_PushRegistersAndAdjustStack(registersInUse, 0);
ABI_CallFunctionR(&PowerPC::ClearCacheLine, RSCRATCH2); ABI_CallFunctionR(&PowerPC::ClearCacheLine, RSCRATCH);
ABI_PopRegistersAndAdjustStack(registersInUse, 0); ABI_PopRegistersAndAdjustStack(registersInUse, 0);
FixupBranch end = J(true);
SwitchToNearCode(); if (UReg_MSR(MSR).DR)
SetJumpTarget(end); {
FixupBranch end = J(true);
SwitchToNearCode();
SetJumpTarget(end);
}
} }
void Jit64::stX(UGeckoInstruction inst) void Jit64::stX(UGeckoInstruction inst)