subtract cycles after checking IRQ and Halt

Also switch back to adding to ARM::Cycles instead of subtracting from it.
This commit is contained in:
RSDuck 2020-07-27 23:14:23 +02:00
parent 026d0dcab8
commit 5903b11bda
6 changed files with 59 additions and 62 deletions

View File

@ -274,15 +274,15 @@ void ARMv5::JumpTo(u32 addr, bool restorecpsr)
if (addr & 0x2) if (addr & 0x2)
{ {
NextInstr[0] = CodeRead32(addr-2, true) >> 16; NextInstr[0] = CodeRead32(addr-2, true) >> 16;
Cycles -= CodeCycles; Cycles += CodeCycles;
NextInstr[1] = CodeRead32(addr+2, false); NextInstr[1] = CodeRead32(addr+2, false);
Cycles -= CodeCycles; Cycles += CodeCycles;
} }
else else
{ {
NextInstr[0] = CodeRead32(addr, true); NextInstr[0] = CodeRead32(addr, true);
NextInstr[1] = NextInstr[0] >> 16; NextInstr[1] = NextInstr[0] >> 16;
Cycles -= CodeCycles; Cycles += CodeCycles;
} }
CPSR |= 0x20; CPSR |= 0x20;
@ -295,9 +295,9 @@ void ARMv5::JumpTo(u32 addr, bool restorecpsr)
if (newregion != oldregion) SetupCodeMem(addr); if (newregion != oldregion) SetupCodeMem(addr);
NextInstr[0] = CodeRead32(addr, true); NextInstr[0] = CodeRead32(addr, true);
Cycles -= CodeCycles; Cycles += CodeCycles;
NextInstr[1] = CodeRead32(addr+4, false); NextInstr[1] = CodeRead32(addr+4, false);
Cycles -= CodeCycles; Cycles += CodeCycles;
CPSR &= ~0x20; CPSR &= ~0x20;
} }
@ -337,7 +337,7 @@ void ARMv4::JumpTo(u32 addr, bool restorecpsr)
NextInstr[0] = CodeRead16(addr); NextInstr[0] = CodeRead16(addr);
NextInstr[1] = CodeRead16(addr+2); NextInstr[1] = CodeRead16(addr+2);
Cycles -= NDS::ARM7MemTimings[CodeCycles][0] + NDS::ARM7MemTimings[CodeCycles][1]; Cycles += NDS::ARM7MemTimings[CodeCycles][0] + NDS::ARM7MemTimings[CodeCycles][1];
CPSR |= 0x20; CPSR |= 0x20;
} }
@ -350,7 +350,7 @@ void ARMv4::JumpTo(u32 addr, bool restorecpsr)
NextInstr[0] = CodeRead32(addr); NextInstr[0] = CodeRead32(addr);
NextInstr[1] = CodeRead32(addr+4); NextInstr[1] = CodeRead32(addr+4);
Cycles -= NDS::ARM7MemTimings[CodeCycles][2] + NDS::ARM7MemTimings[CodeCycles][3]; Cycles += NDS::ARM7MemTimings[CodeCycles][2] + NDS::ARM7MemTimings[CodeCycles][3];
CPSR &= ~0x20; CPSR &= ~0x20;
} }
@ -609,7 +609,7 @@ void ARMv5::Execute()
}*/ }*/
if (IRQ) TriggerIRQ(); if (IRQ) TriggerIRQ();
NDS::ARM9Timestamp -= Cycles; NDS::ARM9Timestamp += Cycles;
Cycles = 0; Cycles = 0;
} }
@ -643,9 +643,6 @@ void ARMv5::ExecuteJIT()
{ {
u32 instrAddr = R[15] - ((CPSR&0x20)?2:4); u32 instrAddr = R[15] - ((CPSR&0x20)?2:4);
// hack so Cycles <= 0 becomes Cycles < 0
Cycles = NDS::ARM9Target - NDS::ARM9Timestamp - 1;
if ((instrAddr < FastBlockLookupStart || instrAddr >= (FastBlockLookupStart + FastBlockLookupSize)) if ((instrAddr < FastBlockLookupStart || instrAddr >= (FastBlockLookupStart + FastBlockLookupSize))
&& !ARMJIT::SetupExecutableRegion(0, instrAddr, FastBlockLookup, FastBlockLookupStart, FastBlockLookupSize)) && !ARMJIT::SetupExecutableRegion(0, instrAddr, FastBlockLookup, FastBlockLookupStart, FastBlockLookupSize))
{ {
@ -661,13 +658,8 @@ void ARMv5::ExecuteJIT()
else else
ARMJIT::CompileBlock(this); ARMJIT::CompileBlock(this);
NDS::ARM9Timestamp = NDS::ARM9Target - Cycles - 1;
if (StopExecution) if (StopExecution)
{ {
if (IRQ)
TriggerIRQ();
if (Halted || IdleLoop) if (Halted || IdleLoop)
{ {
bool idleLoop = IdleLoop; bool idleLoop = IdleLoop;
@ -678,7 +670,13 @@ void ARMv5::ExecuteJIT()
} }
break; break;
} }
if (IRQ)
TriggerIRQ();
} }
NDS::ARM9Timestamp += Cycles;
Cycles = 0;
} }
if (Halted == 2) if (Halted == 2)
@ -755,7 +753,7 @@ void ARMv4::Execute()
}*/ }*/
if (IRQ) TriggerIRQ(); if (IRQ) TriggerIRQ();
NDS::ARM7Timestamp -= Cycles; NDS::ARM7Timestamp += Cycles;
Cycles = 0; Cycles = 0;
} }
@ -795,8 +793,6 @@ void ARMv4::ExecuteJIT()
{ {
u32 instrAddr = R[15] - ((CPSR&0x20)?2:4); u32 instrAddr = R[15] - ((CPSR&0x20)?2:4);
Cycles = NDS::ARM7Target - NDS::ARM7Timestamp - 1;
if ((instrAddr < FastBlockLookupStart || instrAddr >= (FastBlockLookupStart + FastBlockLookupSize)) if ((instrAddr < FastBlockLookupStart || instrAddr >= (FastBlockLookupStart + FastBlockLookupSize))
&& !ARMJIT::SetupExecutableRegion(1, instrAddr, FastBlockLookup, FastBlockLookupStart, FastBlockLookupSize)) && !ARMJIT::SetupExecutableRegion(1, instrAddr, FastBlockLookup, FastBlockLookupStart, FastBlockLookupSize))
{ {
@ -812,14 +808,9 @@ void ARMv4::ExecuteJIT()
else else
ARMJIT::CompileBlock(this); ARMJIT::CompileBlock(this);
NDS::ARM7Timestamp = NDS::ARM7Target - Cycles - 1;
// TODO optimize this shit!!! // TODO optimize this shit!!!
if (StopExecution) if (StopExecution)
{ {
if (IRQ)
TriggerIRQ();
if (Halted || IdleLoop) if (Halted || IdleLoop)
{ {
bool idleLoop = IdleLoop; bool idleLoop = IdleLoop;
@ -830,7 +821,13 @@ void ARMv4::ExecuteJIT()
} }
break; break;
} }
if (IRQ)
TriggerIRQ();
} }
NDS::ARM7Timestamp += Cycles;
Cycles = 0;
} }
if (Halted == 2) if (Halted == 2)

View File

@ -202,14 +202,14 @@ public:
{ {
// code only. always nonseq 32-bit for ARM9. // code only. always nonseq 32-bit for ARM9.
s32 numC = (R[15] & 0x2) ? 0 : CodeCycles; s32 numC = (R[15] & 0x2) ? 0 : CodeCycles;
Cycles -= numC; Cycles += numC;
} }
void AddCycles_CI(s32 numI) void AddCycles_CI(s32 numI)
{ {
// code+internal // code+internal
s32 numC = (R[15] & 0x2) ? 0 : CodeCycles; s32 numC = (R[15] & 0x2) ? 0 : CodeCycles;
Cycles -= numC + numI; Cycles += numC + numI;
} }
void AddCycles_CDI() void AddCycles_CDI()
@ -220,9 +220,9 @@ public:
s32 numD = DataCycles; s32 numD = DataCycles;
//if (DataRegion != CodeRegion) //if (DataRegion != CodeRegion)
Cycles -= std::max(numC + numD - 6, std::max(numC, numD)); Cycles += std::max(numC + numD - 6, std::max(numC, numD));
//else //else
// Cycles -= numC + numD; // Cycles += numC + numD;
} }
void AddCycles_CD() void AddCycles_CD()
@ -232,9 +232,9 @@ public:
s32 numD = DataCycles; s32 numD = DataCycles;
//if (DataRegion != CodeRegion) //if (DataRegion != CodeRegion)
Cycles -= std::max(numC + numD - 6, std::max(numC, numD)); Cycles += std::max(numC + numD - 6, std::max(numC, numD));
//else //else
// Cycles -= numC + numD; // Cycles += numC + numD;
} }
void GetCodeMemRegion(u32 addr, NDS::MemRegion* region); void GetCodeMemRegion(u32 addr, NDS::MemRegion* region);
@ -396,13 +396,13 @@ public:
void AddCycles_C() void AddCycles_C()
{ {
// code only. this code fetch is sequential. // code only. this code fetch is sequential.
Cycles -= NDS::ARM7MemTimings[CodeCycles][(CPSR&0x20)?1:3]; Cycles += NDS::ARM7MemTimings[CodeCycles][(CPSR&0x20)?1:3];
} }
void AddCycles_CI(s32 num) void AddCycles_CI(s32 num)
{ {
// code+internal. results in a nonseq code fetch. // code+internal. results in a nonseq code fetch.
Cycles -= NDS::ARM7MemTimings[CodeCycles][(CPSR&0x20)?0:2] + num; Cycles += NDS::ARM7MemTimings[CodeCycles][(CPSR&0x20)?0:2] + num;
} }
void AddCycles_CDI() void AddCycles_CDI()
@ -414,21 +414,21 @@ public:
if ((DataRegion >> 24) == 0x02) // mainRAM if ((DataRegion >> 24) == 0x02) // mainRAM
{ {
if (CodeRegion == 0x02) if (CodeRegion == 0x02)
Cycles -= numC + numD; Cycles += numC + numD;
else else
{ {
numC++; numC++;
Cycles -= std::max(numC + numD - 3, std::max(numC, numD)); Cycles += std::max(numC + numD - 3, std::max(numC, numD));
} }
} }
else if (CodeRegion == 0x02) else if (CodeRegion == 0x02)
{ {
numD++; numD++;
Cycles -= std::max(numC + numD - 3, std::max(numC, numD)); Cycles += std::max(numC + numD - 3, std::max(numC, numD));
} }
else else
{ {
Cycles -= numC + numD + 1; Cycles += numC + numD + 1;
} }
} }
@ -441,17 +441,17 @@ public:
if ((DataRegion >> 24) == 0x02) if ((DataRegion >> 24) == 0x02)
{ {
if (CodeRegion == 0x02) if (CodeRegion == 0x02)
Cycles -= numC + numD; Cycles += numC + numD;
else else
Cycles -= std::max(numC + numD - 3, std::max(numC, numD)); Cycles += std::max(numC + numD - 3, std::max(numC, numD));
} }
else if (CodeRegion == 0x02) else if (CodeRegion == 0x02)
{ {
Cycles -= std::max(numC + numD - 3, std::max(numC, numD)); Cycles += std::max(numC + numD - 3, std::max(numC, numD));
} }
else else
{ {
Cycles -= numC + numD; Cycles += numC + numD;
} }
} }
}; };

View File

@ -143,7 +143,7 @@ void Compiler::Comp_JumpTo(u32 addr, bool forceNonConstantCycles)
if ((Thumb || CurInstr.Cond() >= 0xE) && !forceNonConstantCycles) if ((Thumb || CurInstr.Cond() >= 0xE) && !forceNonConstantCycles)
ConstantCycles += cycles; ConstantCycles += cycles;
else else
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
} }
@ -181,7 +181,7 @@ void* Compiler::Gen_JumpTo9(int kind)
STR(INDEX_UNSIGNED, W0, RCPU, offsetof(ARMv5, R[15])); STR(INDEX_UNSIGNED, W0, RCPU, offsetof(ARMv5, R[15]));
ADD(W1, W1, W1); ADD(W1, W1, W1);
SUB(RCycles, RCycles, W1); ADD(RCycles, RCycles, W1);
RET(); RET();
} }
@ -201,7 +201,7 @@ void* Compiler::Gen_JumpTo9(int kind)
ADD(W2, W1, W1); ADD(W2, W1, W1);
TSTI2R(W0, 0x2); TSTI2R(W0, 0x2);
CSEL(W1, W1, W2, CC_EQ); CSEL(W1, W1, W2, CC_EQ);
SUB(RCycles, RCycles, W1); ADD(RCycles, RCycles, W1);
RET(); RET();
} }
@ -229,7 +229,7 @@ void* Compiler::Gen_JumpTo7(int kind)
UBFX(W2, W3, 0, 8); UBFX(W2, W3, 0, 8);
UBFX(W3, W3, 8, 8); UBFX(W3, W3, 8, 8);
ADD(W2, W3, W2); ADD(W2, W3, W2);
SUB(RCycles, RCycles, W2); ADD(RCycles, RCycles, W2);
ANDI2R(W0, W0, ~3); ANDI2R(W0, W0, ~3);
@ -253,7 +253,7 @@ void* Compiler::Gen_JumpTo7(int kind)
UBFX(W2, W3, 16, 8); UBFX(W2, W3, 16, 8);
UBFX(W3, W3, 24, 8); UBFX(W3, W3, 24, 8);
ADD(W2, W3, W2); ADD(W2, W3, W2);
SUB(RCycles, RCycles, W2); ADD(RCycles, RCycles, W2);
ANDI2R(W0, W0, ~1); ANDI2R(W0, W0, ~1);

View File

@ -629,7 +629,7 @@ void Compiler::Comp_BranchSpecialBehaviour(bool taken)
{ {
RegCache.PrepareExit(); RegCache.PrepareExit();
SUB(RCycles, RCycles, ConstantCycles); ADD(RCycles, RCycles, ConstantCycles);
QuickTailCall(X0, ARM_Ret); QuickTailCall(X0, ARM_Ret);
} }
} }
@ -770,7 +770,7 @@ JitBlockEntry Compiler::CompileBlock(ARM* cpu, bool thumb, FetchedInstr instrs[]
RegCache.Flush(); RegCache.Flush();
SUB(RCycles, RCycles, ConstantCycles); ADD(RCycles, RCycles, ConstantCycles);
QuickTailCall(X0, ARM_Ret); QuickTailCall(X0, ARM_Ret);
FlushIcache(); FlushIcache();
@ -800,7 +800,7 @@ void Compiler::Comp_AddCycles_C(bool forceNonConstant)
if (forceNonConstant) if (forceNonConstant)
ConstantCycles += cycles; ConstantCycles += cycles;
else else
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
} }
void Compiler::Comp_AddCycles_CI(u32 numI) void Compiler::Comp_AddCycles_CI(u32 numI)
@ -814,7 +814,7 @@ void Compiler::Comp_AddCycles_CI(u32 numI)
if (Thumb || CurInstr.Cond() == 0xE) if (Thumb || CurInstr.Cond() == 0xE)
ConstantCycles += cycles; ConstantCycles += cycles;
else else
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
} }
void Compiler::Comp_AddCycles_CI(u32 c, ARM64Reg numI, ArithOption shift) void Compiler::Comp_AddCycles_CI(u32 c, ARM64Reg numI, ArithOption shift)
@ -825,11 +825,11 @@ void Compiler::Comp_AddCycles_CI(u32 c, ARM64Reg numI, ArithOption shift)
NDS::ARM7MemTimings[CurInstr.CodeCycles][Thumb ? 0 : 2] NDS::ARM7MemTimings[CurInstr.CodeCycles][Thumb ? 0 : 2]
: ((R15 & 0x2) ? 0 : CurInstr.CodeCycles)) + c; : ((R15 & 0x2) ? 0 : CurInstr.CodeCycles)) + c;
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
if (Thumb || CurInstr.Cond() >= 0xE) if (Thumb || CurInstr.Cond() >= 0xE)
ConstantCycles += cycles; ConstantCycles += cycles;
else else
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
} }
void Compiler::Comp_AddCycles_CDI() void Compiler::Comp_AddCycles_CDI()
@ -866,7 +866,7 @@ void Compiler::Comp_AddCycles_CDI()
} }
if (!Thumb && CurInstr.Cond() < 0xE) if (!Thumb && CurInstr.Cond() < 0xE)
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
else else
ConstantCycles += cycles; ConstantCycles += cycles;
} }
@ -910,7 +910,7 @@ void Compiler::Comp_AddCycles_CD()
} }
if ((!Thumb && CurInstr.Cond() < 0xE) && IrregularCycles) if ((!Thumb && CurInstr.Cond() < 0xE) && IrregularCycles)
SUB(RCycles, RCycles, cycles); ADD(RCycles, RCycles, cycles);
else else
ConstantCycles += cycles; ConstantCycles += cycles;
} }

View File

@ -127,7 +127,7 @@ void Compiler::Comp_JumpTo(u32 addr, bool forceNonConstantCycles)
if ((Thumb || CurInstr.Cond() >= 0xE) && !forceNonConstantCycles) if ((Thumb || CurInstr.Cond() >= 0xE) && !forceNonConstantCycles)
ConstantCycles += cycles; ConstantCycles += cycles;
else else
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles));
} }
void Compiler::Comp_JumpTo(Gen::X64Reg addr, bool restoreCPSR) void Compiler::Comp_JumpTo(Gen::X64Reg addr, bool restoreCPSR)

View File

@ -627,7 +627,7 @@ void Compiler::Comp_SpecialBranchBehaviour(bool taken)
{ {
RegCache.PrepareExit(); RegCache.PrepareExit();
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm32(ConstantCycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm32(ConstantCycles));
JMP((u8*)&ARM_Ret, true); JMP((u8*)&ARM_Ret, true);
} }
} }
@ -760,7 +760,7 @@ JitBlockEntry Compiler::CompileBlock(ARM* cpu, bool thumb, FetchedInstr instrs[]
RegCache.Flush(); RegCache.Flush();
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm32(ConstantCycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm32(ConstantCycles));
JMP((u8*)ARM_Ret, true); JMP((u8*)ARM_Ret, true);
/*FILE* codeout = fopen("codeout", "a"); /*FILE* codeout = fopen("codeout", "a");
@ -779,7 +779,7 @@ void Compiler::Comp_AddCycles_C(bool forceNonConstant)
: ((R15 & 0x2) ? 0 : CurInstr.CodeCycles); : ((R15 & 0x2) ? 0 : CurInstr.CodeCycles);
if ((!Thumb && CurInstr.Cond() < 0xE) || forceNonConstant) if ((!Thumb && CurInstr.Cond() < 0xE) || forceNonConstant)
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles));
else else
ConstantCycles += cycles; ConstantCycles += cycles;
} }
@ -791,7 +791,7 @@ void Compiler::Comp_AddCycles_CI(u32 i)
: ((R15 & 0x2) ? 0 : CurInstr.CodeCycles)) + i; : ((R15 & 0x2) ? 0 : CurInstr.CodeCycles)) + i;
if (!Thumb && CurInstr.Cond() < 0xE) if (!Thumb && CurInstr.Cond() < 0xE)
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles));
else else
ConstantCycles += cycles; ConstantCycles += cycles;
} }
@ -805,12 +805,12 @@ void Compiler::Comp_AddCycles_CI(Gen::X64Reg i, int add)
if (!Thumb && CurInstr.Cond() < 0xE) if (!Thumb && CurInstr.Cond() < 0xE)
{ {
LEA(32, RSCRATCH, MDisp(i, add + cycles)); LEA(32, RSCRATCH, MDisp(i, add + cycles));
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), R(RSCRATCH)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), R(RSCRATCH));
} }
else else
{ {
ConstantCycles += cycles; ConstantCycles += cycles;
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), R(i)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), R(i));
} }
} }
@ -848,7 +848,7 @@ void Compiler::Comp_AddCycles_CDI()
} }
if (!Thumb && CurInstr.Cond() < 0xE) if (!Thumb && CurInstr.Cond() < 0xE)
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles));
else else
ConstantCycles += cycles; ConstantCycles += cycles;
} }
@ -892,7 +892,7 @@ void Compiler::Comp_AddCycles_CD()
} }
if (IrregularCycles && !Thumb && CurInstr.Cond() < 0xE) if (IrregularCycles && !Thumb && CurInstr.Cond() < 0xE)
SUB(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles)); ADD(32, MDisp(RCPU, offsetof(ARM, Cycles)), Imm8(cycles));
else else
ConstantCycles += cycles; ConstantCycles += cycles;
} }