2019-06-21 23:28:32 +00:00
|
|
|
#include "ARMJIT.h"
|
|
|
|
|
2019-06-25 15:09:27 +00:00
|
|
|
#include <string.h>
|
2019-10-02 23:10:59 +00:00
|
|
|
#include <assert.h>
|
2020-04-25 11:40:51 +00:00
|
|
|
#include <unordered_map>
|
|
|
|
|
|
|
|
#define XXH_STATIC_LINKING_ONLY
|
|
|
|
#include "xxhash/xxhash.h"
|
2019-06-25 15:09:27 +00:00
|
|
|
|
2019-07-14 02:33:36 +00:00
|
|
|
#include "Config.h"
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
#include "ARMJIT_Internal.h"
|
2020-02-04 17:29:52 +00:00
|
|
|
#if defined(__x86_64__)
|
2019-06-21 23:28:32 +00:00
|
|
|
#include "ARMJIT_x64/ARMJIT_Compiler.h"
|
2020-02-04 17:50:16 +00:00
|
|
|
#elif defined(__aarch64__)
|
2020-02-04 17:29:52 +00:00
|
|
|
#include "ARMJIT_A64/ARMJIT_Compiler.h"
|
2020-02-04 17:50:16 +00:00
|
|
|
#else
|
|
|
|
#error "The current target platform doesn't have a JIT backend"
|
2020-02-04 17:29:52 +00:00
|
|
|
#endif
|
2019-06-21 23:28:32 +00:00
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
#include "ARMInterpreter_ALU.h"
|
|
|
|
#include "ARMInterpreter_LoadStore.h"
|
|
|
|
#include "ARMInterpreter_Branch.h"
|
|
|
|
#include "ARMInterpreter.h"
|
|
|
|
|
|
|
|
#include "GPU3D.h"
|
|
|
|
#include "SPU.h"
|
|
|
|
#include "Wifi.h"
|
2019-10-18 11:29:17 +00:00
|
|
|
#include "NDSCart.h"
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2019-06-21 23:28:32 +00:00
|
|
|
namespace ARMJIT
|
|
|
|
{
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
#define JIT_DEBUGPRINT(msg, ...)
|
2019-10-18 11:29:17 +00:00
|
|
|
//#define JIT_DEBUGPRINT(msg, ...) printf(msg, ## __VA_ARGS__)
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2019-06-21 23:28:32 +00:00
|
|
|
Compiler* compiler;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
const u32 ExeMemRegionSizes[] = {
|
|
|
|
0x8000, // Unmapped Region (dummy)
|
|
|
|
0x8000, // ITCM
|
|
|
|
4*1024*1024, // Main RAM
|
|
|
|
0x8000, // SWRAM
|
|
|
|
0xA4000, // LCDC
|
|
|
|
0x8000, // ARM9 BIOS
|
|
|
|
0x4000, // ARM7 BIOS
|
|
|
|
0x10000, // ARM7 WRAM
|
|
|
|
0x40000 // ARM7 WVRAM
|
|
|
|
};
|
2019-06-21 23:28:32 +00:00
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
const u32 ExeMemRegionOffsets[] = {
|
|
|
|
0,
|
|
|
|
0x8000,
|
|
|
|
0x10000,
|
|
|
|
0x410000,
|
|
|
|
0x418000,
|
|
|
|
0x4BC000,
|
|
|
|
0x4C4000,
|
|
|
|
0x4C8000,
|
|
|
|
0x4D8000,
|
|
|
|
0x518000,
|
2019-06-21 23:28:32 +00:00
|
|
|
};
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
#define DUP2(x) x, x
|
|
|
|
|
|
|
|
const static ExeMemKind JIT_MEM[2][32] = {
|
2019-06-21 23:28:32 +00:00
|
|
|
//arm9
|
|
|
|
{
|
2019-10-02 23:10:59 +00:00
|
|
|
/* 0X*/ DUP2(exeMem_ITCM),
|
|
|
|
/* 1X*/ DUP2(exeMem_ITCM), // mirror
|
|
|
|
/* 2X*/ DUP2(exeMem_MainRAM),
|
|
|
|
/* 3X*/ DUP2(exeMem_SWRAM),
|
|
|
|
/* 4X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 5X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 6X*/ exeMem_Unmapped,
|
|
|
|
exeMem_LCDC, // Plain ARM9-CPU Access (LCDC mode) (max 656KB)
|
|
|
|
/* 7X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 8X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 9X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* AX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* BX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* CX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* DX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* EX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* FX*/ DUP2(exeMem_ARM9_BIOS)
|
2019-06-21 23:28:32 +00:00
|
|
|
},
|
|
|
|
//arm7
|
|
|
|
{
|
2019-10-02 23:10:59 +00:00
|
|
|
/* 0X*/ DUP2(exeMem_ARM7_BIOS),
|
|
|
|
/* 1X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 2X*/ DUP2(exeMem_MainRAM),
|
|
|
|
/* 3X*/ exeMem_SWRAM,
|
|
|
|
exeMem_ARM7_WRAM,
|
|
|
|
/* 4X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 5X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 6X*/ DUP2(exeMem_ARM7_WVRAM), /* contrary to Gbatek, melonDS and itself,
|
|
|
|
DeSmuME doesn't mirror the 64 MB region at 0x6800000 */
|
|
|
|
/* 7X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 8X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* 9X*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* AX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* BX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* CX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* DX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* EX*/ DUP2(exeMem_Unmapped),
|
|
|
|
/* FX*/ DUP2(exeMem_Unmapped)
|
2019-06-21 23:28:32 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
#undef DUP2
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
/*
|
|
|
|
translates address to pseudo physical address
|
|
|
|
- more compact, eliminates mirroring, everything comes in a row
|
|
|
|
- we only need one translation table
|
|
|
|
*/
|
|
|
|
u32 AddrTranslate9[0x2000];
|
|
|
|
u32 AddrTranslate7[0x4000];
|
2019-06-21 23:28:32 +00:00
|
|
|
|
2019-10-16 21:39:12 +00:00
|
|
|
AddressRange CodeRanges[ExeMemSpaceSize / 512];
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
std::unordered_map<u32, JitBlock*> JitBlocks;
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
template <typename K, typename V, int Size, V InvalidValue>
|
|
|
|
struct UnreliableHashTable
|
2019-06-21 23:28:32 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
struct Bucket
|
|
|
|
{
|
|
|
|
K KeyA, KeyB;
|
|
|
|
V ValA, ValB;
|
|
|
|
};
|
|
|
|
|
|
|
|
Bucket Table[Size];
|
|
|
|
|
|
|
|
void Reset()
|
|
|
|
{
|
|
|
|
for (int i = 0; i < Size; i++)
|
|
|
|
{
|
|
|
|
Table[i].ValA = Table[i].ValB = InvalidValue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
UnreliableHashTable()
|
|
|
|
{
|
|
|
|
Reset();
|
|
|
|
}
|
|
|
|
|
|
|
|
V Insert(K key, V value)
|
|
|
|
{
|
|
|
|
u32 slot = XXH3_64bits(&key, sizeof(K)) & (Size - 1);
|
|
|
|
Bucket* bucket = &Table[slot];
|
|
|
|
|
|
|
|
if (bucket->ValA == value || bucket->ValB == value)
|
|
|
|
{
|
|
|
|
return InvalidValue;
|
|
|
|
}
|
|
|
|
else if (bucket->ValA == InvalidValue)
|
|
|
|
{
|
|
|
|
bucket->KeyA = key;
|
|
|
|
bucket->ValA = value;
|
|
|
|
}
|
|
|
|
else if (bucket->ValB == InvalidValue)
|
|
|
|
{
|
|
|
|
bucket->KeyB = key;
|
|
|
|
bucket->ValB = value;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
V prevVal = bucket->ValB;
|
|
|
|
bucket->KeyB = bucket->KeyA;
|
|
|
|
bucket->ValB = bucket->ValA;
|
|
|
|
bucket->KeyA = key;
|
|
|
|
bucket->ValA = value;
|
|
|
|
return prevVal;
|
|
|
|
}
|
|
|
|
|
|
|
|
return InvalidValue;
|
|
|
|
}
|
|
|
|
|
|
|
|
void Remove(K key)
|
|
|
|
{
|
|
|
|
u32 slot = XXH3_64bits(&key, sizeof(K)) & (Size - 1);
|
|
|
|
Bucket* bucket = &Table[slot];
|
|
|
|
|
|
|
|
if (bucket->KeyA == key && bucket->ValA != InvalidValue)
|
|
|
|
{
|
|
|
|
bucket->ValA = InvalidValue;
|
|
|
|
if (bucket->ValB != InvalidValue)
|
|
|
|
{
|
|
|
|
bucket->KeyA = bucket->KeyB;
|
|
|
|
bucket->ValA = bucket->ValB;
|
|
|
|
bucket->ValB = InvalidValue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (bucket->KeyB == key && bucket->ValB != InvalidValue)
|
|
|
|
bucket->ValB = InvalidValue;
|
|
|
|
}
|
|
|
|
|
|
|
|
V LookUp(K addr)
|
|
|
|
{
|
|
|
|
u32 slot = XXH3_64bits(&addr, 4) & (Size - 1);
|
|
|
|
Bucket* bucket = &Table[slot];
|
|
|
|
|
|
|
|
if (bucket->ValA != InvalidValue && bucket->KeyA == addr)
|
|
|
|
return bucket->ValA;
|
|
|
|
if (bucket->ValB != InvalidValue && bucket->KeyB == addr)
|
|
|
|
return bucket->ValB;
|
|
|
|
|
|
|
|
return InvalidValue;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
UnreliableHashTable<u32, JitBlock*, 0x800, nullptr> RestoreCandidates;
|
|
|
|
UnreliableHashTable<u32, u32, 0x1000, UINT32_MAX> FastBlockLookUp;
|
2019-06-21 23:28:32 +00:00
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
void Init()
|
|
|
|
{
|
2019-07-21 11:36:48 +00:00
|
|
|
for (int i = 0; i < 0x2000; i++)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
|
|
|
ExeMemKind kind = JIT_MEM[0][i >> 8];
|
|
|
|
u32 size = ExeMemRegionSizes[kind];
|
|
|
|
|
|
|
|
AddrTranslate9[i] = ExeMemRegionOffsets[kind] + ((i << 15) & (size - 1));
|
|
|
|
}
|
2019-07-21 11:36:48 +00:00
|
|
|
for (int i = 0; i < 0x4000; i++)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
|
|
|
ExeMemKind kind = JIT_MEM[1][i >> 9];
|
|
|
|
u32 size = ExeMemRegionSizes[kind];
|
|
|
|
|
|
|
|
AddrTranslate7[i] = ExeMemRegionOffsets[kind] + ((i << 14) & (size - 1));
|
|
|
|
}
|
2019-06-21 23:28:32 +00:00
|
|
|
|
|
|
|
compiler = new Compiler();
|
|
|
|
}
|
|
|
|
|
|
|
|
void DeInit()
|
|
|
|
{
|
|
|
|
delete compiler;
|
|
|
|
}
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
void FloodFillSetFlags(FetchedInstr instrs[], int start, u8 flags)
|
2019-08-25 10:28:48 +00:00
|
|
|
{
|
|
|
|
for (int j = start; j >= 0; j--)
|
|
|
|
{
|
|
|
|
u8 match = instrs[j].Info.WriteFlags & flags;
|
|
|
|
u8 matchMaybe = (instrs[j].Info.WriteFlags >> 4) & flags;
|
|
|
|
if (matchMaybe) // writes flags maybe
|
|
|
|
instrs[j].SetFlags |= matchMaybe;
|
|
|
|
if (match)
|
|
|
|
{
|
|
|
|
instrs[j].SetFlags |= match;
|
|
|
|
flags &= ~match;
|
|
|
|
if (!flags)
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-11-03 14:33:20 +00:00
|
|
|
bool DecodeLiteral(const FetchedInstr& instr, u32& addr)
|
|
|
|
{
|
|
|
|
switch (instr.Info.Kind)
|
|
|
|
{
|
|
|
|
case ARMInstrInfo::ak_STR_IMM:
|
|
|
|
case ARMInstrInfo::ak_STRB_IMM:
|
|
|
|
addr = (instr.Addr + 8) + ((instr.Instr & 0xFFF) * (instr.Instr & (1 << 23) ? 1 : -1));
|
|
|
|
return true;
|
|
|
|
case ARMInstrInfo::ak_STRD_IMM:
|
|
|
|
case ARMInstrInfo::ak_STRH_IMM:
|
|
|
|
addr = (instr.Addr + 8) + (((instr.Instr & 0xF00) >> 4 | (instr.Instr & 0xF)) * (instr.Instr & (1 << 23) ? 1 : -1));
|
|
|
|
return true;
|
|
|
|
case ARMInstrInfo::ak_STM: // I honestly hope noone was ever crazy enough to do stm pc, {whatever}
|
|
|
|
addr = instr.Addr + 8;
|
|
|
|
return true;
|
|
|
|
default:
|
|
|
|
JIT_DEBUGPRINT("Literal %08x %x not recognised\n", instr.Instr, instr.Addr);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-10-18 11:29:17 +00:00
|
|
|
bool DecodeBranch(bool thumb, const FetchedInstr& instr, u32& cond, bool hasLink, u32 lr, bool& link,
|
|
|
|
u32& linkAddr, u32& targetAddr)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
|
|
|
if (thumb)
|
|
|
|
{
|
|
|
|
u32 r15 = instr.Addr + 4;
|
|
|
|
cond = 0xE;
|
|
|
|
|
2019-10-18 11:29:17 +00:00
|
|
|
link = instr.Info.Kind == ARMInstrInfo::tk_BL_LONG;
|
|
|
|
linkAddr = instr.Addr + 4;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
if (instr.Info.Kind == ARMInstrInfo::tk_BL_LONG && !(instr.Instr & (1 << 12)))
|
|
|
|
{
|
|
|
|
targetAddr = r15 + ((s32)((instr.Instr & 0x7FF) << 21) >> 9);
|
|
|
|
targetAddr += ((instr.Instr >> 16) & 0x7FF) << 1;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (instr.Info.Kind == ARMInstrInfo::tk_B)
|
|
|
|
{
|
|
|
|
s32 offset = (s32)((instr.Instr & 0x7FF) << 21) >> 20;
|
|
|
|
targetAddr = r15 + offset;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (instr.Info.Kind == ARMInstrInfo::tk_BCOND)
|
|
|
|
{
|
|
|
|
cond = (instr.Instr >> 8) & 0xF;
|
|
|
|
s32 offset = (s32)(instr.Instr << 24) >> 23;
|
|
|
|
targetAddr = r15 + offset;
|
|
|
|
return true;
|
|
|
|
}
|
2019-10-18 11:29:17 +00:00
|
|
|
else if (hasLink && instr.Info.Kind == ARMInstrInfo::tk_BX && instr.A_Reg(3) == 14)
|
|
|
|
{
|
|
|
|
JIT_DEBUGPRINT("returning!\n");
|
|
|
|
targetAddr = lr;
|
|
|
|
return true;
|
|
|
|
}
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2019-10-18 11:29:17 +00:00
|
|
|
link = instr.Info.Kind == ARMInstrInfo::ak_BL;
|
|
|
|
linkAddr = instr.Addr + 4;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
cond = instr.Cond();
|
|
|
|
if (instr.Info.Kind == ARMInstrInfo::ak_BL
|
|
|
|
|| instr.Info.Kind == ARMInstrInfo::ak_B)
|
|
|
|
{
|
|
|
|
s32 offset = (s32)(instr.Instr << 8) >> 6;
|
|
|
|
u32 r15 = instr.Addr + 8;
|
|
|
|
targetAddr = r15 + offset;
|
|
|
|
return true;
|
|
|
|
}
|
2019-10-18 11:29:17 +00:00
|
|
|
else if (hasLink && instr.Info.Kind == ARMInstrInfo::ak_BX && instr.A_Reg(0) == 14)
|
|
|
|
{
|
|
|
|
JIT_DEBUGPRINT("returning!\n");
|
|
|
|
targetAddr = lr;
|
|
|
|
return true;
|
|
|
|
}
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool IsIdleLoop(FetchedInstr* instrs, int instrsCount)
|
|
|
|
{
|
|
|
|
// see https://github.com/dolphin-emu/dolphin/blob/master/Source/Core/Core/PowerPC/PPCAnalyst.cpp#L678
|
|
|
|
// it basically checks if one iteration of a loop depends on another
|
|
|
|
// the rules are quite simple
|
|
|
|
|
|
|
|
u16 regsWrittenTo = 0;
|
|
|
|
u16 regsDisallowedToWrite = 0;
|
|
|
|
for (int i = 0; i < instrsCount; i++)
|
|
|
|
{
|
|
|
|
//printf("instr %d %x regs(%x %x) %x %x\n", i, instrs[i].Instr, instrs[i].Info.DstRegs, instrs[i].Info.SrcRegs, regsWrittenTo, regsDisallowedToWrite);
|
|
|
|
if (instrs[i].Info.SpecialKind == ARMInstrInfo::special_WriteMem)
|
|
|
|
return false;
|
|
|
|
if (i < instrsCount - 1 && instrs[i].Info.Branches())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
u16 srcRegs = instrs[i].Info.SrcRegs & ~(1 << 15);
|
|
|
|
u16 dstRegs = instrs[i].Info.DstRegs & ~(1 << 15);
|
|
|
|
|
|
|
|
regsDisallowedToWrite |= srcRegs & ~regsWrittenTo;
|
|
|
|
|
|
|
|
if (dstRegs & regsDisallowedToWrite)
|
|
|
|
return false;
|
|
|
|
regsWrittenTo |= dstRegs;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
typedef void (*InterpreterFunc)(ARM* cpu);
|
|
|
|
|
2020-02-04 16:28:51 +00:00
|
|
|
void NOP(ARM* cpu) {}
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
#define F(x) &ARMInterpreter::A_##x
|
|
|
|
#define F_ALU(name, s) \
|
|
|
|
F(name##_REG_LSL_IMM##s), F(name##_REG_LSR_IMM##s), F(name##_REG_ASR_IMM##s), F(name##_REG_ROR_IMM##s), \
|
|
|
|
F(name##_REG_LSL_REG##s), F(name##_REG_LSR_REG##s), F(name##_REG_ASR_REG##s), F(name##_REG_ROR_REG##s), F(name##_IMM##s)
|
|
|
|
#define F_MEM_WB(name) \
|
|
|
|
F(name##_REG_LSL), F(name##_REG_LSR), F(name##_REG_ASR), F(name##_REG_ROR), F(name##_IMM), \
|
|
|
|
F(name##_POST_REG_LSL), F(name##_POST_REG_LSR), F(name##_POST_REG_ASR), F(name##_POST_REG_ROR), F(name##_POST_IMM)
|
|
|
|
#define F_MEM_HD(name) \
|
|
|
|
F(name##_REG), F(name##_IMM), F(name##_POST_REG), F(name##_POST_IMM)
|
|
|
|
InterpreterFunc InterpretARM[ARMInstrInfo::ak_Count] =
|
|
|
|
{
|
|
|
|
F_ALU(AND,), F_ALU(AND,_S),
|
|
|
|
F_ALU(EOR,), F_ALU(EOR,_S),
|
|
|
|
F_ALU(SUB,), F_ALU(SUB,_S),
|
|
|
|
F_ALU(RSB,), F_ALU(RSB,_S),
|
|
|
|
F_ALU(ADD,), F_ALU(ADD,_S),
|
|
|
|
F_ALU(ADC,), F_ALU(ADC,_S),
|
|
|
|
F_ALU(SBC,), F_ALU(SBC,_S),
|
|
|
|
F_ALU(RSC,), F_ALU(RSC,_S),
|
|
|
|
F_ALU(ORR,), F_ALU(ORR,_S),
|
|
|
|
F_ALU(MOV,), F_ALU(MOV,_S),
|
|
|
|
F_ALU(BIC,), F_ALU(BIC,_S),
|
|
|
|
F_ALU(MVN,), F_ALU(MVN,_S),
|
|
|
|
F_ALU(TST,),
|
|
|
|
F_ALU(TEQ,),
|
|
|
|
F_ALU(CMP,),
|
|
|
|
F_ALU(CMN,),
|
|
|
|
|
|
|
|
F(MUL), F(MLA), F(UMULL), F(UMLAL), F(SMULL), F(SMLAL), F(SMLAxy), F(SMLAWy), F(SMULWy), F(SMLALxy), F(SMULxy),
|
|
|
|
F(CLZ), F(QADD), F(QDADD), F(QSUB), F(QDSUB),
|
|
|
|
|
|
|
|
F_MEM_WB(STR),
|
|
|
|
F_MEM_WB(STRB),
|
|
|
|
F_MEM_WB(LDR),
|
|
|
|
F_MEM_WB(LDRB),
|
|
|
|
|
|
|
|
F_MEM_HD(STRH),
|
|
|
|
F_MEM_HD(LDRD),
|
|
|
|
F_MEM_HD(STRD),
|
|
|
|
F_MEM_HD(LDRH),
|
|
|
|
F_MEM_HD(LDRSB),
|
|
|
|
F_MEM_HD(LDRSH),
|
|
|
|
|
|
|
|
F(SWP), F(SWPB),
|
|
|
|
F(LDM), F(STM),
|
|
|
|
|
|
|
|
F(B), F(BL), F(BLX_IMM), F(BX), F(BLX_REG),
|
2020-02-04 16:28:51 +00:00
|
|
|
F(UNK), F(MSR_IMM), F(MSR_REG), F(MRS), F(MCR), F(MRC), F(SVC),
|
|
|
|
NOP
|
2019-10-02 23:10:59 +00:00
|
|
|
};
|
|
|
|
#undef F_ALU
|
|
|
|
#undef F_MEM_WB
|
|
|
|
#undef F_MEM_HD
|
|
|
|
#undef F
|
|
|
|
|
2019-10-16 21:39:12 +00:00
|
|
|
void T_BL_LONG(ARM* cpu)
|
|
|
|
{
|
|
|
|
ARMInterpreter::T_BL_LONG_1(cpu);
|
|
|
|
cpu->R[15] += 2;
|
|
|
|
ARMInterpreter::T_BL_LONG_2(cpu);
|
|
|
|
}
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
#define F(x) ARMInterpreter::T_##x
|
|
|
|
InterpreterFunc InterpretTHUMB[ARMInstrInfo::tk_Count] =
|
|
|
|
{
|
|
|
|
F(LSL_IMM), F(LSR_IMM), F(ASR_IMM),
|
|
|
|
F(ADD_REG_), F(SUB_REG_), F(ADD_IMM_), F(SUB_IMM_),
|
|
|
|
F(MOV_IMM), F(CMP_IMM), F(ADD_IMM), F(SUB_IMM),
|
|
|
|
F(AND_REG), F(EOR_REG), F(LSL_REG), F(LSR_REG), F(ASR_REG),
|
|
|
|
F(ADC_REG), F(SBC_REG), F(ROR_REG), F(TST_REG), F(NEG_REG),
|
|
|
|
F(CMP_REG), F(CMN_REG), F(ORR_REG), F(MUL_REG), F(BIC_REG), F(MVN_REG),
|
|
|
|
F(ADD_HIREG), F(CMP_HIREG), F(MOV_HIREG),
|
|
|
|
F(ADD_PCREL), F(ADD_SPREL), F(ADD_SP),
|
|
|
|
F(LDR_PCREL), F(STR_REG), F(STRB_REG), F(LDR_REG), F(LDRB_REG), F(STRH_REG),
|
|
|
|
F(LDRSB_REG), F(LDRH_REG), F(LDRSH_REG), F(STR_IMM), F(LDR_IMM), F(STRB_IMM),
|
|
|
|
F(LDRB_IMM), F(STRH_IMM), F(LDRH_IMM), F(STR_SPREL), F(LDR_SPREL),
|
|
|
|
F(PUSH), F(POP), F(LDMIA), F(STMIA),
|
|
|
|
F(BCOND), F(BX), F(BLX_REG), F(B), F(BL_LONG_1), F(BL_LONG_2),
|
|
|
|
F(UNK), F(SVC),
|
2019-10-16 21:39:12 +00:00
|
|
|
T_BL_LONG // BL_LONG psudo opcode
|
2019-10-02 23:10:59 +00:00
|
|
|
};
|
|
|
|
#undef F
|
|
|
|
|
|
|
|
void CompileBlock(ARM* cpu)
|
2019-06-21 23:28:32 +00:00
|
|
|
{
|
|
|
|
bool thumb = cpu->CPSR & 0x20;
|
|
|
|
|
2019-07-14 02:33:36 +00:00
|
|
|
if (Config::JIT_MaxBlockSize < 1)
|
|
|
|
Config::JIT_MaxBlockSize = 1;
|
|
|
|
if (Config::JIT_MaxBlockSize > 32)
|
|
|
|
Config::JIT_MaxBlockSize = 32;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
u32 blockAddr = cpu->R[15] - (thumb ? 2 : 4);
|
|
|
|
if (!(cpu->Num == 0
|
|
|
|
? IsMapped<0>(blockAddr)
|
|
|
|
: IsMapped<1>(blockAddr)))
|
|
|
|
{
|
|
|
|
printf("Trying to compile a block in unmapped memory: %x\n", blockAddr);
|
|
|
|
}
|
|
|
|
|
|
|
|
u32 pseudoPhysicalAddr = cpu->Num == 0
|
|
|
|
? TranslateAddr<0>(blockAddr)
|
|
|
|
: TranslateAddr<1>(blockAddr);
|
|
|
|
|
2019-07-14 02:33:36 +00:00
|
|
|
FetchedInstr instrs[Config::JIT_MaxBlockSize];
|
2019-06-21 23:28:32 +00:00
|
|
|
int i = 0;
|
|
|
|
u32 r15 = cpu->R[15];
|
2019-10-02 23:10:59 +00:00
|
|
|
|
|
|
|
u32 addresseRanges[32] = {};
|
|
|
|
u32 numAddressRanges = 0;
|
|
|
|
|
2019-08-17 14:50:48 +00:00
|
|
|
cpu->FillPipeline();
|
2019-06-21 23:28:32 +00:00
|
|
|
u32 nextInstr[2] = {cpu->NextInstr[0], cpu->NextInstr[1]};
|
2019-09-08 12:48:20 +00:00
|
|
|
u32 nextInstrAddr[2] = {blockAddr, r15};
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JIT_DEBUGPRINT("start block %x %08x (%x) (region invalidates %dx)\n",
|
|
|
|
blockAddr, cpu->CPSR, pseudoPhysicalAddr,
|
2019-10-16 21:39:12 +00:00
|
|
|
CodeRanges[pseudoPhysicalAddr / 512].TimesInvalidated);
|
2019-10-02 23:10:59 +00:00
|
|
|
|
|
|
|
u32 lastSegmentStart = blockAddr;
|
2019-10-18 11:29:17 +00:00
|
|
|
u32 lr;
|
|
|
|
bool hasLink = false;
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2019-06-21 23:28:32 +00:00
|
|
|
do
|
|
|
|
{
|
|
|
|
r15 += thumb ? 2 : 4;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
instrs[i].BranchFlags = 0;
|
2019-08-25 11:06:27 +00:00
|
|
|
instrs[i].SetFlags = 0;
|
2019-06-21 23:28:32 +00:00
|
|
|
instrs[i].Instr = nextInstr[0];
|
2019-10-16 21:39:12 +00:00
|
|
|
nextInstr[0] = nextInstr[1];
|
2019-09-08 12:48:20 +00:00
|
|
|
|
|
|
|
instrs[i].Addr = nextInstrAddr[0];
|
|
|
|
nextInstrAddr[0] = nextInstrAddr[1];
|
|
|
|
nextInstrAddr[1] = r15;
|
2019-10-02 23:10:59 +00:00
|
|
|
JIT_DEBUGPRINT("instr %08x %x\n", instrs[i].Instr & (thumb ? 0xFFFF : ~0), instrs[i].Addr);
|
|
|
|
|
|
|
|
u32 translatedAddr = (cpu->Num == 0
|
|
|
|
? TranslateAddr<0>(instrs[i].Addr)
|
2019-10-16 21:39:12 +00:00
|
|
|
: TranslateAddr<1>(instrs[i].Addr)) & ~0x1FF;
|
2019-10-02 23:10:59 +00:00
|
|
|
if (i == 0 || translatedAddr != addresseRanges[numAddressRanges - 1])
|
|
|
|
{
|
|
|
|
bool returning = false;
|
|
|
|
for (int j = 0; j < numAddressRanges; j++)
|
|
|
|
{
|
|
|
|
if (addresseRanges[j] == translatedAddr)
|
|
|
|
{
|
|
|
|
returning = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (!returning)
|
|
|
|
addresseRanges[numAddressRanges++] = translatedAddr;
|
|
|
|
}
|
2019-06-21 23:28:32 +00:00
|
|
|
|
|
|
|
if (cpu->Num == 0)
|
|
|
|
{
|
|
|
|
ARMv5* cpuv5 = (ARMv5*)cpu;
|
|
|
|
if (thumb && r15 & 0x2)
|
|
|
|
{
|
|
|
|
nextInstr[1] >>= 16;
|
|
|
|
instrs[i].CodeCycles = 0;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
nextInstr[1] = cpuv5->CodeRead32(r15, false);
|
|
|
|
instrs[i].CodeCycles = cpu->CodeCycles;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
ARMv4* cpuv4 = (ARMv4*)cpu;
|
|
|
|
if (thumb)
|
|
|
|
nextInstr[1] = cpuv4->CodeRead16(r15);
|
|
|
|
else
|
|
|
|
nextInstr[1] = cpuv4->CodeRead32(r15);
|
|
|
|
instrs[i].CodeCycles = cpu->CodeCycles;
|
|
|
|
}
|
|
|
|
instrs[i].Info = ARMInstrInfo::Decode(thumb, cpu->Num, instrs[i].Instr);
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
cpu->R[15] = r15;
|
|
|
|
cpu->CurInstr = instrs[i].Instr;
|
|
|
|
cpu->CodeCycles = instrs[i].CodeCycles;
|
|
|
|
|
2019-10-18 11:29:17 +00:00
|
|
|
if (instrs[i].Info.DstRegs & (1 << 14))
|
|
|
|
hasLink = false;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
if (thumb)
|
|
|
|
{
|
|
|
|
InterpretTHUMB[instrs[i].Info.Kind](cpu);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (cpu->Num == 0 && instrs[i].Info.Kind == ARMInstrInfo::ak_BLX_IMM)
|
|
|
|
{
|
|
|
|
ARMInterpreter::A_BLX_IMM(cpu);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
u32 icode = ((instrs[i].Instr >> 4) & 0xF) | ((instrs[i].Instr >> 16) & 0xFF0);
|
2020-02-04 16:28:51 +00:00
|
|
|
assert(InterpretARM[instrs[i].Info.Kind] == ARMInterpreter::ARMInstrTable[icode]
|
|
|
|
|| instrs[i].Info.Kind == ARMInstrInfo::ak_MOV_REG_LSL_IMM
|
|
|
|
|| instrs[i].Info.Kind == ARMInstrInfo::ak_Nop);
|
2019-10-02 23:10:59 +00:00
|
|
|
if (cpu->CheckCondition(instrs[i].Cond()))
|
|
|
|
InterpretARM[instrs[i].Info.Kind](cpu);
|
|
|
|
else
|
|
|
|
cpu->AddCycles_C();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
instrs[i].DataCycles = cpu->DataCycles;
|
|
|
|
instrs[i].DataRegion = cpu->DataRegion;
|
|
|
|
|
2019-11-03 14:33:20 +00:00
|
|
|
if (instrs[i].Info.SpecialKind == ARMInstrInfo::special_WriteMem
|
|
|
|
&& instrs[i].Info.SrcRegs == (1 << 15)
|
|
|
|
&& instrs[i].Info.DstRegs == 0)
|
|
|
|
{
|
|
|
|
assert (!thumb);
|
|
|
|
|
|
|
|
u32 addr;
|
|
|
|
if (DecodeLiteral(instrs[i], addr))
|
|
|
|
{
|
|
|
|
JIT_DEBUGPRINT("pc relative write detected\n");
|
|
|
|
u32 translatedAddr = cpu->Num == 0 ? TranslateAddr<0>(addr) : TranslateAddr<1>(addr);
|
|
|
|
|
|
|
|
ARMJIT::InvalidateByAddr(translatedAddr, false);
|
|
|
|
CodeRanges[translatedAddr / 512].InvalidLiterals |= (1 << ((translatedAddr & 0x1FF) / 16));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-09-08 12:48:20 +00:00
|
|
|
if (thumb && instrs[i].Info.Kind == ARMInstrInfo::tk_BL_LONG_2 && i > 0
|
|
|
|
&& instrs[i - 1].Info.Kind == ARMInstrInfo::tk_BL_LONG_1)
|
|
|
|
{
|
|
|
|
instrs[i - 1].Info.Kind = ARMInstrInfo::tk_BL_LONG;
|
|
|
|
instrs[i - 1].Instr = (instrs[i - 1].Instr & 0xFFFF) | (instrs[i].Instr << 16);
|
|
|
|
instrs[i - 1].Info.DstRegs = 0xC000;
|
|
|
|
instrs[i - 1].Info.SrcRegs = 0;
|
|
|
|
instrs[i - 1].Info.EndBlock = true;
|
|
|
|
i--;
|
|
|
|
}
|
2019-08-25 10:28:48 +00:00
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
if (instrs[i].Info.Branches() && Config::JIT_BrancheOptimisations)
|
|
|
|
{
|
|
|
|
bool hasBranched = cpu->R[15] != r15;
|
|
|
|
|
2019-10-18 11:29:17 +00:00
|
|
|
bool link;
|
|
|
|
u32 cond, target, linkAddr;
|
|
|
|
bool staticBranch = DecodeBranch(thumb, instrs[i], cond, hasLink, lr, link, linkAddr, target);
|
2019-10-02 23:10:59 +00:00
|
|
|
JIT_DEBUGPRINT("branch cond %x target %x (%d)\n", cond, target, hasBranched);
|
|
|
|
|
|
|
|
if (staticBranch)
|
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
instrs[i].BranchFlags |= branch_StaticTarget;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
bool isBackJump = false;
|
|
|
|
if (hasBranched)
|
|
|
|
{
|
|
|
|
for (int j = 0; j < i; j++)
|
|
|
|
{
|
|
|
|
if (instrs[i].Addr == target)
|
|
|
|
{
|
|
|
|
isBackJump = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (cond < 0xE && target < instrs[i].Addr && target >= lastSegmentStart)
|
|
|
|
{
|
|
|
|
// we might have an idle loop
|
2019-10-18 11:29:17 +00:00
|
|
|
u32 backwardsOffset = (instrs[i].Addr - target) / (thumb ? 2 : 4);
|
|
|
|
if (IsIdleLoop(&instrs[i - backwardsOffset], backwardsOffset + 1))
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
|
|
|
instrs[i].BranchFlags |= branch_IdleBranch;
|
|
|
|
JIT_DEBUGPRINT("found %s idle loop %d in block %x\n", thumb ? "thumb" : "arm", cpu->Num, blockAddr);
|
|
|
|
}
|
|
|
|
}
|
2019-10-18 11:29:17 +00:00
|
|
|
else if (hasBranched && !isBackJump && i + 1 < Config::JIT_MaxBlockSize)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
|
|
|
u32 targetPseudoPhysical = cpu->Num == 0
|
|
|
|
? TranslateAddr<0>(target)
|
|
|
|
: TranslateAddr<1>(target);
|
2019-10-18 11:29:17 +00:00
|
|
|
|
|
|
|
if (link)
|
|
|
|
{
|
|
|
|
lr = linkAddr;
|
|
|
|
hasLink = true;
|
|
|
|
}
|
2019-10-02 23:10:59 +00:00
|
|
|
|
|
|
|
r15 = target + (thumb ? 2 : 4);
|
|
|
|
assert(r15 == cpu->R[15]);
|
|
|
|
|
|
|
|
JIT_DEBUGPRINT("block lengthened by static branch (target %x)\n", target);
|
|
|
|
|
|
|
|
nextInstr[0] = cpu->NextInstr[0];
|
|
|
|
nextInstr[1] = cpu->NextInstr[1];
|
|
|
|
|
|
|
|
nextInstrAddr[0] = target;
|
|
|
|
nextInstrAddr[1] = r15;
|
|
|
|
|
|
|
|
lastSegmentStart = target;
|
|
|
|
|
|
|
|
instrs[i].Info.EndBlock = false;
|
|
|
|
|
|
|
|
if (cond < 0xE)
|
|
|
|
instrs[i].BranchFlags |= branch_FollowCondTaken;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!hasBranched && cond < 0xE && i + 1 < Config::JIT_MaxBlockSize)
|
|
|
|
{
|
|
|
|
instrs[i].Info.EndBlock = false;
|
|
|
|
instrs[i].BranchFlags |= branch_FollowCondNotTaken;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
i++;
|
2019-09-08 12:48:20 +00:00
|
|
|
|
2019-08-25 10:28:48 +00:00
|
|
|
bool canCompile = compiler->CanCompile(thumb, instrs[i - 1].Info.Kind);
|
2019-10-02 23:10:59 +00:00
|
|
|
bool secondaryFlagReadCond = !canCompile || (instrs[i - 1].BranchFlags & (branch_FollowCondTaken | branch_FollowCondNotTaken));
|
|
|
|
if (instrs[i - 1].Info.ReadFlags != 0 || secondaryFlagReadCond)
|
|
|
|
FloodFillSetFlags(instrs, i - 2, !secondaryFlagReadCond ? instrs[i - 1].Info.ReadFlags : 0xF);
|
2019-10-18 11:29:17 +00:00
|
|
|
} while(!instrs[i - 1].Info.EndBlock && i < Config::JIT_MaxBlockSize && !cpu->Halted && (!cpu->IRQ || (cpu->CPSR & 0x80)));
|
2019-06-21 23:28:32 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlock* prevBlock = RestoreCandidates.LookUp(pseudoPhysicalAddr);
|
2019-10-02 23:10:59 +00:00
|
|
|
bool mayRestore = true;
|
2020-04-25 11:40:51 +00:00
|
|
|
if (prevBlock)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
RestoreCandidates.Remove(pseudoPhysicalAddr);
|
2019-10-02 23:10:59 +00:00
|
|
|
if (prevBlock->NumInstrs == i)
|
|
|
|
{
|
|
|
|
for (int j = 0; j < i; j++)
|
|
|
|
{
|
|
|
|
if (prevBlock->Instrs()[j] != instrs[j].Instr)
|
|
|
|
{
|
|
|
|
mayRestore = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
mayRestore = false;
|
2019-08-25 10:28:48 +00:00
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
if (prevBlock->NumAddresses == numAddressRanges)
|
|
|
|
{
|
|
|
|
for (int j = 0; j < numAddressRanges; j++)
|
|
|
|
{
|
|
|
|
if (prevBlock->AddressRanges()[j] != addresseRanges[j])
|
|
|
|
{
|
|
|
|
mayRestore = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
mayRestore = false;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
mayRestore = false;
|
|
|
|
prevBlock = NULL;
|
|
|
|
}
|
2019-06-21 23:28:32 +00:00
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
JitBlock* block;
|
|
|
|
if (!mayRestore)
|
|
|
|
{
|
|
|
|
if (prevBlock)
|
|
|
|
delete prevBlock;
|
|
|
|
|
|
|
|
block = new JitBlock(i, numAddressRanges);
|
|
|
|
for (int j = 0; j < i; j++)
|
|
|
|
block->Instrs()[j] = instrs[j].Instr;
|
|
|
|
for (int j = 0; j < numAddressRanges; j++)
|
|
|
|
block->AddressRanges()[j] = addresseRanges[j];
|
|
|
|
|
|
|
|
block->StartAddr = blockAddr;
|
|
|
|
block->PseudoPhysicalAddr = pseudoPhysicalAddr;
|
|
|
|
|
|
|
|
FloodFillSetFlags(instrs, i - 1, 0xF);
|
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
block->EntryPoint = compiler->CompileBlock(pseudoPhysicalAddr, cpu, thumb, instrs, i);
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
2019-07-21 11:36:48 +00:00
|
|
|
else
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
|
|
|
JIT_DEBUGPRINT("restored! %p\n", prevBlock);
|
|
|
|
block = prevBlock;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (int j = 0; j < numAddressRanges; j++)
|
|
|
|
{
|
|
|
|
assert(addresseRanges[j] == block->AddressRanges()[j]);
|
2019-10-16 21:39:12 +00:00
|
|
|
CodeRanges[addresseRanges[j] / 512].Blocks.Add(block);
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlocks[pseudoPhysicalAddr] = block;
|
|
|
|
FastBlockLookUp.Insert(pseudoPhysicalAddr, compiler->SubEntryOffset(block->EntryPoint));
|
2019-06-21 23:28:32 +00:00
|
|
|
}
|
|
|
|
|
2019-11-03 14:33:20 +00:00
|
|
|
void InvalidateByAddr(u32 pseudoPhysical, bool mayRestore)
|
2019-06-25 15:09:27 +00:00
|
|
|
{
|
2019-10-02 23:10:59 +00:00
|
|
|
JIT_DEBUGPRINT("invalidating by addr %x\n", pseudoPhysical);
|
2019-10-16 21:39:12 +00:00
|
|
|
AddressRange* range = &CodeRanges[pseudoPhysical / 512];
|
2019-10-02 23:10:59 +00:00
|
|
|
int startLength = range->Blocks.Length;
|
|
|
|
for (int i = 0; i < range->Blocks.Length; i++)
|
|
|
|
{
|
|
|
|
assert(range->Blocks.Length == startLength);
|
|
|
|
JitBlock* block = range->Blocks[i];
|
|
|
|
for (int j = 0; j < block->NumAddresses; j++)
|
|
|
|
{
|
|
|
|
u32 addr = block->AddressRanges()[j];
|
2019-10-16 21:39:12 +00:00
|
|
|
if ((addr / 512) != (pseudoPhysical / 512))
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2019-10-16 21:39:12 +00:00
|
|
|
AddressRange* otherRange = &CodeRanges[addr / 512];
|
2019-10-02 23:10:59 +00:00
|
|
|
assert(otherRange != range);
|
2019-10-16 21:39:12 +00:00
|
|
|
bool removed = otherRange->Blocks.RemoveByValue(block);
|
|
|
|
assert(removed);
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
for (int j = 0; j < block->NumLinks(); j++)
|
|
|
|
compiler->UnlinkBlock(block->Links()[j]);
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlocks.erase(block->PseudoPhysicalAddr);
|
|
|
|
FastBlockLookUp.Remove(block->PseudoPhysicalAddr);
|
2019-08-16 21:17:08 +00:00
|
|
|
|
2019-11-03 14:33:20 +00:00
|
|
|
if (mayRestore)
|
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlock* prevBlock = RestoreCandidates.Insert(block->PseudoPhysicalAddr, block);
|
|
|
|
if (prevBlock)
|
|
|
|
delete prevBlock;
|
2019-11-03 14:33:20 +00:00
|
|
|
}
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
if ((range->TimesInvalidated + 1) > range->TimesInvalidated)
|
|
|
|
range->TimesInvalidated++;
|
|
|
|
|
|
|
|
range->Blocks.Clear();
|
|
|
|
}
|
|
|
|
|
|
|
|
void InvalidateByAddr7(u32 addr)
|
|
|
|
{
|
|
|
|
u32 pseudoPhysical = TranslateAddr<1>(addr);
|
2019-10-16 21:39:12 +00:00
|
|
|
if (__builtin_expect(CodeRanges[pseudoPhysical / 512].Blocks.Length > 0, false))
|
2019-10-02 23:10:59 +00:00
|
|
|
InvalidateByAddr(pseudoPhysical);
|
|
|
|
}
|
|
|
|
|
|
|
|
void InvalidateITCM(u32 addr)
|
|
|
|
{
|
|
|
|
u32 pseudoPhysical = addr + ExeMemRegionOffsets[exeMem_ITCM];
|
2019-10-16 21:39:12 +00:00
|
|
|
if (CodeRanges[pseudoPhysical / 512].Blocks.Length > 0)
|
2019-10-02 23:10:59 +00:00
|
|
|
InvalidateByAddr(pseudoPhysical);
|
|
|
|
}
|
|
|
|
|
|
|
|
void InvalidateAll()
|
|
|
|
{
|
|
|
|
JIT_DEBUGPRINT("invalidating all %x\n", JitBlocks.Length);
|
2020-04-25 11:40:51 +00:00
|
|
|
for (auto it : JitBlocks)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlock* block = it.second;
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
FastBlockLookUp.Remove(block->PseudoPhysicalAddr);
|
|
|
|
|
|
|
|
for (int i = 0; i < block->NumAddresses; i++)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
u32 addr = block->AddressRanges()[i];
|
2019-10-16 21:39:12 +00:00
|
|
|
AddressRange* range = &CodeRanges[addr / 512];
|
2019-10-02 23:10:59 +00:00
|
|
|
range->Blocks.Clear();
|
|
|
|
if (range->TimesInvalidated + 1 > range->TimesInvalidated)
|
|
|
|
range->TimesInvalidated++;
|
|
|
|
}
|
2020-04-25 11:40:51 +00:00
|
|
|
for (int i = 0; i < block->NumLinks(); i++)
|
|
|
|
compiler->UnlinkBlock(block->Links()[i]);
|
|
|
|
block->ResetLinks();
|
2019-10-02 23:10:59 +00:00
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlock* prevBlock = RestoreCandidates.Insert(block->PseudoPhysicalAddr, block);
|
|
|
|
if (prevBlock)
|
|
|
|
delete prevBlock;
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlocks.clear();
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ResetBlockCache()
|
|
|
|
{
|
|
|
|
printf("Resetting JIT block cache...\n");
|
2020-04-25 11:40:51 +00:00
|
|
|
|
|
|
|
FastBlockLookUp.Reset();
|
|
|
|
RestoreCandidates.Reset();
|
|
|
|
for (int i = 0; i < sizeof(RestoreCandidates.Table)/sizeof(RestoreCandidates.Table[0]); i++)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
if (RestoreCandidates.Table[i].ValA)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
delete RestoreCandidates.Table[i].ValA;
|
|
|
|
RestoreCandidates.Table[i].ValA = NULL;
|
|
|
|
}
|
|
|
|
if (RestoreCandidates.Table[i].ValA)
|
|
|
|
{
|
|
|
|
delete RestoreCandidates.Table[i].ValB;
|
|
|
|
RestoreCandidates.Table[i].ValB = NULL;
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
}
|
2020-04-25 11:40:51 +00:00
|
|
|
for (auto it : JitBlocks)
|
2019-10-02 23:10:59 +00:00
|
|
|
{
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlock* block = it.second;
|
2019-10-02 23:10:59 +00:00
|
|
|
for (int j = 0; j < block->NumAddresses; j++)
|
|
|
|
{
|
|
|
|
u32 addr = block->AddressRanges()[j];
|
2019-10-16 21:39:12 +00:00
|
|
|
CodeRanges[addr / 512].Blocks.Clear();
|
|
|
|
CodeRanges[addr / 512].TimesInvalidated = 0;
|
2019-11-03 14:33:20 +00:00
|
|
|
CodeRanges[addr / 512].InvalidLiterals = 0;
|
2019-10-02 23:10:59 +00:00
|
|
|
}
|
|
|
|
delete block;
|
|
|
|
}
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlocks.clear();
|
2019-07-14 02:33:36 +00:00
|
|
|
|
|
|
|
compiler->Reset();
|
2019-06-25 15:09:27 +00:00
|
|
|
}
|
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
JitBlockEntry LookUpBlockEntry(u32 addr)
|
|
|
|
{
|
|
|
|
u32 entryOffset = FastBlockLookUp.LookUp(addr);
|
|
|
|
if (entryOffset != UINT32_MAX)
|
|
|
|
return compiler->AddEntryOffset(entryOffset);
|
|
|
|
|
|
|
|
auto block = JitBlocks.find(addr);
|
|
|
|
if (block != JitBlocks.end())
|
|
|
|
{
|
|
|
|
FastBlockLookUp.Insert(addr, compiler->SubEntryOffset(block->second->EntryPoint));
|
|
|
|
return block->second->EntryPoint;
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <u32 Num>
|
|
|
|
void LinkBlock(ARM* cpu, u32 codeOffset)
|
|
|
|
{
|
|
|
|
u32 targetPseudoPhys = TranslateAddr<Num>(cpu->R[15] - ((cpu->CPSR&0x20)?2:4));
|
|
|
|
auto block = JitBlocks.find(targetPseudoPhys);
|
|
|
|
if (block == JitBlocks.end())
|
|
|
|
{
|
|
|
|
CompileBlock(cpu);
|
|
|
|
block = JitBlocks.find(targetPseudoPhys);
|
|
|
|
}
|
|
|
|
|
|
|
|
JIT_DEBUGPRINT("linking to block %08x\n", targetPseudoPhys);
|
|
|
|
|
|
|
|
block->second->AddLink(codeOffset);
|
|
|
|
compiler->LinkBlock(codeOffset, block->second->EntryPoint);
|
|
|
|
}
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
void* GetFuncForAddr(ARM* cpu, u32 addr, bool store, int size)
|
|
|
|
{
|
|
|
|
if (cpu->Num == 0)
|
|
|
|
{
|
|
|
|
if ((addr & 0xFF000000) == 0x04000000)
|
|
|
|
{
|
2019-10-18 11:29:17 +00:00
|
|
|
if (!store && size == 32 && addr == 0x04100010 && NDS::ExMemCnt[0] & (1<<11))
|
|
|
|
return (void*)NDSCart::ReadROMData;
|
|
|
|
|
2019-10-02 23:10:59 +00:00
|
|
|
/*
|
|
|
|
unfortunately we can't map GPU2D this way
|
|
|
|
since it's hidden inside an object
|
|
|
|
|
|
|
|
though GPU3D registers are accessed much more intensive
|
|
|
|
*/
|
|
|
|
if (addr >= 0x04000320 && addr < 0x040006A4)
|
|
|
|
{
|
|
|
|
switch (size | store)
|
|
|
|
{
|
|
|
|
case 8: return (void*)GPU3D::Read8;
|
|
|
|
case 9: return (void*)GPU3D::Write8;
|
|
|
|
case 16: return (void*)GPU3D::Read16;
|
|
|
|
case 17: return (void*)GPU3D::Write16;
|
|
|
|
case 32: return (void*)GPU3D::Read32;
|
|
|
|
case 33: return (void*)GPU3D::Write32;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (size | store)
|
|
|
|
{
|
|
|
|
case 8: return (void*)NDS::ARM9IORead8;
|
|
|
|
case 9: return (void*)NDS::ARM9IOWrite8;
|
|
|
|
case 16: return (void*)NDS::ARM9IORead16;
|
|
|
|
case 17: return (void*)NDS::ARM9IOWrite16;
|
|
|
|
case 32: return (void*)NDS::ARM9IORead32;
|
|
|
|
case 33: return (void*)NDS::ARM9IOWrite32;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
switch (addr & 0xFF800000)
|
|
|
|
{
|
|
|
|
case 0x04000000:
|
|
|
|
if (addr >= 0x04000400 && addr < 0x04000520)
|
|
|
|
{
|
|
|
|
switch (size | store)
|
|
|
|
{
|
|
|
|
case 8: return (void*)SPU::Read8;
|
|
|
|
case 9: return (void*)SPU::Write8;
|
|
|
|
case 16: return (void*)SPU::Read16;
|
|
|
|
case 17: return (void*)SPU::Write16;
|
|
|
|
case 32: return (void*)SPU::Read32;
|
|
|
|
case 33: return (void*)SPU::Write32;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (size | store)
|
|
|
|
{
|
|
|
|
case 8: return (void*)NDS::ARM7IORead8;
|
|
|
|
case 9: return (void*)NDS::ARM7IOWrite8;
|
|
|
|
case 16: return (void*)NDS::ARM7IORead16;
|
|
|
|
case 17: return (void*)NDS::ARM7IOWrite16;
|
|
|
|
case 32: return (void*)NDS::ARM7IORead32;
|
|
|
|
case 33: return (void*)NDS::ARM7IOWrite32;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case 0x04800000:
|
|
|
|
if (addr < 0x04810000 && size == 16)
|
|
|
|
{
|
|
|
|
if (store)
|
|
|
|
return (void*)Wifi::Write;
|
|
|
|
else
|
|
|
|
return (void*)Wifi::Read;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2020-04-25 11:40:51 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template void ARMJIT::LinkBlock<0>(ARM*, u32);
|
|
|
|
template void ARMJIT::LinkBlock<1>(ARM*, u32);
|