Merge pull request #12969 from mitaclaw/cached-interpreter-2.1a-profile

CachedInterpreter: Software JIT Profiling Support
This commit is contained in:
OatmealDome 2024-08-14 13:09:34 -04:00 committed by GitHub
commit a345cb0131
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 54 additions and 9 deletions

View File

@ -89,12 +89,23 @@ void CachedInterpreter::SingleStep()
ExecuteOneBlock();
}
s32 CachedInterpreter::EndBlock(PowerPC::PowerPCState& ppc_state, const EndBlockOperands& operands)
s32 CachedInterpreter::StartProfiledBlock(PowerPC::PowerPCState& ppc_state,
const StartProfiledBlockOperands& operands)
{
JitBlock::ProfileData::BeginProfiling(operands.profile_data);
return sizeof(AnyCallback) + sizeof(operands);
}
template <bool profiled>
s32 CachedInterpreter::EndBlock(PowerPC::PowerPCState& ppc_state,
const EndBlockOperands<profiled>& operands)
{
const auto& [downcount, num_load_stores, num_fp_inst] = operands;
ppc_state.pc = ppc_state.npc;
ppc_state.downcount -= downcount;
PowerPC::UpdatePerformanceMonitor(downcount, num_load_stores, num_fp_inst, ppc_state);
ppc_state.downcount -= operands.downcount;
PowerPC::UpdatePerformanceMonitor(operands.downcount, operands.num_load_stores,
operands.num_fp_inst, ppc_state);
if constexpr (profiled)
JitBlock::ProfileData::EndProfiling(operands.profile_data, operands.downcount);
return 0;
}
@ -200,10 +211,23 @@ bool CachedInterpreter::HandleFunctionHooking(u32 address)
return false;
js.downcountAmount += js.st.numCycles;
Write(EndBlock, {js.downcountAmount, js.numLoadStoreInst, js.numFloatingPointInst});
WriteEndBlock();
return true;
}
void CachedInterpreter::WriteEndBlock()
{
if (IsProfilingEnabled())
{
Write(EndBlock<true>, {{js.downcountAmount, js.numLoadStoreInst, js.numFloatingPointInst},
js.curBlock->profile_data.get()});
}
else
{
Write(EndBlock<false>, {js.downcountAmount, js.numLoadStoreInst, js.numFloatingPointInst});
}
}
bool CachedInterpreter::SetEmitterStateToFreeCodeRegion()
{
const auto free = m_free_ranges.by_size_begin();
@ -306,6 +330,9 @@ bool CachedInterpreter::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
auto& cpu = m_system.GetCPU();
auto& breakpoints = power_pc.GetBreakPoints();
if (IsProfilingEnabled())
Write(StartProfiledBlock, {js.curBlock->profile_data.get()});
for (u32 i = 0; i < code_block.m_num_instructions; i++)
{
PPCAnalyst::CodeOp& op = m_code_buffer[i];
@ -357,13 +384,13 @@ bool CachedInterpreter::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
if (op.branchIsIdleLoop)
Write(CheckIdle, {m_system.GetCoreTiming(), js.blockStart});
if (op.canEndBlock)
Write(EndBlock, {js.downcountAmount, js.numLoadStoreInst, js.numFloatingPointInst});
WriteEndBlock();
}
}
if (code_block.m_broken)
{
Write(WriteBrokenBlockNPC, {nextPC});
Write(EndBlock, {js.downcountAmount, js.numLoadStoreInst, js.numFloatingPointInst});
WriteEndBlock();
}
if (HasWriteFailed())

View File

@ -54,6 +54,7 @@ private:
void ExecuteOneBlock();
bool HandleFunctionHooking(u32 address);
void WriteEndBlock();
// Finds a free memory region and sets the code emitter to point at that region.
// Returns false if no free memory region can be found.
@ -62,6 +63,8 @@ private:
void FreeRanges();
void ResetFreeMemoryRanges();
struct StartProfiledBlockOperands;
template <bool profiled>
struct EndBlockOperands;
struct InterpretOperands;
struct InterpretAndCheckExceptionsOperands;
@ -70,7 +73,10 @@ private:
struct CheckHaltOperands;
struct CheckIdleOperands;
static s32 EndBlock(PowerPC::PowerPCState& ppc_state, const EndBlockOperands& operands);
static s32 StartProfiledBlock(PowerPC::PowerPCState& ppc_state,
const StartProfiledBlockOperands& profile_data);
template <bool profiled>
static s32 EndBlock(PowerPC::PowerPCState& ppc_state, const EndBlockOperands<profiled>& operands);
template <bool write_pc>
static s32 Interpret(PowerPC::PowerPCState& ppc_state, const InterpretOperands& operands);
template <bool write_pc>
@ -87,7 +93,13 @@ private:
CachedInterpreterBlockCache m_block_cache;
};
struct CachedInterpreter::EndBlockOperands
struct CachedInterpreter::StartProfiledBlockOperands
{
JitBlock::ProfileData* profile_data;
};
template <>
struct CachedInterpreter::EndBlockOperands<false>
{
u32 downcount;
u32 num_load_stores;
@ -95,6 +107,12 @@ struct CachedInterpreter::EndBlockOperands
u32 : 32;
};
template <>
struct CachedInterpreter::EndBlockOperands<true> : CachedInterpreter::EndBlockOperands<false>
{
JitBlock::ProfileData* profile_data;
};
struct CachedInterpreter::InterpretOperands
{
Interpreter& interpreter;