From 81e842e2aa2ae901eda8b29456cba0b63ac2619d Mon Sep 17 00:00:00 2001 From: Jordan Woyak Date: Thu, 6 Mar 2025 02:11:10 -0600 Subject: [PATCH 1/6] CoreTiming: Don't Throttle in event queue processing. --- Source/Core/Core/CoreTiming.cpp | 9 --------- Source/Core/Core/CoreTiming.h | 4 ---- 2 files changed, 13 deletions(-) diff --git a/Source/Core/Core/CoreTiming.cpp b/Source/Core/Core/CoreTiming.cpp index 931e21d396..f90c2c6f8f 100644 --- a/Source/Core/Core/CoreTiming.cpp +++ b/Source/Core/Core/CoreTiming.cpp @@ -18,7 +18,6 @@ #include "Core/AchievementManager.h" #include "Core/CPUThreadConfigCallback.h" -#include "Core/Config/AchievementSettings.h" #include "Core/Config/MainSettings.h" #include "Core/Core.h" #include "Core/PowerPC/PowerPC.h" @@ -333,8 +332,6 @@ void CoreTimingManager::Advance() Event evt = std::move(m_event_queue.front()); std::ranges::pop_heap(m_event_queue, std::ranges::greater{}); m_event_queue.pop_back(); - - Throttle(evt.time); evt.type->callback(m_system, evt.userdata, m_globals.global_timer - evt.time); } @@ -360,11 +357,6 @@ void CoreTimingManager::Throttle(const s64 target_cycle) { // Based on number of cycles and emulation speed, increase the target deadline const s64 cycles = target_cycle - m_throttle_last_cycle; - - // Prevent any throttling code if the amount of time passed is < ~0.122ms - if (cycles < m_throttle_min_clock_per_sleep) - return; - m_throttle_last_cycle = target_cycle; const double speed = Core::GetIsThrottlerTempDisabled() ? 0.0 : m_emulation_speed; @@ -442,7 +434,6 @@ void CoreTimingManager::LogPendingEvents() const void CoreTimingManager::AdjustEventQueueTimes(u32 new_ppc_clock, u32 old_ppc_clock) { m_throttle_clock_per_sec = new_ppc_clock; - m_throttle_min_clock_per_sleep = new_ppc_clock / 1200; for (Event& ev : m_event_queue) { diff --git a/Source/Core/Core/CoreTiming.h b/Source/Core/Core/CoreTiming.h index f35812ba1a..93b3c1e4f1 100644 --- a/Source/Core/Core/CoreTiming.h +++ b/Source/Core/Core/CoreTiming.h @@ -16,7 +16,6 @@ // inside callback: // ScheduleEvent(periodInCycles - cyclesLate, callback, "whatever") -#include #include #include #include @@ -156,8 +155,6 @@ public: Globals& GetGlobals() { return m_globals; } // Throttle the CPU to the specified target cycle. - // Never used outside of CoreTiming, however it remains public - // in order to allow custom throttling implementations to be tested. void Throttle(const s64 target_cycle); TimePoint GetCPUTimePoint(s64 cyclesLate) const; // Used by Dolphin Analytics @@ -203,7 +200,6 @@ private: s64 m_throttle_last_cycle = 0; TimePoint m_throttle_deadline = Clock::now(); s64 m_throttle_clock_per_sec = 0; - s64 m_throttle_min_clock_per_sleep = 0; bool m_throttle_disable_vi_int = false; DT m_max_fallback = {}; From 9675c90890291c245af9bfba61b2d45a7444d7c9 Mon Sep 17 00:00:00 2001 From: Jordan Woyak Date: Sun, 2 Mar 2025 03:19:28 -0600 Subject: [PATCH 2/6] VideoInterface: Throttle prior to SI poll. --- Source/Core/Core/HW/VideoInterface.cpp | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/Source/Core/Core/HW/VideoInterface.cpp b/Source/Core/Core/HW/VideoInterface.cpp index 2f41c1b1e5..bc679492ea 100644 --- a/Source/Core/Core/HW/VideoInterface.cpp +++ b/Source/Core/Core/HW/VideoInterface.cpp @@ -888,10 +888,13 @@ void VideoInterfaceManager::Update(u64 ticks) if (is_at_field_boundary) Core::Callback_NewField(m_system); - // If an SI poll is scheduled to happen on this half-line, do it! + auto& core_timing = m_system.GetCoreTiming(); + // If an SI poll is scheduled to happen on this half-line, do it! if (m_half_line_count == m_half_line_of_next_si_poll) { + // Throttle before SI poll so user input is taken just before needed. (lower input latency) + core_timing.Throttle(ticks); Core::UpdateInputGate(!Config::Get(Config::MAIN_INPUT_BACKGROUND_INPUT), Config::Get(Config::MAIN_LOCK_CURSOR)); auto& si = m_system.GetSerialInterface(); @@ -917,7 +920,6 @@ void VideoInterfaceManager::Update(u64 ticks) m_half_line_count = 0; } - auto& core_timing = m_system.GetCoreTiming(); if (!(m_half_line_count & 1)) { m_ticks_last_line_start = core_timing.GetTicks(); From aa624d8ba8f66e03572fbc1beac6cf67105fb5da Mon Sep 17 00:00:00 2001 From: Jordan Woyak Date: Sun, 2 Mar 2025 03:25:23 -0600 Subject: [PATCH 3/6] BTEmu: Throttle prior to wii remote input update. --- Source/Core/Core/IOS/USB/Bluetooth/BTEmu.cpp | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/Source/Core/Core/IOS/USB/Bluetooth/BTEmu.cpp b/Source/Core/Core/IOS/USB/Bluetooth/BTEmu.cpp index a63ca59ba9..8e89cc927f 100644 --- a/Source/Core/Core/IOS/USB/Bluetooth/BTEmu.cpp +++ b/Source/Core/Core/IOS/USB/Bluetooth/BTEmu.cpp @@ -347,10 +347,13 @@ void BluetoothEmuDevice::Update() wiimote->Update(); const u64 interval = GetSystem().GetSystemTimers().GetTicksPerSecond() / Wiimote::UPDATE_FREQ; - const u64 now = GetSystem().GetCoreTiming().GetTicks(); + auto& core_timing = GetSystem().GetCoreTiming(); + const u64 now = core_timing.GetTicks(); if (now - m_last_ticks > interval) { + // Throttle before Wii Remote update so input is taken just before needed. (lower input latency) + core_timing.Throttle(now); g_controller_interface.SetCurrentInputChannel(ciface::InputChannel::Bluetooth); g_controller_interface.UpdateInput(); From 9ac9813492fda1a84c62d19a2d3b0ed7a19ebe0f Mon Sep 17 00:00:00 2001 From: Jordan Woyak Date: Sun, 2 Mar 2025 23:25:30 -0600 Subject: [PATCH 4/6] SystemTimers: Throttle prior to performance marker. --- Source/Core/Core/HW/SystemTimers.cpp | 2 ++ 1 file changed, 2 insertions(+) diff --git a/Source/Core/Core/HW/SystemTimers.cpp b/Source/Core/Core/HW/SystemTimers.cpp index 022b94bf4d..508b445288 100644 --- a/Source/Core/Core/HW/SystemTimers.cpp +++ b/Source/Core/Core/HW/SystemTimers.cpp @@ -125,6 +125,8 @@ void SystemTimersManager::GPUSleepCallback(Core::System& system, u64 userdata, s void SystemTimersManager::PerfTrackerCallback(Core::System& system, u64 userdata, s64 cycles_late) { auto& core_timing = system.GetCoreTiming(); + // Throttle for accurate performance metrics. + core_timing.Throttle(core_timing.GetTicks() - cycles_late); g_perf_metrics.CountPerformanceMarker(system, cycles_late); // Call this performance tracker again in 1/100th of a second. From c4bd98c6269f41f251d333eeb23cf8ffeb6ec51d Mon Sep 17 00:00:00 2001 From: Jordan Woyak Date: Thu, 6 Mar 2025 03:02:19 -0600 Subject: [PATCH 5/6] VideoInterface: Throttle before VBlank statistics counting. --- Source/Core/Core/HW/VideoInterface.cpp | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/Source/Core/Core/HW/VideoInterface.cpp b/Source/Core/Core/HW/VideoInterface.cpp index bc679492ea..76b31a8dcc 100644 --- a/Source/Core/Core/HW/VideoInterface.cpp +++ b/Source/Core/Core/HW/VideoInterface.cpp @@ -839,6 +839,11 @@ void VideoInterfaceManager::EndField(FieldType field, u64 ticks) if (!Config::Get(Config::GFX_HACK_EARLY_XFB_OUTPUT)) OutputField(field, ticks); + // Note: We really only need to Throttle prior to to presentation, + // but it is needed here if we want accurate "VBlank" statistics, + // when using GPU-on-Thread or Early/Immediate XFB. + m_system.GetCoreTiming().Throttle(ticks); + g_perf_metrics.CountVBlank(); VIEndFieldEvent::Trigger(); Core::OnFrameEnd(m_system); From 7222188cde8f1699e1384d3ec773928f7fb415e2 Mon Sep 17 00:00:00 2001 From: Jordan Woyak Date: Thu, 6 Mar 2025 03:01:53 -0600 Subject: [PATCH 6/6] Core/VideoCommon: Push presentation time calculated from CPU thread to GPU thread. --- Source/Core/Core/CoreTiming.cpp | 30 ++++++++++++++++++++ Source/Core/Core/CoreTiming.h | 4 +++ Source/Core/VideoCommon/AsyncRequests.cpp | 2 +- Source/Core/VideoCommon/AsyncRequests.h | 3 ++ Source/Core/VideoCommon/Present.cpp | 13 ++++++--- Source/Core/VideoCommon/Present.h | 6 ++-- Source/Core/VideoCommon/VideoBackendBase.cpp | 5 ++-- 7 files changed, 52 insertions(+), 11 deletions(-) diff --git a/Source/Core/Core/CoreTiming.cpp b/Source/Core/Core/CoreTiming.cpp index f90c2c6f8f..9987ac84e1 100644 --- a/Source/Core/Core/CoreTiming.cpp +++ b/Source/Core/Core/CoreTiming.cpp @@ -353,6 +353,36 @@ void CoreTimingManager::Advance() power_pc.CheckExternalExceptions(); } +TimePoint CoreTimingManager::GetTargetHostTime(s64 target_cycle) +{ + const double speed = Core::GetIsThrottlerTempDisabled() ? 0.0 : m_emulation_speed; + + if (speed > 0) + { + const s64 cycles = target_cycle - m_throttle_last_cycle; + return m_throttle_deadline + std::chrono::duration_cast
( + DT_s(cycles) / (m_emulation_speed * m_throttle_clock_per_sec)); + } + else + { + return Clock::now(); + } +} + +void CoreTimingManager::SleepUntil(TimePoint time_point) +{ + const TimePoint time = Clock::now(); + + std::this_thread::sleep_until(time_point); + + if (Core::IsCPUThread()) + { + // Count amount of time sleeping for analytics + const TimePoint time_after_sleep = Clock::now(); + g_perf_metrics.CountThrottleSleep(time_after_sleep - time); + } +} + void CoreTimingManager::Throttle(const s64 target_cycle) { // Based on number of cycles and emulation speed, increase the target deadline diff --git a/Source/Core/Core/CoreTiming.h b/Source/Core/Core/CoreTiming.h index 93b3c1e4f1..23bd4c3239 100644 --- a/Source/Core/Core/CoreTiming.h +++ b/Source/Core/Core/CoreTiming.h @@ -98,6 +98,7 @@ public: // doing something evil u64 GetTicks() const; u64 GetIdleTicks() const; + TimePoint GetTargetHostTime(s64 target_cycle); void RefreshConfig(); @@ -157,6 +158,9 @@ public: // Throttle the CPU to the specified target cycle. void Throttle(const s64 target_cycle); + // May be used from any thread. + void SleepUntil(TimePoint time_point); + TimePoint GetCPUTimePoint(s64 cyclesLate) const; // Used by Dolphin Analytics bool GetVISkip() const; // Used By VideoInterface diff --git a/Source/Core/VideoCommon/AsyncRequests.cpp b/Source/Core/VideoCommon/AsyncRequests.cpp index 92c06f0b90..92a7e0c635 100644 --- a/Source/Core/VideoCommon/AsyncRequests.cpp +++ b/Source/Core/VideoCommon/AsyncRequests.cpp @@ -157,7 +157,7 @@ void AsyncRequests::HandleEvent(const AsyncRequests::Event& e) case Event::SWAP_EVENT: g_presenter->ViSwap(e.swap_event.xfbAddr, e.swap_event.fbWidth, e.swap_event.fbStride, - e.swap_event.fbHeight, e.time); + e.swap_event.fbHeight, e.time, e.swap_event.presentation_time); break; case Event::BBOX_READ: diff --git a/Source/Core/VideoCommon/AsyncRequests.h b/Source/Core/VideoCommon/AsyncRequests.h index 5271426f1f..f0b388ffbd 100644 --- a/Source/Core/VideoCommon/AsyncRequests.h +++ b/Source/Core/VideoCommon/AsyncRequests.h @@ -19,6 +19,8 @@ class AsyncRequests public: struct Event { + Event() {} + enum Type { EFB_POKE_COLOR, @@ -55,6 +57,7 @@ public: u32 fbWidth; u32 fbStride; u32 fbHeight; + TimePoint presentation_time; } swap_event; struct diff --git a/Source/Core/VideoCommon/Present.cpp b/Source/Core/VideoCommon/Present.cpp index 8f88c90588..1d1a77b4ca 100644 --- a/Source/Core/VideoCommon/Present.cpp +++ b/Source/Core/VideoCommon/Present.cpp @@ -5,6 +5,7 @@ #include "Common/ChunkFile.h" #include "Core/Config/GraphicsSettings.h" +#include "Core/CoreTiming.h" #include "Core/HW/VideoInterface.h" #include "Core/Host.h" #include "Core/System.h" @@ -17,7 +18,6 @@ #include "VideoCommon/FramebufferManager.h" #include "VideoCommon/OnScreenUI.h" #include "VideoCommon/PostProcessing.h" -#include "VideoCommon/Statistics.h" #include "VideoCommon/VertexManagerBase.h" #include "VideoCommon/VideoConfig.h" #include "VideoCommon/VideoEvents.h" @@ -157,7 +157,8 @@ bool Presenter::FetchXFB(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_heigh return old_xfb_id == m_last_xfb_id; } -void Presenter::ViSwap(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_height, u64 ticks) +void Presenter::ViSwap(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_height, u64 ticks, + TimePoint presentation_time) { bool is_duplicate = FetchXFB(xfb_addr, fb_width, fb_stride, fb_height, ticks); @@ -198,7 +199,7 @@ void Presenter::ViSwap(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_height, if (!is_duplicate || !g_ActiveConfig.bSkipPresentingDuplicateXFBs) { - Present(); + Present(presentation_time); ProcessFrameDumping(ticks); AfterPresentEvent::Trigger(present_info); @@ -814,7 +815,7 @@ void Presenter::RenderXFBToScreen(const MathUtil::Rectangle& target_rc, } } -void Presenter::Present() +void Presenter::Present(std::optional presentation_time) { m_present_count++; @@ -867,6 +868,10 @@ void Presenter::Present() // Present to the window system. { std::lock_guard guard(m_swap_mutex); + + if (presentation_time.has_value()) + Core::System::GetInstance().GetCoreTiming().SleepUntil(*presentation_time); + g_gfx->PresentBackbuffer(); } diff --git a/Source/Core/VideoCommon/Present.h b/Source/Core/VideoCommon/Present.h index 3f8f43a687..a355af4385 100644 --- a/Source/Core/VideoCommon/Present.h +++ b/Source/Core/VideoCommon/Present.h @@ -14,7 +14,6 @@ #include #include #include -#include #include class AbstractTexture; @@ -36,10 +35,11 @@ public: Presenter(); virtual ~Presenter(); - void ViSwap(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_height, u64 ticks); + void ViSwap(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_height, u64 ticks, + TimePoint presentation_time); void ImmediateSwap(u32 xfb_addr, u32 fb_width, u32 fb_stride, u32 fb_height, u64 ticks); - void Present(); + void Present(std::optional presentation_time = std::nullopt); void ClearLastXfbId() { m_last_xfb_id = std::numeric_limits::max(); } bool Initialize(); diff --git a/Source/Core/VideoCommon/VideoBackendBase.cpp b/Source/Core/VideoCommon/VideoBackendBase.cpp index a7a322eab3..c480f3d19b 100644 --- a/Source/Core/VideoCommon/VideoBackendBase.cpp +++ b/Source/Core/VideoCommon/VideoBackendBase.cpp @@ -13,13 +13,13 @@ #include "Common/ChunkFile.h" #include "Common/CommonTypes.h" -#include "Common/Event.h" #include "Common/FileUtil.h" #include "Common/Logging/Log.h" #include "Core/Config/MainSettings.h" #include "Core/ConfigManager.h" #include "Core/Core.h" +#include "Core/CoreTiming.h" #include "Core/DolphinAnalytics.h" #include "Core/System.h" @@ -51,9 +51,7 @@ #include "VideoCommon/FramebufferManager.h" #include "VideoCommon/GeometryShaderManager.h" #include "VideoCommon/GraphicsModSystem/Runtime/GraphicsModManager.h" -#include "VideoCommon/IndexGenerator.h" #include "VideoCommon/OnScreenDisplay.h" -#include "VideoCommon/OpcodeDecoding.h" #include "VideoCommon/PixelEngine.h" #include "VideoCommon/PixelShaderManager.h" #include "VideoCommon/Present.h" @@ -108,6 +106,7 @@ void VideoBackendBase::Video_OutputXFB(u32 xfb_addr, u32 fb_width, u32 fb_stride e.swap_event.fbWidth = fb_width; e.swap_event.fbStride = fb_stride; e.swap_event.fbHeight = fb_height; + e.swap_event.presentation_time = system.GetCoreTiming().GetTargetHostTime(ticks); AsyncRequests::GetInstance()->PushEvent(e, false); } }