GPU: Improve CRTC hblank accuracy

And implement Timer0 gating, it was missing previously.
This commit is contained in:
Stenzek 2024-04-27 21:50:18 +10:00
parent 373721af79
commit 36df91aba0
No known key found for this signature in database
3 changed files with 130 additions and 58 deletions

View File

@ -607,24 +607,10 @@ void GPU::UpdateCRTCConfig()
static constexpr std::array<u16, 8> dot_clock_dividers = {{10, 8, 5, 4, 7, 7, 7, 7}}; static constexpr std::array<u16, 8> dot_clock_dividers = {{10, 8, 5, 4, 7, 7, 7, 7}};
CRTCState& cs = m_crtc_state; CRTCState& cs = m_crtc_state;
if (m_GPUSTAT.pal_mode) cs.vertical_total = m_GPUSTAT.pal_mode ? PAL_TOTAL_LINES : NTSC_TOTAL_LINES;
{ cs.horizontal_total = m_GPUSTAT.pal_mode ? PAL_TICKS_PER_LINE : NTSC_TICKS_PER_LINE;
cs.vertical_total = PAL_TOTAL_LINES; cs.horizontal_active_start = m_GPUSTAT.pal_mode ? PAL_HORIZONTAL_ACTIVE_START : NTSC_HORIZONTAL_ACTIVE_START;
cs.current_scanline %= PAL_TOTAL_LINES; cs.horizontal_active_end = m_GPUSTAT.pal_mode ? PAL_HORIZONTAL_ACTIVE_END : NTSC_HORIZONTAL_ACTIVE_END;
cs.horizontal_total = PAL_TICKS_PER_LINE;
cs.horizontal_sync_start = PAL_HSYNC_TICKS;
cs.current_tick_in_scanline %= System::ScaleTicksToOverclock(PAL_TICKS_PER_LINE);
}
else
{
cs.vertical_total = NTSC_TOTAL_LINES;
cs.current_scanline %= NTSC_TOTAL_LINES;
cs.horizontal_total = NTSC_TICKS_PER_LINE;
cs.horizontal_sync_start = NTSC_HSYNC_TICKS;
cs.current_tick_in_scanline %= System::ScaleTicksToOverclock(NTSC_TICKS_PER_LINE);
}
cs.in_hblank = (cs.current_tick_in_scanline >= cs.horizontal_sync_start);
const u8 horizontal_resolution_index = m_GPUSTAT.horizontal_resolution_1 | (m_GPUSTAT.horizontal_resolution_2 << 2); const u8 horizontal_resolution_index = m_GPUSTAT.horizontal_resolution_1 | (m_GPUSTAT.horizontal_resolution_2 << 2);
cs.dot_clock_divider = dot_clock_dividers[horizontal_resolution_index]; cs.dot_clock_divider = dot_clock_dividers[horizontal_resolution_index];
@ -658,8 +644,17 @@ void GPU::UpdateCRTCConfig()
static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_display_start))); static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_display_start)));
cs.horizontal_display_end = cs.horizontal_display_end =
static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_display_end))); static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_display_end)));
cs.horizontal_active_start =
static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_active_start)));
cs.horizontal_active_end =
static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_active_end)));
cs.horizontal_total = static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_total))); cs.horizontal_total = static_cast<u16>(System::ScaleTicksToOverclock(static_cast<TickCount>(cs.horizontal_total)));
cs.current_tick_in_scanline %= cs.horizontal_total;
cs.UpdateHBlankFlag();
cs.current_scanline %= cs.vertical_total;
System::SetThrottleFrequency(ComputeVerticalFrequency()); System::SetThrottleFrequency(ComputeVerticalFrequency());
UpdateCRTCDisplayParameters(); UpdateCRTCDisplayParameters();
@ -872,20 +867,36 @@ void GPU::UpdateCRTCTickEvent()
ticks_until_event = std::min(ticks_until_event, std::max<TickCount>(ticks_until_irq, 0)); ticks_until_event = std::min(ticks_until_event, std::max<TickCount>(ticks_until_irq, 0));
} }
#if 0 if (Timers::IsSyncEnabled(DOT_TIMER_INDEX))
const TickCount ticks_until_hblank = {
(m_crtc_state.current_tick_in_scanline >= m_crtc_state.horizontal_display_end) ? // This could potentially be optimized to skip the time the gate is active, if we're resetting and free running.
(m_crtc_state.horizontal_total - m_crtc_state.current_tick_in_scanline + m_crtc_state.horizontal_display_end) : // But realistically, I've only seen sync off (most games), or reset+pause on gate (Konami Lightgun games).
(m_crtc_state.horizontal_display_end - m_crtc_state.current_tick_in_scanline); TickCount ticks_until_hblank_start_or_end;
#endif if (m_crtc_state.current_tick_in_scanline >= m_crtc_state.horizontal_active_end)
{
ticks_until_hblank_start_or_end =
m_crtc_state.horizontal_total - m_crtc_state.current_tick_in_scanline + m_crtc_state.horizontal_active_start;
}
else if (m_crtc_state.current_tick_in_scanline < m_crtc_state.horizontal_active_start)
{
ticks_until_hblank_start_or_end = m_crtc_state.horizontal_active_start - m_crtc_state.current_tick_in_scanline;
}
else
{
ticks_until_hblank_start_or_end = m_crtc_state.horizontal_active_end - m_crtc_state.current_tick_in_scanline;
}
ticks_until_event = std::min(ticks_until_event, ticks_until_hblank_start_or_end);
}
m_crtc_tick_event->Schedule(CRTCTicksToSystemTicks(ticks_until_event, m_crtc_state.fractional_ticks)); m_crtc_tick_event->Schedule(CRTCTicksToSystemTicks(ticks_until_event, m_crtc_state.fractional_ticks));
} }
bool GPU::IsCRTCScanlinePending() const bool GPU::IsCRTCScanlinePending() const
{ {
// TODO: Most of these should be fields, not lines.
const TickCount ticks = (GetPendingCRTCTicks() + m_crtc_state.current_tick_in_scanline); const TickCount ticks = (GetPendingCRTCTicks() + m_crtc_state.current_tick_in_scanline);
return (ticks >= (m_crtc_state.in_hblank ? m_crtc_state.horizontal_total : m_crtc_state.horizontal_sync_start)); return (ticks >= m_crtc_state.horizontal_total);
} }
bool GPU::IsCommandCompletionPending() const bool GPU::IsCommandCompletionPending() const
@ -896,28 +907,32 @@ bool GPU::IsCommandCompletionPending() const
void GPU::CRTCTickEvent(TickCount ticks) void GPU::CRTCTickEvent(TickCount ticks)
{ {
// convert cpu/master clock to GPU ticks, accounting for partial cycles because of the non-integer divider // convert cpu/master clock to GPU ticks, accounting for partial cycles because of the non-integer divider
{ const TickCount prev_tick = m_crtc_state.current_tick_in_scanline;
const TickCount gpu_ticks = SystemTicksToCRTCTicks(ticks, &m_crtc_state.fractional_ticks); const TickCount gpu_ticks = SystemTicksToCRTCTicks(ticks, &m_crtc_state.fractional_ticks);
m_crtc_state.current_tick_in_scanline += gpu_ticks; m_crtc_state.current_tick_in_scanline += gpu_ticks;
if (Timers::IsUsingExternalClock(DOT_TIMER_INDEX)) if (Timers::IsUsingExternalClock(DOT_TIMER_INDEX))
{ {
m_crtc_state.fractional_dot_ticks += gpu_ticks; m_crtc_state.fractional_dot_ticks += gpu_ticks;
const TickCount dots = m_crtc_state.fractional_dot_ticks / m_crtc_state.dot_clock_divider; const TickCount dots = m_crtc_state.fractional_dot_ticks / m_crtc_state.dot_clock_divider;
m_crtc_state.fractional_dot_ticks = m_crtc_state.fractional_dot_ticks % m_crtc_state.dot_clock_divider; m_crtc_state.fractional_dot_ticks = m_crtc_state.fractional_dot_ticks % m_crtc_state.dot_clock_divider;
if (dots > 0) if (dots > 0)
Timers::AddTicks(DOT_TIMER_INDEX, dots); Timers::AddTicks(DOT_TIMER_INDEX, dots);
}
} }
if (m_crtc_state.current_tick_in_scanline < m_crtc_state.horizontal_total) if (m_crtc_state.current_tick_in_scanline < m_crtc_state.horizontal_total)
{ {
// short path when we execute <1 line.. this shouldn't occur often. // short path when we execute <1 line.. this shouldn't occur often, except when gated (konami lightgun games).
const bool old_hblank = m_crtc_state.in_hblank; m_crtc_state.UpdateHBlankFlag();
const bool new_hblank = (m_crtc_state.current_tick_in_scanline >= m_crtc_state.horizontal_sync_start); Timers::SetGate(DOT_TIMER_INDEX, m_crtc_state.in_hblank);
m_crtc_state.in_hblank = new_hblank; if (Timers::IsUsingExternalClock(HBLANK_TIMER_INDEX))
if (!old_hblank && new_hblank && Timers::IsUsingExternalClock(HBLANK_TIMER_INDEX)) {
Timers::AddTicks(HBLANK_TIMER_INDEX, 1); const u32 hblank_timer_ticks =
BoolToUInt32(m_crtc_state.current_tick_in_scanline >= m_crtc_state.horizontal_active_end) -
BoolToUInt32(prev_tick >= m_crtc_state.horizontal_active_end);
if (hblank_timer_ticks > 0)
Timers::AddTicks(HBLANK_TIMER_INDEX, static_cast<TickCount>(hblank_timer_ticks));
}
UpdateCRTCTickEvent(); UpdateCRTCTickEvent();
return; return;
@ -927,16 +942,23 @@ void GPU::CRTCTickEvent(TickCount ticks)
m_crtc_state.current_tick_in_scanline %= m_crtc_state.horizontal_total; m_crtc_state.current_tick_in_scanline %= m_crtc_state.horizontal_total;
#if 0 #if 0
Log_WarningPrintf("Old line: %u, new line: %u, drawing %u", m_crtc_state.current_scanline, Log_WarningPrintf("Old line: %u, new line: %u, drawing %u", m_crtc_state.current_scanline,
m_crtc_state.current_scanline + lines_to_draw, lines_to_draw); m_crtc_state.current_scanline + lines_to_draw, lines_to_draw);
#endif #endif
const bool old_hblank = m_crtc_state.in_hblank; m_crtc_state.UpdateHBlankFlag();
const bool new_hblank = (m_crtc_state.current_tick_in_scanline >= m_crtc_state.horizontal_sync_start); Timers::SetGate(DOT_TIMER_INDEX, m_crtc_state.in_hblank);
m_crtc_state.in_hblank = new_hblank;
if (Timers::IsUsingExternalClock(HBLANK_TIMER_INDEX)) if (Timers::IsUsingExternalClock(HBLANK_TIMER_INDEX))
{ {
const u32 hblank_timer_ticks = BoolToUInt32(!old_hblank) + BoolToUInt32(new_hblank) + (lines_to_draw - 1); // lines_to_draw => number of times ticks passed horizontal_total.
Timers::AddTicks(HBLANK_TIMER_INDEX, static_cast<TickCount>(hblank_timer_ticks)); // Subtract one if we were previously in hblank, but only on that line. If it was previously less than
// horizontal_active_start, we still want to add one, because hblank would have gone inactive, and then active again
// during the line. Finally add the current line being drawn, if hblank went inactive->active during the line.
const u32 hblank_timer_ticks =
lines_to_draw - BoolToUInt32(prev_tick >= m_crtc_state.horizontal_active_end) +
BoolToUInt32(m_crtc_state.current_tick_in_scanline >= m_crtc_state.horizontal_active_end);
if (hblank_timer_ticks > 0)
Timers::AddTicks(HBLANK_TIMER_INDEX, static_cast<TickCount>(hblank_timer_ticks));
} }
while (lines_to_draw > 0) while (lines_to_draw > 0)
@ -1080,11 +1102,45 @@ bool GPU::ConvertDisplayCoordinatesToBeamTicksAndLines(float display_x, float di
*out_line = (static_cast<u32>(std::round(display_y)) >> BoolToUInt8(m_GPUSTAT.vertical_interlace)) + *out_line = (static_cast<u32>(std::round(display_y)) >> BoolToUInt8(m_GPUSTAT.vertical_interlace)) +
m_crtc_state.vertical_visible_start; m_crtc_state.vertical_visible_start;
*out_tick = static_cast<u32>(std::round(display_x * static_cast<float>(m_crtc_state.dot_clock_divider))) + *out_tick = static_cast<u32>(System::ScaleTicksToOverclock(
static_cast<TickCount>(std::round(display_x * static_cast<float>(m_crtc_state.dot_clock_divider))))) +
m_crtc_state.horizontal_visible_start; m_crtc_state.horizontal_visible_start;
return true; return true;
} }
void GPU::GetBeamPosition(u32* out_ticks, u32* out_line)
{
const u32 current_tick = (GetPendingCRTCTicks() + m_crtc_state.current_tick_in_scanline);
*out_line =
(m_crtc_state.current_scanline + (current_tick / m_crtc_state.horizontal_total)) % m_crtc_state.vertical_total;
*out_ticks = current_tick % m_crtc_state.horizontal_total;
}
TickCount GPU::GetSystemTicksUntilTicksAndLine(u32 ticks, u32 line)
{
u32 current_tick, current_line;
GetBeamPosition(&current_tick, &current_line);
u32 ticks_to_target;
if (ticks >= current_tick)
{
ticks_to_target = ticks - current_tick;
}
else
{
ticks_to_target = (m_crtc_state.horizontal_total - current_tick) + ticks;
current_line = (current_line + 1) % m_crtc_state.vertical_total;
}
const u32 lines_to_target =
(line >= current_line) ? (line - current_line) : ((m_crtc_state.vertical_total - current_line) + line);
const TickCount total_ticks_to_target =
static_cast<TickCount>((lines_to_target * m_crtc_state.horizontal_total) + ticks_to_target);
return CRTCTicksToSystemTicks(total_ticks_to_target, m_crtc_state.fractional_ticks);
}
u32 GPU::ReadGPUREAD() u32 GPU::ReadGPUREAD()
{ {
if (m_blitter_state != BlitterState::ReadingVRAM) if (m_blitter_state != BlitterState::ReadingVRAM)

View File

@ -67,10 +67,8 @@ public:
enum : u16 enum : u16
{ {
NTSC_TICKS_PER_LINE = 3413, NTSC_TICKS_PER_LINE = 3413,
NTSC_HSYNC_TICKS = 200,
NTSC_TOTAL_LINES = 263, NTSC_TOTAL_LINES = 263,
PAL_TICKS_PER_LINE = 3406, PAL_TICKS_PER_LINE = 3406,
PAL_HSYNC_TICKS = 200, // actually one more on odd lines
PAL_TOTAL_LINES = 314, PAL_TOTAL_LINES = 314,
}; };
@ -183,8 +181,19 @@ public:
bool ConvertDisplayCoordinatesToBeamTicksAndLines(float display_x, float display_y, float x_scale, u32* out_tick, bool ConvertDisplayCoordinatesToBeamTicksAndLines(float display_x, float display_y, float x_scale, u32* out_tick,
u32* out_line) const; u32* out_line) const;
// Returns the current beam position.
void GetBeamPosition(u32* out_ticks, u32* out_line);
// Returns the number of system clock ticks until the specified tick/line.
TickCount GetSystemTicksUntilTicksAndLine(u32 ticks, u32 line);
// Returns the number of visible lines.
ALWAYS_INLINE u16 GetCRTCActiveStartLine() const { return m_crtc_state.vertical_display_start; }
ALWAYS_INLINE u16 GetCRTCActiveEndLine() const { return m_crtc_state.vertical_display_end; }
// Returns the video clock frequency. // Returns the video clock frequency.
TickCount GetCRTCFrequency() const; TickCount GetCRTCFrequency() const;
u16 GetCRTCDotClockDivider() const { return m_crtc_state.dot_clock_divider; }
// Dumps raw VRAM to a file. // Dumps raw VRAM to a file.
bool DumpVRAMToFile(const char* filename); bool DumpVRAMToFile(const char* filename);
@ -517,8 +526,10 @@ protected:
u16 vertical_display_start; u16 vertical_display_start;
u16 vertical_display_end; u16 vertical_display_end;
u16 horizontal_active_start;
u16 horizontal_active_end;
u16 horizontal_total; u16 horizontal_total;
u16 horizontal_sync_start; // <- not currently saved to state, so we don't have to bump the version
u16 vertical_total; u16 vertical_total;
TickCount fractional_ticks; TickCount fractional_ticks;
@ -533,6 +544,12 @@ protected:
u8 interlaced_field; // 0 = odd, 1 = even u8 interlaced_field; // 0 = odd, 1 = even
u8 interlaced_display_field; u8 interlaced_display_field;
u8 active_line_lsb; u8 active_line_lsb;
ALWAYS_INLINE void UpdateHBlankFlag()
{
in_hblank =
(current_tick_in_scanline < horizontal_active_start || current_tick_in_scanline >= horizontal_active_end);
}
} m_crtc_state = {}; } m_crtc_state = {};
BlitterState m_blitter_state = BlitterState::Idle; BlitterState m_blitter_state = BlitterState::Idle;

View File

@ -166,7 +166,9 @@ void Timers::SetGate(u32 timer, bool state)
if (!cs.mode.sync_enable) if (!cs.mode.sync_enable)
return; return;
if (cs.counting_enabled && !cs.use_external_clock) // Because the gate prevents counting in or outside of the gate, we need a correct counter.
// For reset, we _can_ skip it, until the gate clears.
if (!cs.use_external_clock && (cs.mode.sync_mode != SyncMode::ResetOnGate || !state))
s_sysclk_event->InvokeEarly(); s_sysclk_event->InvokeEarly();
if (state) if (state)
@ -415,11 +417,8 @@ void Timers::UpdateCountingEnabled(CounterState& cs)
switch (cs.mode.sync_mode) switch (cs.mode.sync_mode)
{ {
case SyncMode::PauseOnGate: case SyncMode::PauseOnGate:
cs.counting_enabled = !cs.gate;
break;
case SyncMode::ResetOnGate: case SyncMode::ResetOnGate:
cs.counting_enabled = true; cs.counting_enabled = !cs.gate;
break; break;
case SyncMode::ResetAndRunOnGate: case SyncMode::ResetAndRunOnGate:
@ -489,7 +488,7 @@ void Timers::DrawDebugStateWindow()
const float framebuffer_scale = Host::GetOSDScale(); const float framebuffer_scale = Host::GetOSDScale();
ImGui::SetNextWindowSize(ImVec2(800.0f * framebuffer_scale, 100.0f * framebuffer_scale), ImGuiCond_FirstUseEver); ImGui::SetNextWindowSize(ImVec2(800.0f * framebuffer_scale, 115.0f * framebuffer_scale), ImGuiCond_FirstUseEver);
if (!ImGui::Begin("Timer State", nullptr)) if (!ImGui::Begin("Timer State", nullptr))
{ {
ImGui::End(); ImGui::End();