From 9f6c0ca69519be36fdf87372017b74df3c8d0785 Mon Sep 17 00:00:00 2001 From: adelikat Date: Sat, 17 Jan 2015 21:09:33 +0000 Subject: [PATCH] NES - remove the partial class closure on the PPU object files --- .../Consoles/Nintendo/NES/Boards/ExROM.cs | 4 +- .../Consoles/Nintendo/NES/Core.cs | 2 +- .../Consoles/Nintendo/NES/NES.ISettable.cs | 4 +- .../Consoles/Nintendo/NES/PPU.cs | 451 ++++--- .../Consoles/Nintendo/NES/PPU.regs.cs | 1063 ++++++++--------- .../Consoles/Nintendo/NES/PPU.run.cs | 865 +++++++------- 6 files changed, 1190 insertions(+), 1199 deletions(-) diff --git a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Boards/ExROM.cs b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Boards/ExROM.cs index a19af89b18..1080dc4032 100644 --- a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Boards/ExROM.cs +++ b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Boards/ExROM.cs @@ -244,7 +244,7 @@ namespace BizHawk.Emulation.Cores.Nintendo.NES int bank_1k = addr >> 10; int ofs = addr & ((1 << 10) - 1); - if (exram_mode == 1 && NES.ppu.ppuphase == NES.PPU.PPUPHASE.BG) + if (exram_mode == 1 && NES.ppu.ppuphase == PPU.PPUPHASE.BG) { int exram_addr = last_nt_read; int bank_4k = EXRAM[exram_addr] & 0x3F; @@ -266,7 +266,7 @@ namespace BizHawk.Emulation.Cores.Nintendo.NES && NES.ppu.reg_2001.show_obj ) { - if (NES.ppu.ppuphase == NES.PPU.PPUPHASE.OBJ) + if (NES.ppu.ppuphase == PPU.PPUPHASE.OBJ) bank_1k = a_banks_1k[bank_1k]; else bank_1k = b_banks_1k[bank_1k]; diff --git a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Core.cs b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Core.cs index e5931a67b1..d200b43c61 100644 --- a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Core.cs +++ b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/Core.cs @@ -296,7 +296,7 @@ namespace BizHawk.Emulation.Cores.Nintendo.NES #if VS2012 [MethodImpl(MethodImplOptions.AggressiveInlining)] #endif - private void RunCpuOne() + internal void RunCpuOne() { cpu_stepcounter++; if (cpu_stepcounter == cpu_sequence[cpu_step]) diff --git a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/NES.ISettable.cs b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/NES.ISettable.cs index 333a91a1bc..09ba773b20 100644 --- a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/NES.ISettable.cs +++ b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/NES.ISettable.cs @@ -54,8 +54,8 @@ namespace BizHawk.Emulation.Cores.Nintendo.NES return ret; } - private NESSettings Settings = new NESSettings(); - private NESSyncSettings SyncSettings = new NESSyncSettings(); + internal NESSettings Settings = new NESSettings(); + internal NESSyncSettings SyncSettings = new NESSyncSettings(); public class NESSyncSettings { diff --git a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.cs b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.cs index ec9fc98d7b..76985296f3 100644 --- a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.cs +++ b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.cs @@ -6,237 +6,234 @@ using BizHawk.Common; namespace BizHawk.Emulation.Cores.Nintendo.NES { - partial class NES + public sealed partial class PPU { - public sealed partial class PPU + // this only handles region differences within the PPU + int preNMIlines; + int postNMIlines; + bool chopdot; + public enum Region { NTSC, PAL, Dendy, RGB }; + Region _region; + public Region region { set { _region = value; SyncRegion(); } get { return _region; } } + void SyncRegion() { - // this only handles region differences within the PPU - int preNMIlines; - int postNMIlines; - bool chopdot; - public enum Region { NTSC, PAL, Dendy, RGB }; - Region _region; - public Region region { set { _region = value; SyncRegion(); } get { return _region; } } - void SyncRegion() + switch (region) { - switch (region) - { - case Region.NTSC: - preNMIlines = 1; postNMIlines = 20; chopdot = true; break; - case Region.PAL: - preNMIlines = 1; postNMIlines = 70; chopdot = false; break; - case Region.Dendy: - preNMIlines = 51; postNMIlines = 20; chopdot = false; break; - case Region.RGB: - preNMIlines = 1; postNMIlines = 20; chopdot = false; break; - } + case Region.NTSC: + preNMIlines = 1; postNMIlines = 20; chopdot = true; break; + case Region.PAL: + preNMIlines = 1; postNMIlines = 70; chopdot = false; break; + case Region.Dendy: + preNMIlines = 51; postNMIlines = 20; chopdot = false; break; + case Region.RGB: + preNMIlines = 1; postNMIlines = 20; chopdot = false; break; } - - public class DebugCallback - { - public int Scanline; - //public int Dot; //not supported - public Action Callback; - } - - public DebugCallback NTViewCallback; - public DebugCallback PPUViewCallback; - - // true = light sensed - public bool LightGunCallback(int x, int y) - { - // the actual light gun circuit is very complex - // and this doesn't do it justice at all, as expected - - const int radius = 10; // look at pixel values up to this far away, roughly - - int sum = 0; - int ymin = Math.Max(Math.Max(y - radius, ppur.status.sl - 20), 0); - int ymax = Math.Min(y + radius, 239); - int xmin = Math.Max(x - radius, 0); - int xmax = Math.Min(x + radius, 255); - - int ystop = ppur.status.sl - 2; - int xstop = ppur.status.cycle - 20; - - for (int j = ymin; j <= ymax; j++) - { - for (int i = xmin; i <= xmax; i++) - { - if (j >= ystop && i >= xstop || j > ystop) - goto loopout; - - short s = xbuf[j * 256 + i]; - int lum = s & 0x30; - if ((s & 0x0f) >= 0x0e) - lum = 0; - sum += lum; - } - } - loopout: - return sum >= 2000; - } - - - //when the ppu issues a write it goes through here and into the game board - public void ppubus_write(int addr, byte value) - { - nes.Board.AddressPPU(addr); - nes.Board.WritePPU(addr, value); - } - - //when the ppu issues a read it goes through here and into the game board - public byte ppubus_read(int addr, bool ppu) - { - //hardware doesnt touch the bus when the PPU is disabled - if (!reg_2001.PPUON && ppu) - return 0xFF; - - nes.Board.AddressPPU(addr); - return nes.Board.ReadPPU(addr); - } - - //debug tools peek into the ppu through this - public byte ppubus_peek(int addr) - { - return nes.Board.PeekPPU(addr); - } - - public enum PPUPHASE - { - VBL, BG, OBJ - }; - public PPUPHASE ppuphase; - - private readonly NES nes; - public PPU(NES nes) - { - this.nes = nes; - - OAM = new byte[0x100]; - PALRAM = new byte[0x20]; - - //power-up palette verified by blargg's power_up_palette test. - //he speculates that these may differ depending on the system tested.. - //and I don't see why the ppu would waste any effort setting these.. - //but for the sake of uniformity, we'll do it. - Array.Copy(new byte[] { - 0x09,0x01,0x00,0x01,0x00,0x02,0x02,0x0D,0x08,0x10,0x08,0x24,0x00,0x00,0x04,0x2C, - 0x09,0x01,0x34,0x03,0x00,0x04,0x00,0x14,0x08,0x3A,0x00,0x02,0x00,0x20,0x2C,0x08 - }, PALRAM, 0x20); - - Reset(); - } - - public void NESSoftReset() - { - //this hasn't been brought up to date since NEShawk was first made. - //in particular http://wiki.nesdev.com/w/index.php/PPU_power_up_state should be studied, but theres no use til theres test cases - Reset(); - } - - //state - int ppudead; //measured in frames - bool idleSynch; - int NMI_PendingInstructions; - byte PPUGenLatch; - bool vtoggle; - byte VRAMBuffer; - public byte[] OAM; - public byte[] PALRAM; - - public void SyncState(Serializer ser) - { - ser.Sync("ppudead", ref ppudead); - ser.Sync("idleSynch", ref idleSynch); - ser.Sync("NMI_PendingInstructions", ref NMI_PendingInstructions); - ser.Sync("PPUGenLatch", ref PPUGenLatch); - ser.Sync("vtoggle", ref vtoggle); - ser.Sync("VRAMBuffer", ref VRAMBuffer); - ser.Sync("ppu_addr_temp", ref ppu_addr_temp); - - ser.Sync("OAM", ref OAM, false); - ser.Sync("PALRAM", ref PALRAM, false); - - ser.Sync("Reg2002_objoverflow", ref Reg2002_objoverflow); - ser.Sync("Reg2002_objhit", ref Reg2002_objhit); - ser.Sync("Reg2002_vblank_active", ref Reg2002_vblank_active); - ser.Sync("Reg2002_vblank_active_pending", ref Reg2002_vblank_active_pending); - ser.Sync("Reg2002_vblank_clear_pending", ref Reg2002_vblank_clear_pending); - ppur.SyncState(ser); - byte temp8 = reg_2000.Value; ser.Sync("reg_2000.Value", ref temp8); reg_2000.Value = temp8; - temp8 = reg_2001.Value; ser.Sync("reg_2001.Value", ref temp8); reg_2001.Value = temp8; - ser.Sync("reg_2003", ref reg_2003); - - //don't sync framebuffer into binary (rewind) states - if(ser.IsText) - ser.Sync("xbuf", ref xbuf, false); - } - - public void Reset() - { - regs_reset(); - ppudead = 2; - idleSynch = true; - } - -#if VS2012 - [MethodImpl(MethodImplOptions.AggressiveInlining)] -#endif - void TriggerNMI() - { - nes.cpu.NMI = true; - } - - //this gets called once after each cpu instruction executes. - //anything that needs to happen at instruction granularity can get checked here - //to save having to check it at ppu cycle granularity - public void PostCpuInstructionOne() - { - if (NMI_PendingInstructions > 0) - { - NMI_PendingInstructions--; - if (NMI_PendingInstructions <= 0) - { - TriggerNMI(); - } - } - } - -#if VS2012 - [MethodImpl(MethodImplOptions.AggressiveInlining)] -#endif - void runppu(int x) - { - //run one ppu cycle at a time so we can interact with the ppu and clockPPU at high granularity - for (int i = 0; i < x; i++) - { - ppur.status.cycle++; - - //might not actually run a cpu cycle if there are none to be run right now - nes.RunCpuOne(); - - if (Reg2002_vblank_active_pending) - { - //if (Reg2002_vblank_active_pending) - Reg2002_vblank_active = 1; - Reg2002_vblank_active_pending = false; - } - - if (Reg2002_vblank_clear_pending) - { - Reg2002_vblank_active = 0; - Reg2002_vblank_clear_pending = false; - } - - nes.Board.ClockPPU(); - } - } - - //hack - //public bool PAL = false; - //bool SPRITELIMIT = true; - } + + public class DebugCallback + { + public int Scanline; + //public int Dot; //not supported + public Action Callback; + } + + public DebugCallback NTViewCallback; + public DebugCallback PPUViewCallback; + + // true = light sensed + public bool LightGunCallback(int x, int y) + { + // the actual light gun circuit is very complex + // and this doesn't do it justice at all, as expected + + const int radius = 10; // look at pixel values up to this far away, roughly + + int sum = 0; + int ymin = Math.Max(Math.Max(y - radius, ppur.status.sl - 20), 0); + int ymax = Math.Min(y + radius, 239); + int xmin = Math.Max(x - radius, 0); + int xmax = Math.Min(x + radius, 255); + + int ystop = ppur.status.sl - 2; + int xstop = ppur.status.cycle - 20; + + for (int j = ymin; j <= ymax; j++) + { + for (int i = xmin; i <= xmax; i++) + { + if (j >= ystop && i >= xstop || j > ystop) + goto loopout; + + short s = xbuf[j * 256 + i]; + int lum = s & 0x30; + if ((s & 0x0f) >= 0x0e) + lum = 0; + sum += lum; + } + } + loopout: + return sum >= 2000; + } + + + //when the ppu issues a write it goes through here and into the game board + public void ppubus_write(int addr, byte value) + { + nes.Board.AddressPPU(addr); + nes.Board.WritePPU(addr, value); + } + + //when the ppu issues a read it goes through here and into the game board + public byte ppubus_read(int addr, bool ppu) + { + //hardware doesnt touch the bus when the PPU is disabled + if (!reg_2001.PPUON && ppu) + return 0xFF; + + nes.Board.AddressPPU(addr); + return nes.Board.ReadPPU(addr); + } + + //debug tools peek into the ppu through this + public byte ppubus_peek(int addr) + { + return nes.Board.PeekPPU(addr); + } + + public enum PPUPHASE + { + VBL, BG, OBJ + }; + public PPUPHASE ppuphase; + + private readonly NES nes; + public PPU(NES nes) + { + this.nes = nes; + + OAM = new byte[0x100]; + PALRAM = new byte[0x20]; + + //power-up palette verified by blargg's power_up_palette test. + //he speculates that these may differ depending on the system tested.. + //and I don't see why the ppu would waste any effort setting these.. + //but for the sake of uniformity, we'll do it. + Array.Copy(new byte[] { + 0x09,0x01,0x00,0x01,0x00,0x02,0x02,0x0D,0x08,0x10,0x08,0x24,0x00,0x00,0x04,0x2C, + 0x09,0x01,0x34,0x03,0x00,0x04,0x00,0x14,0x08,0x3A,0x00,0x02,0x00,0x20,0x2C,0x08 + }, PALRAM, 0x20); + + Reset(); + } + + public void NESSoftReset() + { + //this hasn't been brought up to date since NEShawk was first made. + //in particular http://wiki.nesdev.com/w/index.php/PPU_power_up_state should be studied, but theres no use til theres test cases + Reset(); + } + + //state + int ppudead; //measured in frames + bool idleSynch; + int NMI_PendingInstructions; + byte PPUGenLatch; + bool vtoggle; + byte VRAMBuffer; + public byte[] OAM; + public byte[] PALRAM; + + public void SyncState(Serializer ser) + { + ser.Sync("ppudead", ref ppudead); + ser.Sync("idleSynch", ref idleSynch); + ser.Sync("NMI_PendingInstructions", ref NMI_PendingInstructions); + ser.Sync("PPUGenLatch", ref PPUGenLatch); + ser.Sync("vtoggle", ref vtoggle); + ser.Sync("VRAMBuffer", ref VRAMBuffer); + ser.Sync("ppu_addr_temp", ref ppu_addr_temp); + + ser.Sync("OAM", ref OAM, false); + ser.Sync("PALRAM", ref PALRAM, false); + + ser.Sync("Reg2002_objoverflow", ref Reg2002_objoverflow); + ser.Sync("Reg2002_objhit", ref Reg2002_objhit); + ser.Sync("Reg2002_vblank_active", ref Reg2002_vblank_active); + ser.Sync("Reg2002_vblank_active_pending", ref Reg2002_vblank_active_pending); + ser.Sync("Reg2002_vblank_clear_pending", ref Reg2002_vblank_clear_pending); + ppur.SyncState(ser); + byte temp8 = reg_2000.Value; ser.Sync("reg_2000.Value", ref temp8); reg_2000.Value = temp8; + temp8 = reg_2001.Value; ser.Sync("reg_2001.Value", ref temp8); reg_2001.Value = temp8; + ser.Sync("reg_2003", ref reg_2003); + + //don't sync framebuffer into binary (rewind) states + if(ser.IsText) + ser.Sync("xbuf", ref xbuf, false); + } + + public void Reset() + { + regs_reset(); + ppudead = 2; + idleSynch = true; + } + +#if VS2012 + [MethodImpl(MethodImplOptions.AggressiveInlining)] +#endif + void TriggerNMI() + { + nes.cpu.NMI = true; + } + + //this gets called once after each cpu instruction executes. + //anything that needs to happen at instruction granularity can get checked here + //to save having to check it at ppu cycle granularity + public void PostCpuInstructionOne() + { + if (NMI_PendingInstructions > 0) + { + NMI_PendingInstructions--; + if (NMI_PendingInstructions <= 0) + { + TriggerNMI(); + } + } + } + +#if VS2012 + [MethodImpl(MethodImplOptions.AggressiveInlining)] +#endif + void runppu(int x) + { + //run one ppu cycle at a time so we can interact with the ppu and clockPPU at high granularity + for (int i = 0; i < x; i++) + { + ppur.status.cycle++; + + //might not actually run a cpu cycle if there are none to be run right now + nes.RunCpuOne(); + + if (Reg2002_vblank_active_pending) + { + //if (Reg2002_vblank_active_pending) + Reg2002_vblank_active = 1; + Reg2002_vblank_active_pending = false; + } + + if (Reg2002_vblank_clear_pending) + { + Reg2002_vblank_active = 0; + Reg2002_vblank_clear_pending = false; + } + + nes.Board.ClockPPU(); + } + } + + //hack + //public bool PAL = false; + //bool SPRITELIMIT = true; + } } diff --git a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.regs.cs b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.regs.cs index 463387340a..203f0820d6 100644 --- a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.regs.cs +++ b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.regs.cs @@ -17,546 +17,543 @@ using BizHawk.Common; namespace BizHawk.Emulation.Cores.Nintendo.NES { - partial class NES + sealed partial class PPU { - sealed partial class PPU + public sealed class Reg_2001 { - public sealed class Reg_2001 + public Bit color_disable; //Color disable (0: normal color; 1: AND all palette entries with 110000, effectively producing a monochrome display) + public Bit show_bg_leftmost; //Show leftmost 8 pixels of background + public Bit show_obj_leftmost; //Show sprites in leftmost 8 pixels + public Bit show_bg; //Show background + public Bit show_obj; //Show sprites + public Bit intense_green; //Intensify greens (and darken other colors) + public Bit intense_blue; //Intensify blues (and darken other colors) + public Bit intense_red; //Intensify reds (and darken other colors) + + public int intensity_lsl_6; //an optimization.. + + public bool PPUON { get { return show_bg || show_obj; } } + + public byte Value { - public Bit color_disable; //Color disable (0: normal color; 1: AND all palette entries with 110000, effectively producing a monochrome display) - public Bit show_bg_leftmost; //Show leftmost 8 pixels of background - public Bit show_obj_leftmost; //Show sprites in leftmost 8 pixels - public Bit show_bg; //Show background - public Bit show_obj; //Show sprites - public Bit intense_green; //Intensify greens (and darken other colors) - public Bit intense_blue; //Intensify blues (and darken other colors) - public Bit intense_red; //Intensify reds (and darken other colors) - - public int intensity_lsl_6; //an optimization.. - - public bool PPUON { get { return show_bg || show_obj; } } - - public byte Value + get { - get - { - return (byte)(color_disable | (show_bg_leftmost << 1) | (show_obj_leftmost << 2) | (show_bg << 3) | (show_obj << 4) | (intense_green << 5) | (intense_blue << 6) | (intense_red << 7)); - } - set - { - color_disable = (value & 1); - show_bg_leftmost = (value >> 1) & 1; - show_obj_leftmost = (value >> 2) & 1; - show_bg = (value >> 3) & 1; - show_obj = (value >> 4) & 1; - intense_green = (value >> 5) & 1; - intense_blue = (value >> 6) & 1; - intense_red = (value >> 7) & 1; - intensity_lsl_6 = ((value >> 5) & 7)<<6; - } + return (byte)(color_disable | (show_bg_leftmost << 1) | (show_obj_leftmost << 2) | (show_bg << 3) | (show_obj << 4) | (intense_green << 5) | (intense_blue << 6) | (intense_red << 7)); + } + set + { + color_disable = (value & 1); + show_bg_leftmost = (value >> 1) & 1; + show_obj_leftmost = (value >> 2) & 1; + show_bg = (value >> 3) & 1; + show_obj = (value >> 4) & 1; + intense_green = (value >> 5) & 1; + intense_blue = (value >> 6) & 1; + intense_red = (value >> 7) & 1; + intensity_lsl_6 = ((value >> 5) & 7)<<6; } } - - - public struct PPUSTATUS - { - public int sl; - public bool rendering { get { return sl >= 0 && sl < 241; } } - public int cycle; - } - - //uses the internal counters concept at http://nesdev.icequake.net/PPU%20addressing.txt - //TODO - this should be turned into a state machine - public sealed class PPUREGS - { - PPU ppu; - public PPUREGS(PPU ppu) - { - this.ppu = ppu; - reset(); - } - - public void SyncState(Serializer ser) - { - ser.Sync("fv", ref fv); - ser.Sync("v", ref v); - ser.Sync("h", ref h); - ser.Sync("vt", ref vt); - ser.Sync("ht", ref ht); - ser.Sync("_fv", ref _fv); - ser.Sync("_v", ref _v); - ser.Sync("_h", ref _h); - ser.Sync("_vt", ref _vt); - ser.Sync("_ht", ref _ht); - ser.Sync("fh", ref fh); - ser.Sync("status.cycle", ref status.cycle); - int junk = 0; - ser.Sync("status.end_cycle", ref junk); - ser.Sync("status.sl", ref status.sl); - } - - //normal clocked regs. as the game can interfere with these at any time, they need to be savestated - public int fv;//3 - public int v;//1 - public int h;//1 - public int vt;//5 - public int ht;//5 - - //temp unlatched regs (need savestating, can be written to at any time) - public int _fv, _vt, _v, _h, _ht; - - //other regs that need savestating - public int fh;//3 (horz scroll) - - //cached state data. these are always reset at the beginning of a frame and don't need saving - //but just to be safe, we're gonna save it - public PPUSTATUS status = new PPUSTATUS(); - - //public int ComputeIndex() - //{ - // return fv | (v << 3) | (h << 4) | (vt << 5) | (ht << 10) | (fh << 15); - //} - //public void DecodeIndex(int index) - //{ - // fv = index & 7; - // v = (index >> 3) & 1; - // h = (index >> 4) & 1; - // vt = (index >> 5) & 0x1F; - // ht = (index >> 10) & 0x1F; - // fh = (index >> 15) & 7; - //} - - //const int tbl_size = 1 << 18; - //int[] tbl_increment_hsc = new int[tbl_size]; - //int[] tbl_increment_vs = new int[tbl_size]; - //public void BuildTables() - //{ - // for (int i = 0; i < tbl_size; i++) - // { - // DecodeIndex(i); - // increment_hsc(); - // tbl_increment_hsc[i] = ComputeIndex(); - // DecodeIndex(i); - // increment_vs(); - // tbl_increment_vs[i] = ComputeIndex(); - // } - //} - - public void reset() - { - fv = v = h = vt = ht = 0; - fh = 0; - _fv = _v = _h = _vt = _ht = 0; - status.cycle = 0; - status.sl = 241; - } - - public void install_latches() - { - fv = _fv; - v = _v; - h = _h; - vt = _vt; - ht = _ht; - } - - public void install_h_latches() - { - ht = _ht; - h = _h; - } - - public void clear_latches() - { - _fv = _v = _h = _vt = _ht = 0; - fh = 0; - } - - public void increment_hsc() - { - //The first one, the horizontal scroll counter, consists of 6 bits, and is - //made up by daisy-chaining the HT counter to the H counter. The HT counter is - //then clocked every 8 pixel dot clocks (or every 8/3 CPU clock cycles). - ht++; - h += (ht >> 5); - ht &= 31; - h &= 1; - } - - public void increment_vs() - { - fv++; - int fv_overflow = (fv >> 3); - vt += fv_overflow; - vt &= 31; //fixed tecmo super bowl - if (vt == 30 && fv_overflow==1) //caution here (only do it at the exact instant of overflow) fixes p'radikus conflict - { - v++; - vt = 0; - } - fv &= 7; - v &= 1; - } - - public int get_ntread() - { - return 0x2000 | (v << 0xB) | (h << 0xA) | (vt << 5) | ht; - } - - public int get_2007access() - { - return ((fv & 3) << 0xC) | (v << 0xB) | (h << 0xA) | (vt << 5) | ht; - } - - //The PPU has an internal 4-position, 2-bit shifter, which it uses for - //obtaining the 2-bit palette select data during an attribute table byte - //fetch. To represent how this data is shifted in the diagram, letters a..c - //are used in the diagram to represent the right-shift position amount to - //apply to the data read from the attribute data (a is always 0). This is why - //you only see bits 0 and 1 used off the read attribute data in the diagram. - public int get_atread() - { - return 0x2000 | (v << 0xB) | (h << 0xA) | 0x3C0 | ((vt & 0x1C) << 1) | ((ht & 0x1C) >> 2); - } - - //address line 3 relates to the pattern table fetch occuring (the PPU always makes them in pairs). - public int get_ptread(int par) - { - int s = ppu.reg_2000.bg_pattern_hi; - return (s << 0xC) | (par << 0x4) | fv; - } - - public void increment2007(bool rendering, bool by32) - { - if (rendering) - { - //don't do this: - //if (by32) increment_vs(); - //else increment_hsc(); - //do this instead: - increment_vs(); //yes, even if we're moving by 32 - return; - } - - //If the VRAM address increment bit (2000.2) is clear (inc. amt. = 1), all the - //scroll counters are daisy-chained (in the order of HT, VT, H, V, FV) so that - //the carry out of each counter controls the next counter's clock rate. The - //result is that all 5 counters function as a single 15-bit one. Any access to - //2007 clocks the HT counter here. - // - //If the VRAM address increment bit is set (inc. amt. = 32), the only - //difference is that the HT counter is no longer being clocked, and the VT - //counter is now being clocked by access to 2007. - if (by32) - { - vt++; - } - else - { - ht++; - vt += (ht >> 5) & 1; - } - h += (vt >> 5); - v += (h >> 1); - fv += (v >> 1); - ht &= 31; - vt &= 31; - h &= 1; - v &= 1; - fv &= 7; - } - }; - - public sealed class Reg_2000 - { - PPU ppu; - public Reg_2000(PPU ppu) - { - this.ppu = ppu; - } - //these bits go straight into PPUR - //(00 = $2000; 01 = $2400; 02 = $2800; 03 = $2c00) - - public Bit vram_incr32; //(0: increment by 1, going across; 1: increment by 32, going down) - public Bit obj_pattern_hi; //Sprite pattern table address for 8x8 sprites (0: $0000; 1: $1000) - public Bit bg_pattern_hi; //Background pattern table address (0: $0000; 1: $1000) - public Bit obj_size_16; //Sprite size (0: 8x8 sprites; 1: 8x16 sprites) - public Bit ppu_layer; //PPU layer select (should always be 0 in the NES; some Nintendo arcade boards presumably had two PPUs) - public Bit vblank_nmi_gen; //Vertical blank NMI generation (0: off; 1: on) - - - public byte Value - { - get - { - return (byte)(ppu.ppur._h | (ppu.ppur._v << 1) | (vram_incr32 << 2) | (obj_pattern_hi << 3) | (bg_pattern_hi << 4) | (obj_size_16 << 5) | (ppu_layer << 6) | (vblank_nmi_gen << 7)); - } - set - { - ppu.ppur._h = value & 1; - ppu.ppur._v = (value >> 1) & 1; - vram_incr32 = (value >> 2) & 1; - obj_pattern_hi = (value >> 3) & 1; - bg_pattern_hi = (value >> 4) & 1; - obj_size_16 = (value >> 5) & 1; - ppu_layer = (value >> 6) & 1; - vblank_nmi_gen = (value >> 7) & 1; - } - } - } - - - Bit Reg2002_objoverflow; //Sprite overflow. The PPU can handle only eight sprites on one scanline and sets this bit if it starts drawing sprites. - Bit Reg2002_objhit; //Sprite 0 overlap. Set when a nonzero pixel of sprite 0 is drawn overlapping a nonzero background pixel. Used for raster timing. - Bit Reg2002_vblank_active; //Vertical blank start (0: has not started; 1: has started) - bool Reg2002_vblank_active_pending; //set if Reg2002_vblank_active is pending - bool Reg2002_vblank_clear_pending; //ppu's clear of vblank flag is pending - public PPUREGS ppur; - public Reg_2000 reg_2000; - public Reg_2001 reg_2001; - byte reg_2003; - void regs_reset() - { - //TODO - would like to reconstitute the entire PPU instead of all this.. - reg_2000 = new Reg_2000(this); - reg_2001 = new Reg_2001(); - ppur = new PPUREGS(this); - Reg2002_objoverflow = false; - Reg2002_objhit = false; - Reg2002_vblank_active = false; - PPUGenLatch = 0; - reg_2003 = 0; - vtoggle = false; - VRAMBuffer = 0; - } - //--------------------- - - //PPU CONTROL (write) - void write_2000(byte value) - { - if (!reg_2000.vblank_nmi_gen & ((value & 0x80) != 0) && (Reg2002_vblank_active) && !Reg2002_vblank_clear_pending) - { - //if we just unleashed the vblank interrupt then activate it now - NMI_PendingInstructions = 2; - } - reg_2000.Value = value; - } - byte read_2000() { return PPUGenLatch; } - byte peek_2000() { return PPUGenLatch; } - - //PPU MASK (write) - void write_2001(byte value) - { - //printf("%04x:$%02x, %d\n",A,V,scanline); - reg_2001.Value = value; - } - byte read_2001() { return PPUGenLatch; } - byte peek_2001() { return PPUGenLatch; } - - //PPU STATUS (read) - void write_2002(byte value) { } - byte read_2002() - { - //once we thought we clear latches here, but that caused midframe glitches. - //i think we should only reset the state machine for 2005/2006 - //ppur.clear_latches(); - - byte ret = peek_2002(); - - vtoggle = false; - Reg2002_vblank_active = 0; - Reg2002_vblank_active_pending = false; - - return ret; - } - byte peek_2002() - { - return (byte)((Reg2002_vblank_active << 7) | (Reg2002_objhit << 6) | (Reg2002_objoverflow << 5) | (PPUGenLatch & 0x1F)); - } - - void clear_2002() - { - Reg2002_objhit = Reg2002_objoverflow = 0; - Reg2002_vblank_clear_pending = true; - } - - //OAM ADDRESS (write) - void write_2003(byte value) - { - //just record the oam buffer write target - reg_2003 = value; - } - byte read_2003() { return PPUGenLatch; } - byte peek_2003() { return PPUGenLatch; } - - //OAM DATA (write) - void write_2004(byte value) - { - if ((reg_2003 & 3) == 2) value &= 0xE3; //some of the OAM bits are unwired so we mask them out here - //otherwise we just write this value and move on to the next oam byte - OAM[reg_2003] = value; - reg_2003++; - } - byte read_2004() { return OAM[reg_2003]; } - byte peek_2004() { return OAM[reg_2003]; } - - //SCROLL (write) - void write_2005(byte value) - { - if (!vtoggle) - { - ppur._ht= value >> 3; - ppur.fh = value & 7; - //nes.LogLine("scroll wrote ht = {0} and fh = {1}", ppur._ht, ppur.fh); - } - else - { - ppur._vt = value >> 3; - ppur._fv = value & 7; - //nes.LogLine("scroll wrote vt = {0} and fv = {1}", ppur._vt, ppur._fv); - } - vtoggle ^= true; - } - byte read_2005() { return PPUGenLatch; } - byte peek_2005() { return PPUGenLatch; } - - //VRAM address register (write) - void write_2006(byte value) - { - if (!vtoggle) - { - ppur._vt &= 0x07; - ppur._vt |= (value & 0x3) << 3; - ppur._h = (value >> 2) & 1; - ppur._v = (value >> 3) & 1; - ppur._fv = (value >> 4) & 3; - //nes.LogLine("addr wrote fv = {0}", ppur._fv); - } - else - { - ppur._vt &= 0x18; - ppur._vt |= (value >> 5); - ppur._ht = value & 31; - ppur.install_latches(); - //nes.LogLine("addr wrote vt = {0}, ht = {1}", ppur._vt, ppur._ht); - - //normally the address isnt observed by the board till it gets clocked by a read or write. - //but maybe thats just because a ppu read/write shoves it on the address bus - //apparently this shoves it on the address bus, too, or else blargg's mmc3 tests dont pass - nes.Board.AddressPPU(ppur.get_2007access()); - } - - vtoggle ^= true; - } - byte read_2006() { return PPUGenLatch; } - byte peek_2006() { return PPUGenLatch; } - - //VRAM data register (r/w) - void write_2007(byte value) - { - //does this take 4x longer? nestopia indicates so perhaps... - - int addr = ppur.get_2007access() & 0x3FFF; - if ((addr & 0x3F00) == 0x3F00) - { - //handle palette. this is being done nestopia style, because i found some documentation for it (appendix 1) - addr &= 0x1F; - byte color = (byte)(value & 0x3F); //are these bits really unwired? can they be read back somehow? - - //this little hack will help you debug things while the screen is black - //color = (byte)(addr & 0x3F); - - PALRAM[addr] = color; - if ((addr & 3) == 0) - { - PALRAM[addr ^ 0x10] = color; - } - } - else - { - ppubus_write(addr, value); - } - - ppur.increment2007(ppur.status.rendering && reg_2001.PPUON, reg_2000.vram_incr32 != 0); - - //see comments in $2006 - nes.Board.AddressPPU(ppur.get_2007access()); - } - byte read_2007() - { - int addr = ppur.get_2007access() & 0x3FFF; - - //ordinarily we return the buffered values - byte ret = VRAMBuffer; - - //in any case, we read from the ppu bus - VRAMBuffer = ppubus_read(addr,false); - - //but reads from the palette are implemented in the PPU and return immediately - if ((addr & 0x3F00) == 0x3F00) - { - //TODO apply greyscale shit? - ret = PALRAM[addr & 0x1F]; - } - - ppur.increment2007(ppur.status.rendering && reg_2001.PPUON, reg_2000.vram_incr32 != 0); - - //see comments in $2006 - nes.Board.AddressPPU(ppur.get_2007access()); - - return ret; - } - byte peek_2007() - { - int addr = ppur.get_2007access() & 0x3FFF; - - //ordinarily we return the buffered values - byte ret = VRAMBuffer; - - //in any case, we read from the ppu bus - // can't do this in peek; updates the value that will be used later - // VRAMBuffer = ppubus_peek(addr); - - //but reads from the palette are implemented in the PPU and return immediately - if ((addr & 0x3F00) == 0x3F00) - { - //TODO apply greyscale shit? - ret = PALRAM[addr & 0x1F]; - } - - return ret; - } - //-------- - - public byte ReadReg(int addr) - { - switch (addr) - { - case 0: return read_2000(); case 1: return read_2001(); case 2: return read_2002(); case 3: return read_2003(); - case 4: return read_2004(); case 5: return read_2005(); case 6: return read_2006(); case 7: return read_2007(); - default: throw new InvalidOperationException(); - } - } - public byte PeekReg(int addr) - { - switch (addr) - { - case 0: return peek_2000(); case 1: return peek_2001(); case 2: return peek_2002(); case 3: return peek_2003(); - case 4: return peek_2004(); case 5: return peek_2005(); case 6: return peek_2006(); case 7: return peek_2007(); - default: throw new InvalidOperationException(); - } - } - public void WriteReg(int addr, byte value) - { - PPUGenLatch = value; - switch (addr) - { - case 0: write_2000(value); break; case 1: write_2001(value); break; case 2: write_2002(value); break; case 3: write_2003(value); break; - case 4: write_2004(value); break; case 5: write_2005(value); break; case 6: write_2006(value); break; case 7: write_2007(value); break; - default: throw new InvalidOperationException(); - } - } } + + + public struct PPUSTATUS + { + public int sl; + public bool rendering { get { return sl >= 0 && sl < 241; } } + public int cycle; + } + + //uses the internal counters concept at http://nesdev.icequake.net/PPU%20addressing.txt + //TODO - this should be turned into a state machine + public sealed class PPUREGS + { + PPU ppu; + public PPUREGS(PPU ppu) + { + this.ppu = ppu; + reset(); + } + + public void SyncState(Serializer ser) + { + ser.Sync("fv", ref fv); + ser.Sync("v", ref v); + ser.Sync("h", ref h); + ser.Sync("vt", ref vt); + ser.Sync("ht", ref ht); + ser.Sync("_fv", ref _fv); + ser.Sync("_v", ref _v); + ser.Sync("_h", ref _h); + ser.Sync("_vt", ref _vt); + ser.Sync("_ht", ref _ht); + ser.Sync("fh", ref fh); + ser.Sync("status.cycle", ref status.cycle); + int junk = 0; + ser.Sync("status.end_cycle", ref junk); + ser.Sync("status.sl", ref status.sl); + } + + //normal clocked regs. as the game can interfere with these at any time, they need to be savestated + public int fv;//3 + public int v;//1 + public int h;//1 + public int vt;//5 + public int ht;//5 + + //temp unlatched regs (need savestating, can be written to at any time) + public int _fv, _vt, _v, _h, _ht; + + //other regs that need savestating + public int fh;//3 (horz scroll) + + //cached state data. these are always reset at the beginning of a frame and don't need saving + //but just to be safe, we're gonna save it + public PPUSTATUS status = new PPUSTATUS(); + + //public int ComputeIndex() + //{ + // return fv | (v << 3) | (h << 4) | (vt << 5) | (ht << 10) | (fh << 15); + //} + //public void DecodeIndex(int index) + //{ + // fv = index & 7; + // v = (index >> 3) & 1; + // h = (index >> 4) & 1; + // vt = (index >> 5) & 0x1F; + // ht = (index >> 10) & 0x1F; + // fh = (index >> 15) & 7; + //} + + //const int tbl_size = 1 << 18; + //int[] tbl_increment_hsc = new int[tbl_size]; + //int[] tbl_increment_vs = new int[tbl_size]; + //public void BuildTables() + //{ + // for (int i = 0; i < tbl_size; i++) + // { + // DecodeIndex(i); + // increment_hsc(); + // tbl_increment_hsc[i] = ComputeIndex(); + // DecodeIndex(i); + // increment_vs(); + // tbl_increment_vs[i] = ComputeIndex(); + // } + //} + + public void reset() + { + fv = v = h = vt = ht = 0; + fh = 0; + _fv = _v = _h = _vt = _ht = 0; + status.cycle = 0; + status.sl = 241; + } + + public void install_latches() + { + fv = _fv; + v = _v; + h = _h; + vt = _vt; + ht = _ht; + } + + public void install_h_latches() + { + ht = _ht; + h = _h; + } + + public void clear_latches() + { + _fv = _v = _h = _vt = _ht = 0; + fh = 0; + } + + public void increment_hsc() + { + //The first one, the horizontal scroll counter, consists of 6 bits, and is + //made up by daisy-chaining the HT counter to the H counter. The HT counter is + //then clocked every 8 pixel dot clocks (or every 8/3 CPU clock cycles). + ht++; + h += (ht >> 5); + ht &= 31; + h &= 1; + } + + public void increment_vs() + { + fv++; + int fv_overflow = (fv >> 3); + vt += fv_overflow; + vt &= 31; //fixed tecmo super bowl + if (vt == 30 && fv_overflow==1) //caution here (only do it at the exact instant of overflow) fixes p'radikus conflict + { + v++; + vt = 0; + } + fv &= 7; + v &= 1; + } + + public int get_ntread() + { + return 0x2000 | (v << 0xB) | (h << 0xA) | (vt << 5) | ht; + } + + public int get_2007access() + { + return ((fv & 3) << 0xC) | (v << 0xB) | (h << 0xA) | (vt << 5) | ht; + } + + //The PPU has an internal 4-position, 2-bit shifter, which it uses for + //obtaining the 2-bit palette select data during an attribute table byte + //fetch. To represent how this data is shifted in the diagram, letters a..c + //are used in the diagram to represent the right-shift position amount to + //apply to the data read from the attribute data (a is always 0). This is why + //you only see bits 0 and 1 used off the read attribute data in the diagram. + public int get_atread() + { + return 0x2000 | (v << 0xB) | (h << 0xA) | 0x3C0 | ((vt & 0x1C) << 1) | ((ht & 0x1C) >> 2); + } + + //address line 3 relates to the pattern table fetch occuring (the PPU always makes them in pairs). + public int get_ptread(int par) + { + int s = ppu.reg_2000.bg_pattern_hi; + return (s << 0xC) | (par << 0x4) | fv; + } + + public void increment2007(bool rendering, bool by32) + { + if (rendering) + { + //don't do this: + //if (by32) increment_vs(); + //else increment_hsc(); + //do this instead: + increment_vs(); //yes, even if we're moving by 32 + return; + } + + //If the VRAM address increment bit (2000.2) is clear (inc. amt. = 1), all the + //scroll counters are daisy-chained (in the order of HT, VT, H, V, FV) so that + //the carry out of each counter controls the next counter's clock rate. The + //result is that all 5 counters function as a single 15-bit one. Any access to + //2007 clocks the HT counter here. + // + //If the VRAM address increment bit is set (inc. amt. = 32), the only + //difference is that the HT counter is no longer being clocked, and the VT + //counter is now being clocked by access to 2007. + if (by32) + { + vt++; + } + else + { + ht++; + vt += (ht >> 5) & 1; + } + h += (vt >> 5); + v += (h >> 1); + fv += (v >> 1); + ht &= 31; + vt &= 31; + h &= 1; + v &= 1; + fv &= 7; + } + }; + + public sealed class Reg_2000 + { + PPU ppu; + public Reg_2000(PPU ppu) + { + this.ppu = ppu; + } + //these bits go straight into PPUR + //(00 = $2000; 01 = $2400; 02 = $2800; 03 = $2c00) + + public Bit vram_incr32; //(0: increment by 1, going across; 1: increment by 32, going down) + public Bit obj_pattern_hi; //Sprite pattern table address for 8x8 sprites (0: $0000; 1: $1000) + public Bit bg_pattern_hi; //Background pattern table address (0: $0000; 1: $1000) + public Bit obj_size_16; //Sprite size (0: 8x8 sprites; 1: 8x16 sprites) + public Bit ppu_layer; //PPU layer select (should always be 0 in the NES; some Nintendo arcade boards presumably had two PPUs) + public Bit vblank_nmi_gen; //Vertical blank NMI generation (0: off; 1: on) + + + public byte Value + { + get + { + return (byte)(ppu.ppur._h | (ppu.ppur._v << 1) | (vram_incr32 << 2) | (obj_pattern_hi << 3) | (bg_pattern_hi << 4) | (obj_size_16 << 5) | (ppu_layer << 6) | (vblank_nmi_gen << 7)); + } + set + { + ppu.ppur._h = value & 1; + ppu.ppur._v = (value >> 1) & 1; + vram_incr32 = (value >> 2) & 1; + obj_pattern_hi = (value >> 3) & 1; + bg_pattern_hi = (value >> 4) & 1; + obj_size_16 = (value >> 5) & 1; + ppu_layer = (value >> 6) & 1; + vblank_nmi_gen = (value >> 7) & 1; + } + } + } + + + Bit Reg2002_objoverflow; //Sprite overflow. The PPU can handle only eight sprites on one scanline and sets this bit if it starts drawing sprites. + Bit Reg2002_objhit; //Sprite 0 overlap. Set when a nonzero pixel of sprite 0 is drawn overlapping a nonzero background pixel. Used for raster timing. + Bit Reg2002_vblank_active; //Vertical blank start (0: has not started; 1: has started) + bool Reg2002_vblank_active_pending; //set if Reg2002_vblank_active is pending + bool Reg2002_vblank_clear_pending; //ppu's clear of vblank flag is pending + public PPUREGS ppur; + public Reg_2000 reg_2000; + public Reg_2001 reg_2001; + byte reg_2003; + void regs_reset() + { + //TODO - would like to reconstitute the entire PPU instead of all this.. + reg_2000 = new Reg_2000(this); + reg_2001 = new Reg_2001(); + ppur = new PPUREGS(this); + Reg2002_objoverflow = false; + Reg2002_objhit = false; + Reg2002_vblank_active = false; + PPUGenLatch = 0; + reg_2003 = 0; + vtoggle = false; + VRAMBuffer = 0; + } + //--------------------- + + //PPU CONTROL (write) + void write_2000(byte value) + { + if (!reg_2000.vblank_nmi_gen & ((value & 0x80) != 0) && (Reg2002_vblank_active) && !Reg2002_vblank_clear_pending) + { + //if we just unleashed the vblank interrupt then activate it now + NMI_PendingInstructions = 2; + } + reg_2000.Value = value; + } + byte read_2000() { return PPUGenLatch; } + byte peek_2000() { return PPUGenLatch; } + + //PPU MASK (write) + void write_2001(byte value) + { + //printf("%04x:$%02x, %d\n",A,V,scanline); + reg_2001.Value = value; + } + byte read_2001() { return PPUGenLatch; } + byte peek_2001() { return PPUGenLatch; } + + //PPU STATUS (read) + void write_2002(byte value) { } + byte read_2002() + { + //once we thought we clear latches here, but that caused midframe glitches. + //i think we should only reset the state machine for 2005/2006 + //ppur.clear_latches(); + + byte ret = peek_2002(); + + vtoggle = false; + Reg2002_vblank_active = 0; + Reg2002_vblank_active_pending = false; + + return ret; + } + byte peek_2002() + { + return (byte)((Reg2002_vblank_active << 7) | (Reg2002_objhit << 6) | (Reg2002_objoverflow << 5) | (PPUGenLatch & 0x1F)); + } + + void clear_2002() + { + Reg2002_objhit = Reg2002_objoverflow = 0; + Reg2002_vblank_clear_pending = true; + } + + //OAM ADDRESS (write) + void write_2003(byte value) + { + //just record the oam buffer write target + reg_2003 = value; + } + byte read_2003() { return PPUGenLatch; } + byte peek_2003() { return PPUGenLatch; } + + //OAM DATA (write) + void write_2004(byte value) + { + if ((reg_2003 & 3) == 2) value &= 0xE3; //some of the OAM bits are unwired so we mask them out here + //otherwise we just write this value and move on to the next oam byte + OAM[reg_2003] = value; + reg_2003++; + } + byte read_2004() { return OAM[reg_2003]; } + byte peek_2004() { return OAM[reg_2003]; } + + //SCROLL (write) + void write_2005(byte value) + { + if (!vtoggle) + { + ppur._ht= value >> 3; + ppur.fh = value & 7; + //nes.LogLine("scroll wrote ht = {0} and fh = {1}", ppur._ht, ppur.fh); + } + else + { + ppur._vt = value >> 3; + ppur._fv = value & 7; + //nes.LogLine("scroll wrote vt = {0} and fv = {1}", ppur._vt, ppur._fv); + } + vtoggle ^= true; + } + byte read_2005() { return PPUGenLatch; } + byte peek_2005() { return PPUGenLatch; } + + //VRAM address register (write) + void write_2006(byte value) + { + if (!vtoggle) + { + ppur._vt &= 0x07; + ppur._vt |= (value & 0x3) << 3; + ppur._h = (value >> 2) & 1; + ppur._v = (value >> 3) & 1; + ppur._fv = (value >> 4) & 3; + //nes.LogLine("addr wrote fv = {0}", ppur._fv); + } + else + { + ppur._vt &= 0x18; + ppur._vt |= (value >> 5); + ppur._ht = value & 31; + ppur.install_latches(); + //nes.LogLine("addr wrote vt = {0}, ht = {1}", ppur._vt, ppur._ht); + + //normally the address isnt observed by the board till it gets clocked by a read or write. + //but maybe thats just because a ppu read/write shoves it on the address bus + //apparently this shoves it on the address bus, too, or else blargg's mmc3 tests dont pass + nes.Board.AddressPPU(ppur.get_2007access()); + } + + vtoggle ^= true; + } + byte read_2006() { return PPUGenLatch; } + byte peek_2006() { return PPUGenLatch; } + + //VRAM data register (r/w) + void write_2007(byte value) + { + //does this take 4x longer? nestopia indicates so perhaps... + + int addr = ppur.get_2007access() & 0x3FFF; + if ((addr & 0x3F00) == 0x3F00) + { + //handle palette. this is being done nestopia style, because i found some documentation for it (appendix 1) + addr &= 0x1F; + byte color = (byte)(value & 0x3F); //are these bits really unwired? can they be read back somehow? + + //this little hack will help you debug things while the screen is black + //color = (byte)(addr & 0x3F); + + PALRAM[addr] = color; + if ((addr & 3) == 0) + { + PALRAM[addr ^ 0x10] = color; + } + } + else + { + ppubus_write(addr, value); + } + + ppur.increment2007(ppur.status.rendering && reg_2001.PPUON, reg_2000.vram_incr32 != 0); + + //see comments in $2006 + nes.Board.AddressPPU(ppur.get_2007access()); + } + byte read_2007() + { + int addr = ppur.get_2007access() & 0x3FFF; + + //ordinarily we return the buffered values + byte ret = VRAMBuffer; + + //in any case, we read from the ppu bus + VRAMBuffer = ppubus_read(addr,false); + + //but reads from the palette are implemented in the PPU and return immediately + if ((addr & 0x3F00) == 0x3F00) + { + //TODO apply greyscale shit? + ret = PALRAM[addr & 0x1F]; + } + + ppur.increment2007(ppur.status.rendering && reg_2001.PPUON, reg_2000.vram_incr32 != 0); + + //see comments in $2006 + nes.Board.AddressPPU(ppur.get_2007access()); + + return ret; + } + byte peek_2007() + { + int addr = ppur.get_2007access() & 0x3FFF; + + //ordinarily we return the buffered values + byte ret = VRAMBuffer; + + //in any case, we read from the ppu bus + // can't do this in peek; updates the value that will be used later + // VRAMBuffer = ppubus_peek(addr); + + //but reads from the palette are implemented in the PPU and return immediately + if ((addr & 0x3F00) == 0x3F00) + { + //TODO apply greyscale shit? + ret = PALRAM[addr & 0x1F]; + } + + return ret; + } + //-------- + + public byte ReadReg(int addr) + { + switch (addr) + { + case 0: return read_2000(); case 1: return read_2001(); case 2: return read_2002(); case 3: return read_2003(); + case 4: return read_2004(); case 5: return read_2005(); case 6: return read_2006(); case 7: return read_2007(); + default: throw new InvalidOperationException(); + } + } + public byte PeekReg(int addr) + { + switch (addr) + { + case 0: return peek_2000(); case 1: return peek_2001(); case 2: return peek_2002(); case 3: return peek_2003(); + case 4: return peek_2004(); case 5: return peek_2005(); case 6: return peek_2006(); case 7: return peek_2007(); + default: throw new InvalidOperationException(); + } + } + public void WriteReg(int addr, byte value) + { + PPUGenLatch = value; + switch (addr) + { + case 0: write_2000(value); break; case 1: write_2001(value); break; case 2: write_2002(value); break; case 3: write_2003(value); break; + case 4: write_2004(value); break; case 5: write_2005(value); break; case 6: write_2006(value); break; case 7: write_2007(value); break; + default: throw new InvalidOperationException(); + } + } } } diff --git a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.run.cs b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.run.cs index 307c79177c..2dfc15cc7d 100644 --- a/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.run.cs +++ b/BizHawk.Emulation.Cores/Consoles/Nintendo/NES/PPU.run.cs @@ -8,464 +8,461 @@ using BizHawk.Common; namespace BizHawk.Emulation.Cores.Nintendo.NES { - partial class NES + sealed partial class PPU { - sealed partial class PPU + const int kFetchTime = 2; + + struct BGDataRecord { + public byte nt, at; + public byte pt_0, pt_1; + }; + + public short[] xbuf = new short[256*240]; + + int ppu_addr_temp; + void Read_bgdata(ref BGDataRecord bgdata) { - const int kFetchTime = 2; - - struct BGDataRecord { - public byte nt, at; - public byte pt_0, pt_1; - }; - - public short[] xbuf = new short[256*240]; - - int ppu_addr_temp; - void Read_bgdata(ref BGDataRecord bgdata) + for (int i = 0; i < 8; i++) + Read_bgdata(i,ref bgdata); + } + void Read_bgdata(int cycle, ref BGDataRecord bgdata) + { + switch (cycle) { - for (int i = 0; i < 8; i++) - Read_bgdata(i,ref bgdata); - } - void Read_bgdata(int cycle, ref BGDataRecord bgdata) - { - switch (cycle) - { - case 0: - ppu_addr_temp = ppur.get_ntread(); - bgdata.nt = ppubus_read(ppu_addr_temp, true); - runppu(1); - break; - case 1: - runppu(1); - break; - case 2: - { - ppu_addr_temp = ppur.get_atread(); - byte at = ppubus_read(ppu_addr_temp, true); - - //modify at to get appropriate palette shift - if ((ppur.vt & 2) != 0) at >>= 4; - if ((ppur.ht & 2) != 0) at >>= 2; - at &= 0x03; - at <<= 2; - bgdata.at = at; - - //horizontal scroll clocked at cycle 3 and then - //vertical scroll at 251 - runppu(1); - if (reg_2001.PPUON) - { - ppur.increment_hsc(); - if (ppur.status.cycle == 251) - ppur.increment_vs(); - } - break; - } - case 3: - runppu(1); - break; - case 4: - ppu_addr_temp = ppur.get_ptread(bgdata.nt); - bgdata.pt_0 = ppubus_read(ppu_addr_temp, true); - runppu(1); - break; - case 5: - runppu(1); - break; - case 6: - ppu_addr_temp |= 8; - bgdata.pt_1 = ppubus_read(ppu_addr_temp, true); - runppu(1); - break; - case 7: - runppu(1); - break; - } //switch(cycle) - } - - unsafe struct TempOAM - { - public fixed byte oam[4]; - public fixed byte patterns[2]; - public byte index; - public byte present; - } - - //TODO - check flashing sirens in werewolf - short PaletteAdjustPixel(int pixel) - { - //tack on the deemph bits. THESE MAY BE ORDERED WRONG. PLEASE CHECK IN THE PALETTE CODE - return (short)(pixel | reg_2001.intensity_lsl_6); - } - - const int kLineTime = 341; - public unsafe void FrameAdvance() - { - BGDataRecord *bgdata = stackalloc BGDataRecord[34]; //one at the end is junk, it can never be rendered - - //262 scanlines - if (ppudead != 0) - { - FrameAdvance_ppudead(); - return; - } - - Reg2002_vblank_active_pending = true; - ppuphase = PPUPHASE.VBL; - ppur.status.sl = 241; - - //Not sure if this is correct. According to Matt Conte and my own tests, it is. Timing is probably off, though. - //NOTE: Not having this here breaks a Super Donkey Kong game. - reg_2003 = 0; - - //this was repeatedly finetuned from the fceux days thrugh the old cpu core and into the new one to pass 05-nmi_timing.nes - //note that there is still some leniency. for instance, 4,2 will pass in addition to 3,3 - const int delay = 6; - runppu(3); - bool nmi_destiny = reg_2000.vblank_nmi_gen && Reg2002_vblank_active; - runppu(3); - if (nmi_destiny) TriggerNMI(); - runppu(postNMIlines * kLineTime - delay); - - //this seems to run just before the dummy scanline begins - clear_2002(); - - TempOAM* oams = stackalloc TempOAM[128]; - int* oamcounts = stackalloc int[2]; - int oamslot=0; - int oamcount=0; - - idleSynch ^= true; - - //render 241 scanlines (including 1 dummy at beginning) - for (int sl = 0; sl < 241; sl++) - { - ppur.status.cycle = 0; - - ppur.status.sl = sl; - - int yp = sl - 1; - ppuphase = PPUPHASE.BG; - - if (NTViewCallback != null && yp == NTViewCallback.Scanline) NTViewCallback.Callback(); - if (PPUViewCallback != null && yp == PPUViewCallback.Scanline) PPUViewCallback.Callback(); - - //twiddle the oam buffers - int scanslot = oamslot ^ 1; - int renderslot = oamslot; - oamslot ^= 1; - - oamcount = oamcounts[renderslot]; - - //ok, we're also going to draw here. - //unless we're on the first dummy scanline - if (sl != 0) + case 0: + ppu_addr_temp = ppur.get_ntread(); + bgdata.nt = ppubus_read(ppu_addr_temp, true); + runppu(1); + break; + case 1: + runppu(1); + break; + case 2: { - //the main scanline rendering loop: - //32 times, we will fetch a tile and then render 8 pixels. - //two of those tiles were read in the last scanline. - int yp_shift = yp << 8; - for (int xt = 0; xt < 32; xt++) - { - int xstart = xt << 3; - oamcount = oamcounts[renderslot]; - int target = yp_shift + xstart; - int rasterpos = xstart; + ppu_addr_temp = ppur.get_atread(); + byte at = ppubus_read(ppu_addr_temp, true); - //check all the conditions that can cause things to render in these 8px - bool renderspritenow = reg_2001.show_obj && (xt > 0 || reg_2001.show_obj_leftmost); - bool renderbgnow = reg_2001.show_bg && (xt > 0 || reg_2001.show_bg_leftmost); + //modify at to get appropriate palette shift + if ((ppur.vt & 2) != 0) at >>= 4; + if ((ppur.ht & 2) != 0) at >>= 2; + at &= 0x03; + at <<= 2; + bgdata.at = at; - for (int xp = 0; xp < 8; xp++, rasterpos++) - { - //process the current clock's worth of bg data fetching - //this needs to be split into 8 pieces or else exact sprite 0 hitting wont work due to the cpu not running while the sprite renders below - Read_bgdata(xp, ref bgdata[xt + 2]); - - //bg pos is different from raster pos due to its offsetability. - //so adjust for that here - int bgpos = rasterpos + ppur.fh; - int bgpx = bgpos & 7; - int bgtile = bgpos >> 3; - - int pixel = 0, pixelcolor; - - //generate the BG data - if (renderbgnow) - { - byte pt_0 = bgdata[bgtile].pt_0; - byte pt_1 = bgdata[bgtile].pt_1; - int sel = 7 - bgpx; - pixel = ((pt_0 >> sel) & 1) | (((pt_1 >> sel) & 1) << 1); - if (pixel != 0) - pixel |= bgdata[bgtile].at; - pixelcolor = PALRAM[pixel]; - } - else - { - if (!renderspritenow) - { - //according to qeed's doc, use palette 0 or $2006's value if it is & 0x3Fxx - //EDIT - this requires corect emulation of PPU OFF state, and seems only to apply when the PPU is OFF - // not sure why this was off, but having it on fixes full_nes_palette, and it's a behavior that's been - // verified on the decapped PPU - - // if there's anything wrong with how we're doing this, someone please chime in - int addr = ppur.get_2007access(); - if ((addr & 0x3F00) == 0x3F00) - { - // System.Console.WriteLine("{0:X4}", addr); - pixel = addr & 0x1F; - } - } - pixelcolor = PALRAM[pixel]; - pixelcolor |= 0x8000; //whats this? i think its a flag to indicate a hidden background to be used by the canvas filling logic later - } - - if (!nes.Settings.DispBackground) - pixelcolor = 0x8000; //whats this? i think its a flag to indicate a hidden background to be used by the canvas filling logic later - - //look for a sprite to be drawn - bool havepixel = false; - int renderslot_shift = renderslot << 6; - for (int s = 0; s < oamcount; s++) - { - TempOAM* oam = &oams[renderslot_shift + s]; - int x = oam->oam[3]; - if (rasterpos >= x && rasterpos < x + 8) - { - //build the pixel. - //fetch the LSB of the patterns - int spixel = oam->patterns[0] & 1; - spixel |= (oam->patterns[1] & 1) << 1; - - //shift down the patterns so the next pixel is in the LSB - oam->patterns[0] >>= 1; - oam->patterns[1] >>= 1; - - //bail out if we already have a pixel from a higher priority sprite. - //notice that we continue looping anyway, so that we can shift down the patterns - //transparent pixel bailout - if (!renderspritenow || havepixel || spixel == 0) continue; - - havepixel = true; - - //TODO - make sure we dont trigger spritehit if the edges are masked for either BG or OBJ - //spritehit: - //1. is it sprite#0? - //2. is the bg pixel nonzero? - //then, it is spritehit. - Reg2002_objhit |= (oam->index == 0 && pixel != 0 && rasterpos < 255); - //priority handling, if in front of BG: - bool drawsprite = !(((oam->oam[2] & 0x20) != 0) && ((pixel & 3) != 0)); - if (drawsprite && nes.Settings.DispSprites) - { - //bring in the palette bits and palettize - spixel |= (oam->oam[2] & 3) << 2; - //save it for use in the framebuffer - pixelcolor = PALRAM[0x10 + spixel]; - } - } //rasterpos in sprite range - } //oamcount loop - if (reg_2001.color_disable) - pixelcolor &= 0x30; - - xbuf[target] = PaletteAdjustPixel(pixelcolor); - - target++; - } //loop across 8 pixels - } //loop across 32 tiles - } - else - for (int xt = 0; xt < 32; xt++) - Read_bgdata(ref bgdata[xt + 2]); - - //look for sprites (was supposed to run concurrent with bg rendering) - oamcounts[scanslot] = 0; - oamcount = 0; - int spriteHeight = reg_2000.obj_size_16 ? 16 : 8; - - int scanslot_lshift = scanslot << 6; - - for (int i = 0; i < 64; i++) - { - oams[scanslot_lshift + i].present = 0; - int spr = i * 4; - if (yp >= OAM[spr] && yp < OAM[spr] + spriteHeight) - { - //if we already have maxsprites, then this new one causes an overflow, - //set the flag and bail out. - //should we set this flag anyway?? - if (oamcount >= 8 && reg_2001.PPUON) - { - Reg2002_objoverflow = true; - if(!nes.Settings.AllowMoreThanEightSprites) - break; - } - //just copy some bytes into the internal sprite buffer - TempOAM* oam = &oams[scanslot_lshift + oamcount]; - for (int j = 0; j < 4; j++) - oam->oam[j] = OAM[spr + j]; - oam->present = 1; - //note that we stuff the oam index into [6]. - //i need to turn this into a struct so we can have fewer magic numbers - oams[scanslot_lshift + oamcount].index = (byte)i; - oamcount++; - } - } - oamcounts[scanslot] = oamcount; - - ppuphase = PPUPHASE.OBJ; - - //fetch sprite patterns - int oam_todo = oamcount; - if (oam_todo < 8) - oam_todo = 8; - for (int s = 0; s < oam_todo; s++) - { - //if this is a real sprite sprite, then it is not above the 8 sprite limit. - //this is how we support the no 8 sprite limit feature. - //not that at some point we may need a virtual CALL_PPUREAD which just peeks and doesnt increment any counters - //this could be handy for the debugging tools also - bool realSprite = (s < 8); - bool junksprite = (s >= oamcount || !reg_2001.PPUON); - - TempOAM* oam = &oams[scanslot_lshift + s]; - int line = yp - oam->oam[0]; - if ((oam->oam[2] & 0x80) != 0) //vflip - line = spriteHeight - line - 1; - - int patternNumber = oam->oam[1]; - int patternAddress; - - //create deterministic dummy fetch pattern. - if (oam->present == 0) - { - //according to nintendulator: - //* On the first empty sprite slot, read the Y-coordinate of sprite #63 followed by $FF for the remaining 7 cycles - //* On all subsequent empty sprite slots, read $FF for all 8 reads - //well, we shall just read $FF and that is good enough for now to make mmc3 work - patternNumber = 0xFF; - line = 0; - } - - //8x16 sprite handling: - if (reg_2000.obj_size_16) - { - int bank = (patternNumber & 1) << 12; - patternNumber = patternNumber & ~1; - patternNumber |= (line >> 3) & 1; - patternAddress = (patternNumber << 4) | bank; - } - else - patternAddress = (patternNumber << 4) | (reg_2000.obj_pattern_hi << 12); - - //offset into the pattern for the current line. - //tricky: tall sprites have already had lines>8 taken care of by getting a new pattern number above. - //so we just need the line offset for the second pattern - patternAddress += line & 7; - - //garbage nametable fetches + scroll resets - int garbage_todo = 2; - ppubus_read(ppur.get_ntread(), true); + //horizontal scroll clocked at cycle 3 and then + //vertical scroll at 251 + runppu(1); if (reg_2001.PPUON) { - if (sl == 0 && ppur.status.cycle == 304) - { - runppu(1); - if (reg_2001.PPUON) ppur.install_latches(); - runppu(1); - garbage_todo = 0; - } - if ((sl != 0) && ppur.status.cycle == 256) - { - runppu(1); - //at 257: 3d world runner is ugly if we do this at 256 - if (reg_2001.PPUON) ppur.install_h_latches(); - runppu(1); - garbage_todo = 0; - } + ppur.increment_hsc(); + if (ppur.status.cycle == 251) + ppur.increment_vs(); } - if (realSprite) runppu(garbage_todo); + break; + } + case 3: + runppu(1); + break; + case 4: + ppu_addr_temp = ppur.get_ptread(bgdata.nt); + bgdata.pt_0 = ppubus_read(ppu_addr_temp, true); + runppu(1); + break; + case 5: + runppu(1); + break; + case 6: + ppu_addr_temp |= 8; + bgdata.pt_1 = ppubus_read(ppu_addr_temp, true); + runppu(1); + break; + case 7: + runppu(1); + break; + } //switch(cycle) + } - ppubus_read(ppur.get_atread(), true); //at or nt? + unsafe struct TempOAM + { + public fixed byte oam[4]; + public fixed byte patterns[2]; + public byte index; + public byte present; + } + + //TODO - check flashing sirens in werewolf + short PaletteAdjustPixel(int pixel) + { + //tack on the deemph bits. THESE MAY BE ORDERED WRONG. PLEASE CHECK IN THE PALETTE CODE + return (short)(pixel | reg_2001.intensity_lsl_6); + } + + const int kLineTime = 341; + public unsafe void FrameAdvance() + { + BGDataRecord *bgdata = stackalloc BGDataRecord[34]; //one at the end is junk, it can never be rendered + + //262 scanlines + if (ppudead != 0) + { + FrameAdvance_ppudead(); + return; + } + + Reg2002_vblank_active_pending = true; + ppuphase = PPUPHASE.VBL; + ppur.status.sl = 241; + + //Not sure if this is correct. According to Matt Conte and my own tests, it is. Timing is probably off, though. + //NOTE: Not having this here breaks a Super Donkey Kong game. + reg_2003 = 0; + + //this was repeatedly finetuned from the fceux days thrugh the old cpu core and into the new one to pass 05-nmi_timing.nes + //note that there is still some leniency. for instance, 4,2 will pass in addition to 3,3 + const int delay = 6; + runppu(3); + bool nmi_destiny = reg_2000.vblank_nmi_gen && Reg2002_vblank_active; + runppu(3); + if (nmi_destiny) TriggerNMI(); + runppu(postNMIlines * kLineTime - delay); + + //this seems to run just before the dummy scanline begins + clear_2002(); + + TempOAM* oams = stackalloc TempOAM[128]; + int* oamcounts = stackalloc int[2]; + int oamslot=0; + int oamcount=0; + + idleSynch ^= true; + + //render 241 scanlines (including 1 dummy at beginning) + for (int sl = 0; sl < 241; sl++) + { + ppur.status.cycle = 0; + + ppur.status.sl = sl; + + int yp = sl - 1; + ppuphase = PPUPHASE.BG; + + if (NTViewCallback != null && yp == NTViewCallback.Scanline) NTViewCallback.Callback(); + if (PPUViewCallback != null && yp == PPUViewCallback.Scanline) PPUViewCallback.Callback(); + + //twiddle the oam buffers + int scanslot = oamslot ^ 1; + int renderslot = oamslot; + oamslot ^= 1; + + oamcount = oamcounts[renderslot]; + + //ok, we're also going to draw here. + //unless we're on the first dummy scanline + if (sl != 0) + { + //the main scanline rendering loop: + //32 times, we will fetch a tile and then render 8 pixels. + //two of those tiles were read in the last scanline. + int yp_shift = yp << 8; + for (int xt = 0; xt < 32; xt++) + { + int xstart = xt << 3; + oamcount = oamcounts[renderslot]; + int target = yp_shift + xstart; + int rasterpos = xstart; + + //check all the conditions that can cause things to render in these 8px + bool renderspritenow = reg_2001.show_obj && (xt > 0 || reg_2001.show_obj_leftmost); + bool renderbgnow = reg_2001.show_bg && (xt > 0 || reg_2001.show_bg_leftmost); + + for (int xp = 0; xp < 8; xp++, rasterpos++) + { + //process the current clock's worth of bg data fetching + //this needs to be split into 8 pieces or else exact sprite 0 hitting wont work due to the cpu not running while the sprite renders below + Read_bgdata(xp, ref bgdata[xt + 2]); + + //bg pos is different from raster pos due to its offsetability. + //so adjust for that here + int bgpos = rasterpos + ppur.fh; + int bgpx = bgpos & 7; + int bgtile = bgpos >> 3; + + int pixel = 0, pixelcolor; + + //generate the BG data + if (renderbgnow) + { + byte pt_0 = bgdata[bgtile].pt_0; + byte pt_1 = bgdata[bgtile].pt_1; + int sel = 7 - bgpx; + pixel = ((pt_0 >> sel) & 1) | (((pt_1 >> sel) & 1) << 1); + if (pixel != 0) + pixel |= bgdata[bgtile].at; + pixelcolor = PALRAM[pixel]; + } + else + { + if (!renderspritenow) + { + //according to qeed's doc, use palette 0 or $2006's value if it is & 0x3Fxx + //EDIT - this requires corect emulation of PPU OFF state, and seems only to apply when the PPU is OFF + // not sure why this was off, but having it on fixes full_nes_palette, and it's a behavior that's been + // verified on the decapped PPU + + // if there's anything wrong with how we're doing this, someone please chime in + int addr = ppur.get_2007access(); + if ((addr & 0x3F00) == 0x3F00) + { + // System.Console.WriteLine("{0:X4}", addr); + pixel = addr & 0x1F; + } + } + pixelcolor = PALRAM[pixel]; + pixelcolor |= 0x8000; //whats this? i think its a flag to indicate a hidden background to be used by the canvas filling logic later + } + + if (!nes.Settings.DispBackground) + pixelcolor = 0x8000; //whats this? i think its a flag to indicate a hidden background to be used by the canvas filling logic later + + //look for a sprite to be drawn + bool havepixel = false; + int renderslot_shift = renderslot << 6; + for (int s = 0; s < oamcount; s++) + { + TempOAM* oam = &oams[renderslot_shift + s]; + int x = oam->oam[3]; + if (rasterpos >= x && rasterpos < x + 8) + { + //build the pixel. + //fetch the LSB of the patterns + int spixel = oam->patterns[0] & 1; + spixel |= (oam->patterns[1] & 1) << 1; + + //shift down the patterns so the next pixel is in the LSB + oam->patterns[0] >>= 1; + oam->patterns[1] >>= 1; + + //bail out if we already have a pixel from a higher priority sprite. + //notice that we continue looping anyway, so that we can shift down the patterns + //transparent pixel bailout + if (!renderspritenow || havepixel || spixel == 0) continue; + + havepixel = true; + + //TODO - make sure we dont trigger spritehit if the edges are masked for either BG or OBJ + //spritehit: + //1. is it sprite#0? + //2. is the bg pixel nonzero? + //then, it is spritehit. + Reg2002_objhit |= (oam->index == 0 && pixel != 0 && rasterpos < 255); + //priority handling, if in front of BG: + bool drawsprite = !(((oam->oam[2] & 0x20) != 0) && ((pixel & 3) != 0)); + if (drawsprite && nes.Settings.DispSprites) + { + //bring in the palette bits and palettize + spixel |= (oam->oam[2] & 3) << 2; + //save it for use in the framebuffer + pixelcolor = PALRAM[0x10 + spixel]; + } + } //rasterpos in sprite range + } //oamcount loop + if (reg_2001.color_disable) + pixelcolor &= 0x30; + + xbuf[target] = PaletteAdjustPixel(pixelcolor); + + target++; + } //loop across 8 pixels + } //loop across 32 tiles + } + else + for (int xt = 0; xt < 32; xt++) + Read_bgdata(ref bgdata[xt + 2]); + + //look for sprites (was supposed to run concurrent with bg rendering) + oamcounts[scanslot] = 0; + oamcount = 0; + int spriteHeight = reg_2000.obj_size_16 ? 16 : 8; + + int scanslot_lshift = scanslot << 6; + + for (int i = 0; i < 64; i++) + { + oams[scanslot_lshift + i].present = 0; + int spr = i * 4; + if (yp >= OAM[spr] && yp < OAM[spr] + spriteHeight) + { + //if we already have maxsprites, then this new one causes an overflow, + //set the flag and bail out. + //should we set this flag anyway?? + if (oamcount >= 8 && reg_2001.PPUON) + { + Reg2002_objoverflow = true; + if(!nes.Settings.AllowMoreThanEightSprites) + break; + } + //just copy some bytes into the internal sprite buffer + TempOAM* oam = &oams[scanslot_lshift + oamcount]; + for (int j = 0; j < 4; j++) + oam->oam[j] = OAM[spr + j]; + oam->present = 1; + //note that we stuff the oam index into [6]. + //i need to turn this into a struct so we can have fewer magic numbers + oams[scanslot_lshift + oamcount].index = (byte)i; + oamcount++; + } + } + oamcounts[scanslot] = oamcount; + + ppuphase = PPUPHASE.OBJ; + + //fetch sprite patterns + int oam_todo = oamcount; + if (oam_todo < 8) + oam_todo = 8; + for (int s = 0; s < oam_todo; s++) + { + //if this is a real sprite sprite, then it is not above the 8 sprite limit. + //this is how we support the no 8 sprite limit feature. + //not that at some point we may need a virtual CALL_PPUREAD which just peeks and doesnt increment any counters + //this could be handy for the debugging tools also + bool realSprite = (s < 8); + bool junksprite = (s >= oamcount || !reg_2001.PPUON); + + TempOAM* oam = &oams[scanslot_lshift + s]; + int line = yp - oam->oam[0]; + if ((oam->oam[2] & 0x80) != 0) //vflip + line = spriteHeight - line - 1; + + int patternNumber = oam->oam[1]; + int patternAddress; + + //create deterministic dummy fetch pattern. + if (oam->present == 0) + { + //according to nintendulator: + //* On the first empty sprite slot, read the Y-coordinate of sprite #63 followed by $FF for the remaining 7 cycles + //* On all subsequent empty sprite slots, read $FF for all 8 reads + //well, we shall just read $FF and that is good enough for now to make mmc3 work + patternNumber = 0xFF; + line = 0; + } + + //8x16 sprite handling: + if (reg_2000.obj_size_16) + { + int bank = (patternNumber & 1) << 12; + patternNumber = patternNumber & ~1; + patternNumber |= (line >> 3) & 1; + patternAddress = (patternNumber << 4) | bank; + } + else + patternAddress = (patternNumber << 4) | (reg_2000.obj_pattern_hi << 12); + + //offset into the pattern for the current line. + //tricky: tall sprites have already had lines>8 taken care of by getting a new pattern number above. + //so we just need the line offset for the second pattern + patternAddress += line & 7; + + //garbage nametable fetches + scroll resets + int garbage_todo = 2; + ppubus_read(ppur.get_ntread(), true); + if (reg_2001.PPUON) + { + if (sl == 0 && ppur.status.cycle == 304) + { + runppu(1); + if (reg_2001.PPUON) ppur.install_latches(); + runppu(1); + garbage_todo = 0; + } + if ((sl != 0) && ppur.status.cycle == 256) + { + runppu(1); + //at 257: 3d world runner is ugly if we do this at 256 + if (reg_2001.PPUON) ppur.install_h_latches(); + runppu(1); + garbage_todo = 0; + } + } + if (realSprite) runppu(garbage_todo); + + ppubus_read(ppur.get_atread(), true); //at or nt? + if (realSprite) runppu(kFetchTime); + + // TODO - fake sprites should not come through ppubus_read but rather peek it + // (at least, they should not probe it with AddressPPU. maybe the difference between peek and read is not necessary) + + if (junksprite) + { + if (realSprite) + { + ppubus_read(patternAddress, true); + ppubus_read(patternAddress, true); + runppu(kFetchTime * 2); + } + } + else + { + int addr = patternAddress; + oam->patterns[0] = ppubus_read(addr, true); if (realSprite) runppu(kFetchTime); - // TODO - fake sprites should not come through ppubus_read but rather peek it - // (at least, they should not probe it with AddressPPU. maybe the difference between peek and read is not necessary) + addr += 8; + oam->patterns[1] = ppubus_read(addr, true); + if (realSprite) runppu(kFetchTime); - if (junksprite) + // hflip + if ((oam->oam[2] & 0x40) == 0) { - if (realSprite) - { - ppubus_read(patternAddress, true); - ppubus_read(patternAddress, true); - runppu(kFetchTime * 2); - } + oam->patterns[0] = BitReverse.Byte8[oam->patterns[0]]; + oam->patterns[1] = BitReverse.Byte8[oam->patterns[1]]; } - else - { - int addr = patternAddress; - oam->patterns[0] = ppubus_read(addr, true); - if (realSprite) runppu(kFetchTime); + } + } // sprite pattern fetch loop - addr += 8; - oam->patterns[1] = ppubus_read(addr, true); - if (realSprite) runppu(kFetchTime); + ppuphase = PPUPHASE.BG; - // hflip - if ((oam->oam[2] & 0x40) == 0) - { - oam->patterns[0] = BitReverse.Byte8[oam->patterns[0]]; - oam->patterns[1] = BitReverse.Byte8[oam->patterns[1]]; - } - } - } // sprite pattern fetch loop + // fetch BG: two tiles for next line + for (int xt = 0; xt < 2; xt++) + Read_bgdata(ref bgdata[xt]); - ppuphase = PPUPHASE.BG; + // this sequence is tuned to pass 10-even_odd_timing.nes + runppu(kFetchTime); + bool evenOddDestiny = reg_2001.show_bg; + runppu(kFetchTime); - // fetch BG: two tiles for next line - for (int xt = 0; xt < 2; xt++) - Read_bgdata(ref bgdata[xt]); + // After memory access 170, the PPU simply rests for 4 cycles (or the + // equivelant of half a memory access cycle) before repeating the whole + // pixel/scanline rendering process. If the scanline being rendered is the very + // first one on every second frame, then this delay simply doesn't exist. + if (sl == 0 && idleSynch && evenOddDestiny && chopdot) + { } + else + runppu(1); + } // scanline loop - // this sequence is tuned to pass 10-even_odd_timing.nes - runppu(kFetchTime); - bool evenOddDestiny = reg_2001.show_bg; - runppu(kFetchTime); + ppur.status.sl = 241; - // After memory access 170, the PPU simply rests for 4 cycles (or the - // equivelant of half a memory access cycle) before repeating the whole - // pixel/scanline rendering process. If the scanline being rendered is the very - // first one on every second frame, then this delay simply doesn't exist. - if (sl == 0 && idleSynch && evenOddDestiny && chopdot) - { } - else - runppu(1); - } // scanline loop + //idle for pre NMI lines + runppu(preNMIlines * kLineTime); - ppur.status.sl = 241; - - //idle for pre NMI lines - runppu(preNMIlines * kLineTime); - - } //FrameAdvance + } //FrameAdvance - void FrameAdvance_ppudead() - { - //not quite emulating all the NES power up behavior - //since it is known that the NES ignores writes to some - //register before around a full frame, but no games - //should write to those regs during that time, it needs - //to wait for vblank - ppur.status.sl = 241; - runppu(postNMIlines * kLineTime); - ppur.status.sl = 0; - runppu(241 * kLineTime); - runppu(preNMIlines * kLineTime); - --ppudead; - } + void FrameAdvance_ppudead() + { + //not quite emulating all the NES power up behavior + //since it is known that the NES ignores writes to some + //register before around a full frame, but no games + //should write to those regs during that time, it needs + //to wait for vblank + ppur.status.sl = 241; + runppu(postNMIlines * kLineTime); + ppur.status.sl = 0; + runppu(241 * kLineTime); + runppu(preNMIlines * kLineTime); + --ppudead; } } }