mirror of https://github.com/PCSX2/pcsx2.git
SPU2: Improve DMA Write timing. Better sync DMA speeds with IOP
It takes 4 cycles per word, according to No$PSX documents Also fixed an issue with when ADMA refills the buffer, fixes The Simpsons (for real this time)
This commit is contained in:
parent
f07ca859e5
commit
a94561fba7
|
@ -43,7 +43,7 @@ static void __fastcall psxDmaGeneric(u32 madr, u32 bcr, u32 chcr, u32 spuCore)
|
|||
//Console.Status("cycles sent to SPU2 %x\n", psxRegs.cycle - psxCounters[6].sCycleT);
|
||||
|
||||
psxCounters[6].sCycleT = psxRegs.cycle;
|
||||
psxCounters[6].CycleT = size * 2;
|
||||
psxCounters[6].CycleT = size * 4;
|
||||
|
||||
psxNextCounter -= (psxRegs.cycle - psxNextsCounter);
|
||||
psxNextsCounter = psxRegs.cycle;
|
||||
|
|
|
@ -16,6 +16,7 @@
|
|||
#include "PrecompiledHeader.h"
|
||||
#include "Global.h"
|
||||
#include "Dma.h"
|
||||
#include "IopCommon.h"
|
||||
|
||||
#include "spu2.h" // temporary until I resolve cyclePtr/TimeUpdate dependencies.
|
||||
|
||||
|
@ -139,14 +140,14 @@ void V_Core::StartADMAWrite(u16* pMem, u32 sz)
|
|||
|
||||
if (MsgAutoDMA())
|
||||
ConLog("* SPU2: DMA%c AutoDMA Transfer of %d bytes to %x (%02x %x %04x).\n",
|
||||
GetDmaIndexChar(), size << 1, TSA, DMABits, AutoDMACtrl, (~Regs.ATTR) & 0x7fff);
|
||||
GetDmaIndexChar(), size << 1, TSA, DMABits, AutoDMACtrl, (~Regs.ATTR) & 0xffff);
|
||||
|
||||
InputDataProgress = 0;
|
||||
if ((AutoDMACtrl & (Index + 1)) == 0)
|
||||
{
|
||||
TSA = 0x2000 + (Index << 10);
|
||||
DMAICounter = size;
|
||||
LastClock = lClocks;
|
||||
DMAICounter = size * 4;
|
||||
LastClock = *cyclePtr;
|
||||
}
|
||||
else if (size >= 512)
|
||||
{
|
||||
|
@ -171,8 +172,8 @@ void V_Core::StartADMAWrite(u16* pMem, u32 sz)
|
|||
// Klonoa 2
|
||||
if (size == 512)
|
||||
{
|
||||
DMAICounter = size;
|
||||
LastClock = lClocks;
|
||||
DMAICounter = size * 4;
|
||||
LastClock = *cyclePtr;
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -180,9 +181,10 @@ void V_Core::StartADMAWrite(u16* pMem, u32 sz)
|
|||
}
|
||||
else
|
||||
{
|
||||
LastClock = lClocks;
|
||||
size = sz;
|
||||
InputDataLeft = 0;
|
||||
DMAICounter = 1;
|
||||
DMAICounter = size * 4;
|
||||
LastClock = *cyclePtr;
|
||||
}
|
||||
TADR = MADR + (size << 1);
|
||||
}
|
||||
|
@ -206,6 +208,37 @@ void V_Core::StartADMAWrite(u16* pMem, u32 sz)
|
|||
|
||||
void V_Core::PlainDMAWrite(u16* pMem, u32 size)
|
||||
{
|
||||
if (cyclePtr != nullptr)
|
||||
TimeUpdate(*cyclePtr);
|
||||
TSA &= 0xfffff;
|
||||
ReadSize = size;
|
||||
IsDMARead = false;
|
||||
LastClock = *cyclePtr;
|
||||
DMAICounter = std::min(ReadSize, (u32)0x100) * 4;
|
||||
Regs.STATX &= ~0x80;
|
||||
Regs.STATX |= 0x400;
|
||||
TADR = MADR + (size << 1);
|
||||
|
||||
if (((psxCounters[6].sCycleT + psxCounters[6].CycleT) - psxRegs.cycle) > DMAICounter)
|
||||
{
|
||||
psxCounters[6].sCycleT = psxRegs.cycle;
|
||||
psxCounters[6].CycleT = DMAICounter;
|
||||
|
||||
psxNextCounter -= (psxRegs.cycle - psxNextsCounter);
|
||||
psxNextsCounter = psxRegs.cycle;
|
||||
if (psxCounters[6].CycleT < psxNextCounter)
|
||||
psxNextCounter = psxCounters[6].CycleT;
|
||||
}
|
||||
|
||||
if (MsgDMA())
|
||||
ConLog("* SPU2: DMA%c Write Transfer of %d bytes to %x (%02x %x %04x). IRQE = %d IRQA = %x \n",
|
||||
GetDmaIndexChar(), size << 1, TSA, DMABits, AutoDMACtrl, Regs.ATTR & 0xffff,
|
||||
Cores[Index].IRQEnable, Cores[Index].IRQA);
|
||||
}
|
||||
|
||||
void V_Core::FinishDMAwrite()
|
||||
{
|
||||
|
||||
// Perform an alignment check.
|
||||
// Not really important. Everything should work regardless,
|
||||
// but it could be indicative of an emulation foopah elsewhere.
|
||||
|
@ -220,18 +253,18 @@ void V_Core::PlainDMAWrite(u16* pMem, u32 size)
|
|||
|
||||
if (TSA & 7)
|
||||
{
|
||||
ConLog("* SPU2 DMA Write > Misaligned target. Core: %d IOP: %p TSA: 0x%x Size: 0x%x\n", Index, (void*)pMem, TSA, size);
|
||||
ConLog("* SPU2 DMA Write > Misaligned target. Core: %d IOP: %p TSA: 0x%x Size: 0x%x\n", Index, (void*)DMAPtr, TSA, ReadSize);
|
||||
}
|
||||
}
|
||||
|
||||
if (Index == 0)
|
||||
DMA4LogWrite(pMem, size << 1);
|
||||
DMA4LogWrite(DMAPtr, ReadSize << 1);
|
||||
else
|
||||
DMA7LogWrite(pMem, size << 1);
|
||||
DMA7LogWrite(DMAPtr, ReadSize << 1);
|
||||
|
||||
TSA &= 0xfffff;
|
||||
|
||||
u32 buff1end = TSA + size;
|
||||
u32 buff1end = TSA + std::min(ReadSize, (u32)0x100);
|
||||
u32 buff2end = 0;
|
||||
if (buff1end > 0x100000)
|
||||
{
|
||||
|
@ -258,7 +291,7 @@ void V_Core::PlainDMAWrite(u16* pMem, u32 size)
|
|||
// It starts at TSA and goes to buff1end.
|
||||
|
||||
const u32 buff1size = (buff1end - TSA);
|
||||
memcpy(GetMemPtr(TSA), pMem, buff1size * 2);
|
||||
memcpy(GetMemPtr(TSA), DMAPtr, buff1size * 2);
|
||||
|
||||
u32 TDA;
|
||||
|
||||
|
@ -274,8 +307,7 @@ void V_Core::PlainDMAWrite(u16* pMem, u32 size)
|
|||
|
||||
// Emulation Grayarea: Should addresses wrap around to zero, or wrap around to
|
||||
// 0x2800? Hard to know for sure (almost no games depend on this)
|
||||
|
||||
memcpy(GetMemPtr(0), &pMem[buff1size], buff2end * 2);
|
||||
memcpy(GetMemPtr(0), &DMAPtr[buff1size], buff2end * 2);
|
||||
TDA = (buff2end) & 0xfffff;
|
||||
|
||||
// Flag interrupt? If IRQA occurs between start and dest, flag it.
|
||||
|
@ -333,15 +365,32 @@ void V_Core::PlainDMAWrite(u16* pMem, u32 size)
|
|||
}
|
||||
#endif
|
||||
}
|
||||
LastClock = lClocks;
|
||||
|
||||
TSA = TDA;
|
||||
DMAICounter = size;
|
||||
TADR = MADR + (size << 1);
|
||||
DMAPtr += std::min(ReadSize, (u32)0x100);
|
||||
ReadSize -= std::min(ReadSize, (u32)0x100);
|
||||
if (ReadSize == 0)
|
||||
DMAICounter = 0;
|
||||
else
|
||||
{
|
||||
DMAICounter = std::min(ReadSize, (u32)0x100) * 4;
|
||||
|
||||
if (((psxCounters[6].sCycleT + psxCounters[6].CycleT) - psxRegs.cycle) > DMAICounter)
|
||||
{
|
||||
psxCounters[6].sCycleT = psxRegs.cycle;
|
||||
psxCounters[6].CycleT = DMAICounter;
|
||||
|
||||
psxNextCounter -= (psxRegs.cycle - psxNextsCounter);
|
||||
psxNextsCounter = psxRegs.cycle;
|
||||
if (psxCounters[6].CycleT < psxNextCounter)
|
||||
psxNextCounter = psxCounters[6].CycleT;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void V_Core::FinishDMAread()
|
||||
{
|
||||
u32 buff1end = TSA + ReadSize;
|
||||
u32 buff1end = TSA + std::min(ReadSize, (u32)0x100);
|
||||
u32 buff2end = 0;
|
||||
if (buff1end > 0x100000)
|
||||
{
|
||||
|
@ -354,17 +403,15 @@ void V_Core::FinishDMAread()
|
|||
// Note on TSA's position after our copy finishes:
|
||||
// IRQA should be measured by the end of the writepos+0x20. But the TDA
|
||||
// should be written back at the precise endpoint of the xfer.
|
||||
|
||||
u32 TDA;
|
||||
|
||||
if (buff2end > 0)
|
||||
{
|
||||
// second branch needs cleared:
|
||||
// It starts at the beginning of memory and moves forward to buff2end
|
||||
|
||||
memcpy(&DMARPtr[buff1size], GetMemPtr(0), buff2end * 2);
|
||||
|
||||
TDA = (buff2end + 0x20) & 0xfffff;
|
||||
TDA = (buff2end) & 0xfffff;
|
||||
|
||||
// Flag interrupt? If IRQA occurs between start and dest, flag it.
|
||||
// Important: Test both core IRQ settings for either DMA!
|
||||
|
@ -383,7 +430,7 @@ void V_Core::FinishDMAread()
|
|||
// Buffer doesn't wrap/overflow!
|
||||
// Just set the TDA and check for an IRQ...
|
||||
|
||||
TDA = (buff1end + 0x20) & 0xfffff;
|
||||
TDA = (buff1end) & 0xfffff;
|
||||
|
||||
// Flag interrupt? If IRQA occurs between start and dest, flag it.
|
||||
// Important: Test both core IRQ settings for either DMA!
|
||||
|
@ -398,21 +445,61 @@ void V_Core::FinishDMAread()
|
|||
}
|
||||
|
||||
TSA = TDA;
|
||||
IsDMARead = false;
|
||||
DMARPtr += std::min(ReadSize, (u32)0x100);
|
||||
ReadSize -= std::min(ReadSize, (u32)0x100);
|
||||
if (ReadSize == 0)
|
||||
{
|
||||
IsDMARead = false;
|
||||
DMAICounter = 0;
|
||||
}
|
||||
else
|
||||
{
|
||||
DMAICounter = std::min(ReadSize, (u32)0x100) * 4;
|
||||
|
||||
if (((psxCounters[6].sCycleT + psxCounters[6].CycleT) - psxRegs.cycle) > DMAICounter)
|
||||
{
|
||||
psxCounters[6].sCycleT = psxRegs.cycle;
|
||||
psxCounters[6].CycleT = DMAICounter;
|
||||
|
||||
psxNextCounter -= (psxRegs.cycle - psxNextsCounter);
|
||||
psxNextsCounter = psxRegs.cycle;
|
||||
if (psxCounters[6].CycleT < psxNextCounter)
|
||||
psxNextCounter = psxCounters[6].CycleT;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void V_Core::DoDMAread(u16* pMem, u32 size)
|
||||
{
|
||||
TSA &= 0xfffff;
|
||||
if (cyclePtr != nullptr)
|
||||
TimeUpdate(*cyclePtr);
|
||||
|
||||
DMARPtr = pMem;
|
||||
TSA &= 0xfffff;
|
||||
ReadSize = size;
|
||||
IsDMARead = true;
|
||||
LastClock = lClocks;
|
||||
DMAICounter = size;
|
||||
LastClock = *cyclePtr;
|
||||
DMAICounter = std::min(ReadSize, (u32)0x100) * 4;
|
||||
Regs.STATX &= ~0x80;
|
||||
Regs.STATX |= 0x400;
|
||||
//Regs.ATTR |= 0x30;
|
||||
TADR = MADR + (size << 1);
|
||||
|
||||
if (((psxCounters[6].sCycleT + psxCounters[6].CycleT) - psxRegs.cycle) > DMAICounter)
|
||||
{
|
||||
psxCounters[6].sCycleT = psxRegs.cycle;
|
||||
psxCounters[6].CycleT = DMAICounter;
|
||||
|
||||
psxNextCounter -= (psxRegs.cycle - psxNextsCounter);
|
||||
psxNextsCounter = psxRegs.cycle;
|
||||
if (psxCounters[6].CycleT < psxNextCounter)
|
||||
psxNextCounter = psxCounters[6].CycleT;
|
||||
}
|
||||
|
||||
if (MsgDMA())
|
||||
ConLog("* SPU2: DMA%c Read Transfer of %d bytes from %x (%02x %x %04x). IRQE = %d IRQA = %x \n",
|
||||
GetDmaIndexChar(), size << 1, TSA, DMABits, AutoDMACtrl, Regs.ATTR & 0xffff,
|
||||
Cores[Index].IRQEnable, Cores[Index].IRQA);
|
||||
}
|
||||
|
||||
void V_Core::DoDMAwrite(u16* pMem, u32 size)
|
||||
|
@ -423,8 +510,8 @@ void V_Core::DoDMAwrite(u16* pMem, u32 size)
|
|||
{
|
||||
Regs.STATX &= ~0x80;
|
||||
//Regs.ATTR |= 0x30;
|
||||
DMAICounter = 1;
|
||||
LastClock = lClocks;
|
||||
DMAICounter = 1 * 4;
|
||||
LastClock = *cyclePtr;
|
||||
return;
|
||||
}
|
||||
|
||||
|
@ -453,14 +540,8 @@ void V_Core::DoDMAwrite(u16* pMem, u32 size)
|
|||
}
|
||||
else
|
||||
{
|
||||
if (MsgDMA())
|
||||
ConLog("* SPU2: DMA%c Transfer of %d bytes to %x (%02x %x %04x). IRQE = %d IRQA = %x \n",
|
||||
GetDmaIndexChar(), size << 1, TSA, DMABits, AutoDMACtrl, Regs.ATTR & 0x7fff,
|
||||
Cores[Index].IRQEnable, Cores[Index].IRQA);
|
||||
|
||||
PlainDMAWrite(pMem, size);
|
||||
}
|
||||
Regs.STATX &= ~0x80;
|
||||
Regs.STATX |= 0x400;
|
||||
//Regs.ATTR |= 0x30;
|
||||
}
|
||||
|
|
|
@ -142,7 +142,7 @@ StereoOut32 V_Core::ReadInput()
|
|||
|
||||
InputPosRead++;
|
||||
|
||||
if (AutoDMACtrl & (Index + 1) && (InputPosRead == 0x100 || InputPosRead == 0x200))
|
||||
if (AutoDMACtrl & (Index + 1) && (InputPosRead == 0x180 || InputPosRead == 0x80))
|
||||
{
|
||||
AdmaInProgress = 0;
|
||||
if (InputDataLeft >= 0x200)
|
||||
|
|
|
@ -533,6 +533,7 @@ struct V_Core
|
|||
void AutoDMAReadBuffer(int mode);
|
||||
void StartADMAWrite(u16* pMem, u32 sz);
|
||||
void PlainDMAWrite(u16* pMem, u32 sz);
|
||||
void FinishDMAwrite();
|
||||
};
|
||||
|
||||
extern V_Core Cores[2];
|
||||
|
|
|
@ -134,7 +134,6 @@ void SPU2interruptDMA4()
|
|||
FileLog("[%10d] SPU2 interruptDMA4\n", Cycles);
|
||||
Cores[0].Regs.STATX |= 0x80;
|
||||
Cores[0].Regs.STATX &= ~0x400;
|
||||
Cores[0].Regs.ATTR &= ~0x30;
|
||||
}
|
||||
|
||||
void SPU2interruptDMA7()
|
||||
|
@ -142,7 +141,6 @@ void SPU2interruptDMA7()
|
|||
FileLog("[%10d] SPU2 interruptDMA7\n", Cycles);
|
||||
Cores[1].Regs.STATX |= 0x80;
|
||||
Cores[1].Regs.STATX &= ~0x400;
|
||||
Cores[1].Regs.ATTR &= ~0x30;
|
||||
}
|
||||
|
||||
void SPU2readDMA7Mem(u16* pMem, u32 size)
|
||||
|
|
|
@ -402,16 +402,21 @@ __forceinline void TimeUpdate(u32 cClocks)
|
|||
TickInterval = 768; // Reset to default, in case the user hotswitched from async to something else.
|
||||
|
||||
//Update DMA4 interrupt delay counter
|
||||
if (Cores[0].DMAICounter > 0 && (cClocks - Cores[0].LastClock) > 0)
|
||||
if (Cores[0].DMAICounter > 0 && (*cyclePtr - Cores[0].LastClock) > 0)
|
||||
{
|
||||
const u32 amt = std::min(cClocks - Cores[0].LastClock, (u32)Cores[0].DMAICounter);
|
||||
const u32 amt = std::min(*cyclePtr - Cores[0].LastClock, (u32)Cores[0].DMAICounter);
|
||||
Cores[0].DMAICounter -= amt;
|
||||
Cores[0].LastClock = cClocks;
|
||||
Cores[0].MADR += amt * 2;
|
||||
Cores[0].LastClock = *cyclePtr;
|
||||
Cores[0].MADR += amt / 2;
|
||||
if (Cores[0].DMAICounter <= 0)
|
||||
{
|
||||
if (Cores[0].IsDMARead)
|
||||
Cores[0].FinishDMAread();
|
||||
if (((Cores[0].AutoDMACtrl & 1) != 1))
|
||||
{
|
||||
if (Cores[0].IsDMARead)
|
||||
Cores[0].FinishDMAread();
|
||||
else
|
||||
Cores[0].FinishDMAwrite();
|
||||
}
|
||||
|
||||
for (int i = 0; i < 2; i++)
|
||||
{
|
||||
|
@ -427,27 +432,33 @@ __forceinline void TimeUpdate(u32 cClocks)
|
|||
}
|
||||
}
|
||||
}
|
||||
|
||||
//ConLog("counter set and callback!\n");
|
||||
Cores[0].DMAICounter = 0;
|
||||
if (!SPU2_dummy_callback)
|
||||
spu2DMA4Irq();
|
||||
else
|
||||
SPU2interruptDMA4();
|
||||
if (!Cores[0].DMAICounter)
|
||||
{
|
||||
Cores[0].MADR = Cores[0].TADR;
|
||||
if (!SPU2_dummy_callback)
|
||||
spu2DMA4Irq();
|
||||
else
|
||||
SPU2interruptDMA4();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
//Update DMA7 interrupt delay counter
|
||||
if (Cores[1].DMAICounter > 0 && (cClocks - Cores[1].LastClock) > 0)
|
||||
if (Cores[1].DMAICounter > 0 && (*cyclePtr - Cores[1].LastClock) > 0)
|
||||
{
|
||||
const u32 amt = std::min(cClocks - Cores[1].LastClock, (u32)Cores[1].DMAICounter);
|
||||
const u32 amt = std::min(*cyclePtr - Cores[1].LastClock, (u32)Cores[1].DMAICounter);
|
||||
Cores[1].DMAICounter -= amt;
|
||||
Cores[1].LastClock = cClocks;
|
||||
Cores[1].MADR += amt * 2;
|
||||
Cores[1].LastClock = *cyclePtr;
|
||||
Cores[1].MADR += amt / 2;
|
||||
if (Cores[1].DMAICounter <= 0)
|
||||
{
|
||||
if (Cores[1].IsDMARead)
|
||||
Cores[1].FinishDMAread();
|
||||
if (((Cores[1].AutoDMACtrl & 2) != 2))
|
||||
{
|
||||
if (Cores[1].IsDMARead)
|
||||
Cores[1].FinishDMAread();
|
||||
else
|
||||
Cores[1].FinishDMAwrite();
|
||||
}
|
||||
|
||||
for (int i = 0; i < 2; i++)
|
||||
{
|
||||
|
@ -464,12 +475,14 @@ __forceinline void TimeUpdate(u32 cClocks)
|
|||
}
|
||||
}
|
||||
|
||||
Cores[1].DMAICounter = 0;
|
||||
//ConLog( "* SPU2 > DMA 7 Callback! %d\n", Cycles );
|
||||
if (!SPU2_dummy_callback)
|
||||
spu2DMA7Irq();
|
||||
else
|
||||
SPU2interruptDMA7();
|
||||
if (!Cores[1].DMAICounter)
|
||||
{
|
||||
Cores[1].MADR = Cores[1].TADR;
|
||||
if (!SPU2_dummy_callback)
|
||||
spu2DMA7Irq();
|
||||
else
|
||||
SPU2interruptDMA7();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -1232,9 +1245,7 @@ static void __fastcall RegWrite_Core(u16 value)
|
|||
thiscore.Mute = 0;
|
||||
//thiscore.CoreEnabled=(value>>15) & 0x01; //1 bit
|
||||
// no clue
|
||||
if (value >> 15)
|
||||
thiscore.Regs.STATX = 0;
|
||||
thiscore.Regs.ATTR = value & 0x7fff;
|
||||
thiscore.Regs.ATTR = value & 0xffff;
|
||||
|
||||
if (fxenable && !thiscore.FxEnable && (thiscore.EffectsStartA != thiscore.ExtEffectsStartA || thiscore.EffectsEndA != thiscore.ExtEffectsEndA))
|
||||
{
|
||||
|
@ -1244,11 +1255,10 @@ static void __fastcall RegWrite_Core(u16 value)
|
|||
thiscore.RevBuffers.NeedsUpdated = true;
|
||||
}
|
||||
|
||||
if (oldDmaMode != thiscore.DmaMode)
|
||||
{
|
||||
// FIXME... maybe: if this mode was cleared in the middle of a DMA, should we interrupt it?
|
||||
thiscore.Regs.STATX &= ~0x400; // ready to transfer
|
||||
}
|
||||
if (!thiscore.DmaMode)
|
||||
thiscore.Regs.STATX &= ~0x80;
|
||||
else if(!oldDmaMode)
|
||||
thiscore.Regs.STATX |= 0x80;
|
||||
|
||||
if (value & 0x000E)
|
||||
{
|
||||
|
|
Loading…
Reference in New Issue