SPU2ghz: Fixed a memory corruption bug in the rolled back DMA write code. Hopefully this DMA write code will fix that bug without breaking Arc the Lad and similar games.

git-svn-id: http://pcsx2-playground.googlecode.com/svn/trunk@334 a6443dda-0b58-4228-96e9-037be469359c
This commit is contained in:
Jake.Stine 2008-11-17 17:11:11 +00:00 committed by Gregory Hainaut
parent 7e828a69ee
commit 96560444ea
3 changed files with 99 additions and 64 deletions

View File

@ -492,7 +492,7 @@ BOOL CALLBACK ConfigProc(HWND hWnd,UINT uMsg,WPARAM wParam,LPARAM lParam)
// Debugging / Logging Flags:
SET_CHECK(IDC_EFFECTS, EffectsEnabled);
SET_CHECK(IDC_DEBUG, DebugEnabled);
SET_CHECK(IDC_MSGKEY, _MsgToConsole);
SET_CHECK(IDC_MSGSHOW, _MsgToConsole);
SET_CHECK(IDC_MSGKEY, _MsgKeyOnOff);
SET_CHECK(IDC_MSGVOICE,_MsgVoiceOff);
SET_CHECK(IDC_MSGDMA, _MsgDMA);

View File

@ -92,9 +92,9 @@ void DMALogClose() {
__forceinline u16 DmaRead(u32 core)
{
Cores[core].TDA&=0xfffff;
const u16 ret = (u16)spu2M_Read(Cores[core].TDA);
Cores[core].TDA++;
Cores[core].TDA&=0xfffff;
return ret;
}
@ -189,27 +189,24 @@ void StartADMAWrite(int core,u16 *pMem, u32 sz)
void DoDMAWrite(int core,u16 *pMem,u32 size)
{
u32 i;
// Perform an alignment check.
// Not really important. Everything should work regardless,
// but it could be indicative of an emulation foopah elsewhere.
#ifndef PUBLIC
uptr pa = ((uptr)pMem)&7;
uptr pm = Cores[core].TSA&0x7;
if( pa )
{
// Perform an alignment check.
// Not really important. Everything should work regardless,
// but it could be indicative of an emulation foopah elsewhere.
uptr pa = ((uptr)pMem)&7;
uptr pm = Cores[core].TSA&0x7;
if( pa )
{
fprintf(stderr, "* SPU2 DMA Write > Missaligned SOURCE! Core: %d TSA: 0x%x TDA: 0x%x Size: 0x%x\n", core, Cores[core].TSA, Cores[core].TDA, size);
}
if( pm )
{
fprintf(stderr, "* SPU2 DMA Write > Missaligned TARGET! Core: %d TSA: 0x%x TDA: 0x%x Size: 0x%x\n", core, Cores[core].TSA, Cores[core].TDA, size );
}
fprintf(stderr, "* SPU2 DMA Write > Missaligned SOURCE! Core: %d TSA: 0x%x TDA: 0x%x Size: 0x%x\n", core, Cores[core].TSA, Cores[core].TDA, size);
}
if( pm )
{
fprintf(stderr, "* SPU2 DMA Write > Missaligned TARGET! Core: %d TSA: 0x%x TDA: 0x%x Size: 0x%x\n", core, Cores[core].TSA, Cores[core].TDA, size );
}
#endif
if(core==0)
DMA4LogWrite(pMem,size<<1);
@ -218,49 +215,91 @@ void DoDMAWrite(int core,u16 *pMem,u32 size)
if(MsgDMA()) ConLog(" * SPU2: DMA%c Transfer of %d bytes to %x (%02x %x %04x).\n",(core==0)?'4':'7',size<<1,Cores[core].TSA,Cores[core].DMABits,Cores[core].AutoDMACtrl,(~Cores[core].Regs.ATTR)&0x7fff);
// Optimized!
// Instead of checking the adpcm cache for every word, we check for every block.
// split the DMA copy into two chunks if needed.
// Instead of checking the adpcm cache for every word, we check for every ADPCM block.
// That way we can use the optimized fast write instruction to commit the memory.
Cores[core].TDA = Cores[core].TSA & 0xfffff;
Cores[core].TSA &= 0xfffff;
u32 buff1end = Cores[core].TSA + size;
u32 buff2end=0;
if( buff1end > 0xfffff )
{
u32 nexta = Cores[core].TDA >> 3;
u32 flagbitmask = 1ul << ( nexta & 31 );
nexta >>= 5;
buff2end = buff1end - 0xfffff;
buff1end = 0xfffff;
}
// Traverse from start to finish in 8 word blocks,
// and clear the pcm cache flag for each block.
u32 stmp = ( size + 7 ) >> 3; // round up
for( i=0; i<stmp; i++ )
// Ideally we would only mask bits actually written to, but it's a complex algorithm
// that is way more work than it's worth. Instead we just mask out entire bytes, which
// means that in rare cases some games may end up having to re-decode some blocks
// unnecessarily. To minimize the chance of that, I mask at the byte level instead
// of the dword level, so at worst there are only 7 extra blocks to the front or back
// of the DMA transfer that get cleared when they shouldn't be.
// First Branch needs cleared:
// It starts at TSA and goes to buff1end.
const u32 buff1size = (buff1end-Cores[core].TSA);
memcpy( GetMemPtr( Cores[core].TSA ), pMem, buff1size*2 );
// Note: When clearing cache flags, the *endpoint* needs to be rounded upward.
// just rounding the count upward could cause problems if both start and end
// points are mis-aligned.
const u32 roundUp = (1<<(3+3))-1;
const u32 flagTSA = Cores[core].TSA >> (3+3);
const u32 flagTDA = (buff1end + roundUp) >> (3 + 3); // endpoint, rounded up
u8* cache = (u8*)pcm_cache_flags;
memset( &cache[flagTSA], 0, flagTDA - flagTSA );
if( buff2end > 0 )
{
// second branch needs cleared:
// It starts at the beginning of memory and moves forward to buff2end
const u32 endpt2 = (buff2end + roundUp) >> (3+3);
memcpy( GetMemPtr( 0 ), &pMem[buff1size], buff2end*2 );
memset( pcm_cache_flags, 0, endpt2 );
Cores[core].TDA = buff2end;
if(Cores[core].IRQEnable)
{
pcm_cache_flags[nexta] &= ~flagbitmask;
flagbitmask <<= 1;
if( flagbitmask == 0 )
// Flag interrupt?
// If IRQA occurs between start and dest, flag it.
// Since the buffer wraps, the conditional might seem odd, but it works.
if( ( Cores[core].IRQA >= Cores[core].TSA ) ||
( Cores[core].IRQA <= Cores[core].TDA ) )
{
nexta++;
flagbitmask = 1;
Spdif.Info=4<<core;
SetIrqCall();
}
}
}
else
{
// Buffer doesn't wrap/overflow!
// Just set the TDA and check for an IRQ...
Cores[core].TDA = buff1end;
if(Cores[core].IRQEnable)
{
// Flag interrupt?
// If IRQA occurs between start and dest, flag it:
if( ( Cores[core].IRQA >= Cores[core].TSA ) &&
( Cores[core].IRQA <= Cores[core].TDA ) )
{
Spdif.Info=4<<core;
SetIrqCall();
}
}
}
for(i=0;i<size;i++)
{
*GetMemPtr( Cores[core].TDA ) = pMem[i];
//spu2M_Write( Cores[core].TDA, pMem[i] );
Cores[core].TDA++;
Cores[core].TDA&=0xfffff;
}
i=Cores[core].TSA;
Cores[core].TDA=Cores[core].TSA+size;
if((Cores[core].TDA>0xFFFFF)||((Cores[core].TDA>=Cores[core].IRQA)&&(i<=Cores[core].IRQA))) {
if(Cores[core].IRQEnable)
{
Spdif.Info=4<<core;
SetIrqCall();
}
}
Cores[core].TSA=Cores[core].TDA&0xFFFF0;
Cores[core].DMAICounter=size;
Cores[core].TADR=Cores[core].MADR+(size<<1);
@ -321,7 +360,6 @@ void SPU2writeDMA(int core, u16* pMem, u32 size)
}
else
{
DoDMAWrite(core,pMem,size);
}
Cores[core].Regs.STATX &= ~0x80;
@ -382,3 +420,4 @@ void CALLBACK SPU2interruptDMA7() {
Cores[1].Regs.STATX |= 0x80;
//Cores[1].Regs.ATTR &= ~0x30;
}

View File

@ -22,9 +22,6 @@
#include "regtable.h"
#include "svnrev.h"
// DLL Interface exportation:
void StartVoices(int core, u32 value);
void StopVoices(int core, u32 value);
@ -456,7 +453,8 @@ EXPORT_C_(s32) SPU2open(void *pDsp)
FileLog("[%10d] SPU2 Open\n",Cycles);
/*if(debugDialogOpen==0)
/*
if(debugDialogOpen==0)
{
hDebugDialog = CreateDialogParam(hInstance,MAKEINTRESOURCE(IDD_DEBUG),0,DebugProc,0);
ShowWindow(hDebugDialog,SW_SHOWNORMAL);
@ -656,7 +654,7 @@ void UpdateDebugDialog()
{
printf(" *** Warning! Core %d Voice %d: StartA should be %06x, and is %06x.\n",
c,v,vcd.lastSetStartA,vc.StartA);
vcd.lastSetStartA = vcd.lastSetStartA;
vcd.lastSetStartA = vc.StartA;
}
}
}
@ -715,12 +713,11 @@ void __fastcall TimeUpdate(u32 cClocks)
lClocks = cClocks-dClocks;
}
//UpdateDebugDialog();
//Update Mixing Progress
while(dClocks>=TickInterval)
{
//UpdateDebugDialog();
if(has_to_call_irq)
{
ConLog(" * SPU2: Irq Called (%04x).\n",Spdif.Info);
@ -889,7 +886,7 @@ void UpdateSpdifMode()
__forceinline void RegLog(int level, char *RName,u32 mem,u32 core,u16 value)
{
if(level>1)
if( level > 1 )
FileLog("[%10d] SPU2 write mem %08x (core %d, register %s) value %04x\n",Cycles,mem,core,RName,value);
}
@ -1601,12 +1598,11 @@ static __forceinline void SPU2_FastWrite( u32 rmem, u16 value )
break;
default:
SPU2writeLog(mem,value);
*(regtable[mem>>1])=value;
break;
}
SPU2writeLog(mem,value);
if ((mem>=0x07C0) && (mem<0x07CE))
{
UpdateSpdifMode();
@ -1932,7 +1928,7 @@ void VoiceStart(int core,int vc)
{
if(Cores[core].Voices[vc].StartA&7)
{
printf(" *** Missaligned StartA %05x!\n",Cores[core].Voices[vc].StartA);
fprintf( stderr, " *** Missaligned StartA %05x!\n",Cores[core].Voices[vc].StartA);
Cores[core].Voices[vc].StartA=(Cores[core].Voices[vc].StartA+0xFFFF8)+0x8;
}