SPU2Ghz: Had to revert dma.cpp to rev244 for the most part. The dma cache system in DoDMAWrite() broke Arc the Lad dma audio. The auido starts to loop a bit in rev 264 and from there on it gets worse.

Sorry for not finding this earlier, I hope the cache can get fixed so we can include it again.

git-svn-id: http://pcsx2-playground.googlecode.com/svn/trunk@333 a6443dda-0b58-4228-96e9-037be469359c
This commit is contained in:
ramapcsx2 2008-11-15 18:31:51 +00:00 committed by Gregory Hainaut
parent d0c0b20505
commit 7e828a69ee
1 changed files with 33 additions and 81 deletions

View File

@ -92,9 +92,9 @@ void DMALogClose() {
__forceinline u16 DmaRead(u32 core)
{
Cores[core].TDA&=0xfffff;
const u16 ret = (u16)spu2M_Read(Cores[core].TDA);
Cores[core].TDA++;
Cores[core].TDA&=0xfffff;
return ret;
}
@ -189,6 +189,8 @@ void StartADMAWrite(int core,u16 *pMem, u32 sz)
void DoDMAWrite(int core,u16 *pMem,u32 size)
{
u32 i;
{
// Perform an alignment check.
// Not really important. Everything should work regardless,
@ -216,102 +218,52 @@ void DoDMAWrite(int core,u16 *pMem,u32 size)
if(MsgDMA()) ConLog(" * SPU2: DMA%c Transfer of %d bytes to %x (%02x %x %04x).\n",(core==0)?'4':'7',size<<1,Cores[core].TSA,Cores[core].DMABits,Cores[core].AutoDMACtrl,(~Cores[core].Regs.ATTR)&0x7fff);
// split the DMA copy into two chunks if needed.
// Optimized!
// Instead of checking the adpcm cache for every word, we check for every block.
// That way we can use the optimized fast write instruction to commit the memory.
Cores[core].TDA = Cores[core].TSA & 0xfffff;
u32 buff1end = Cores[core].TDA + size;
s32 buff2end = buff1end - 0xfffff;
if( buff2end > 0 )
buff1end = 0xfffff;
{
u32 nexta = Cores[core].TDA >> 3; // next address in 8 word blocks
const u32 leftsidebit = nexta & 31;
u32 rightsidebit; // assigned later
u32 nexta = Cores[core].TDA >> 3;
u32 flagbitmask = 1ul << ( nexta & 31 );
nexta >>= 5;
// Left side remainder:
// this produces a bitmask of the left side remainder of the cache flags:
pcm_cache_flags[nexta] &= (1ul << leftsidebit)-1;
// middle run!
// Traverse from start to finish in 8*32 word blocks,
// and clear all the the pcm cache flags for each block.
const u32 buff1size = (buff1end-Cores[core].TDA);
memcpy( GetMemPtr( Cores[core].TDA ), pMem, buff1size*2 );
//for(; Cores[core].TDA<buff1end; ++Cores[core].TDA, ++pMem)
// *GetMemPtr( Cores[core].TDA ) = *pMem;
buff1end >>= (3+5); // 8 words per block, 32 blocks per int.
memset( &pcm_cache_flags[nexta], 0, sizeof( u32 ) * (buff1end-nexta) );
if( buff2end > 0 )
// Traverse from start to finish in 8 word blocks,
// and clear the pcm cache flag for each block.
u32 stmp = ( size + 7 ) >> 3; // round up
for( i=0; i<stmp; i++ )
{
// second branch needs cleared:
// It starts at the beginning of memory and moves forward to buff2end
const u32 endpt2 = buff2end >> (3+5); // 8 words per block, 32 blocks per int.
memset( pcm_cache_flags, 0, sizeof( u32 ) * endpt2 );
memcpy( GetMemPtr( 0 ), &pMem[buff1size], buff2end*2 );
//for(Cores[core].TDA=0; Cores[core].TDA<(u32)buff2end; ++Cores[core].TDA, ++pMem)
// *GetMemPtr( Cores[core].TDA ) = *pMem;
rightsidebit = buff2end >> 3;
nexta = endpt2;
if(Cores[core].IRQEnable)
pcm_cache_flags[nexta] &= ~flagbitmask;
flagbitmask <<= 1;
if( flagbitmask == 0 )
{
// Flag interrupt?
// If IRQA occurs between start and dest, flag it.
// Since the buffer wraps, the conditional might seem odd, but it works.
if( ( Cores[core].IRQA >= Cores[core].TDA ) ||
( Cores[core].IRQA <= (u32)buff2end ) )
{
Spdif.Info=4<<core;
SetIrqCall();
}
}
Cores[core].TDA = buff2end;
}
else
{
rightsidebit = buff1end >> 3;
nexta = buff1end;
Cores[core].TDA = buff1end;
if(Cores[core].IRQEnable)
{
// Flag interrupt?
// If IRQA occurs between start and dest, flag it:
if( ( Cores[core].IRQA >= Cores[core].TSA ) &&
( Cores[core].IRQA <= Cores[core].TDA ) )
{
Spdif.Info=4<<core;
SetIrqCall();
}
nexta++;
flagbitmask = 1;
}
}
// clear the right-side remainder:
pcm_cache_flags[nexta] &= ~((1ul << (32-(rightsidebit&31)))-1);
}
//Cores[core].TDA=Cores[core].TSA+size;
for(i=0;i<size;i++)
{
*GetMemPtr( Cores[core].TDA ) = pMem[i];
//spu2M_Write( Cores[core].TDA, pMem[i] );
Cores[core].TDA++;
Cores[core].TDA&=0xfffff;
}
i=Cores[core].TSA;
Cores[core].TDA=Cores[core].TSA+size;
if((Cores[core].TDA>0xFFFFF)||((Cores[core].TDA>=Cores[core].IRQA)&&(i<=Cores[core].IRQA))) {
if(Cores[core].IRQEnable)
{
Spdif.Info=4<<core;
SetIrqCall();
}
}
Cores[core].TSA=Cores[core].TDA&0xFFFF0;
Cores[core].DMAICounter=size;
Cores[core].TADR=Cores[core].MADR+(size<<1);
}
void SPU2readDMA(int core, u16* pMem, u32 size)
@ -369,6 +321,7 @@ void SPU2writeDMA(int core, u16* pMem, u32 size)
}
else
{
DoDMAWrite(core,pMem,size);
}
Cores[core].Regs.STATX &= ~0x80;
@ -429,4 +382,3 @@ void CALLBACK SPU2interruptDMA7() {
Cores[1].Regs.STATX |= 0x80;
//Cores[1].Regs.ATTR &= ~0x30;
}