Yes, more Vif work. writeX, writeY, writeZ, and writeW are all merged into one function.

git-svn-id: http://pcsx2.googlecode.com/svn/trunk@939 96395faa-99c1-11dd-bbfe-3dabce05a288
This commit is contained in:
arcum42 2009-04-09 23:57:58 +00:00
parent ccacbedc50
commit 98258eeffe
2 changed files with 145 additions and 279 deletions

View File

@ -44,7 +44,7 @@ enum UnpackOffset
OFFSET_X = 0, OFFSET_X = 0,
OFFSET_Y = 1, OFFSET_Y = 1,
OFFSET_Z = 2, OFFSET_Z = 2,
OFFSET_W =3 OFFSET_W = 3
}; };
#define spr0 ((DMACh*)&PS2MEM_HW[0xD000]) #define spr0 ((DMACh*)&PS2MEM_HW[0xD000])
@ -54,25 +54,29 @@ __forceinline static int _limit(int a, int max)
return (a > max) ? max : a; return (a > max) ? max : a;
} }
static __releaseinline void writeX(u32 &dest, u32 data) static __releaseinline void writeXYZW(u32 offnum, u32 &dest, u32 data)
{ {
int n; int n;
u32 vifRowReg = getVifRowRegs(offnum);
if (_vifRegs->code & 0x10000000) if (_vifRegs->code & 0x10000000)
{ {
switch (_vif->cl) switch (_vif->cl)
{ {
case 0: case 0:
n = (_vifRegs->mask) & 0x3; if (offnum == OFFSET_X)
n = (_vifRegs->mask) & 0x3;
else
n = (_vifRegs->mask >> (offnum * 2)) & 0x3;
break; break;
case 1: case 1:
n = (_vifRegs->mask >> 8) & 0x3; n = (_vifRegs->mask >> ( 8 + (offnum * 2))) & 0x3;
break; break;
case 2: case 2:
n = (_vifRegs->mask >> 16) & 0x3; n = (_vifRegs->mask >> (16 + (offnum * 2))) & 0x3;
break; break;
default: default:
n = (_vifRegs->mask >> 24) & 0x3; n = (_vifRegs->mask >> (24 + (offnum * 2))) & 0x3;
break; break;
} }
} }
@ -85,271 +89,48 @@ static __releaseinline void writeX(u32 &dest, u32 data)
{ {
dest = data; dest = data;
} }
else if (_vifRegs->mode == 1) else switch (_vifRegs->mode)
{ {
dest = data + _vifRegs->r0; case 1:
} dest = data + vifRowReg;
else if (_vifRegs->mode == 2) break;
{ case 2:
_vifRegs->r0 += data; vifRowReg += data;
dest = _vifRegs->r0; dest = vifRowReg;
} break;
else default:
{ dest = data;
dest = data; break;
} }
break; break;
case 1: case 1:
dest = _vifRegs->r0; dest = vifRowReg;
break; break;
case 2: case 2:
switch (_vif->cl) if (_vif->cl > 2)
{ dest = getVifColRegs(3);
case 0: else
dest = _vifRegs->c0; dest = getVifColRegs(_vif->cl);
break;
case 1:
dest = _vifRegs->c1;
break;
case 2:
dest = _vifRegs->c2;
break;
default:
dest = _vifRegs->c3;
break;
}
break; break;
} }
setVifRowRegs(offnum, vifRowReg);
// VIF_LOG("writeX %8.8x : Mode %d, r0 = %x, data %8.8x", *dest,_vifRegs->mode,_vifRegs->r0,data); // VIF_LOG("writeX %8.8x : Mode %d, r0 = %x, data %8.8x", *dest,_vifRegs->mode,_vifRegs->r0,data);
} }
static __releaseinline void writeY(u32 &dest, u32 data) template <class T>
static __releaseinline void _UNPACKpart(u32 offnum, u32 &x, T y, int size)
{ {
int n; if (size > 0)
if (_vifRegs->code & 0x10000000)
{ {
switch (_vif->cl) writeXYZW(offnum, x, y);
{ _vifRegs->offset++;
case 0:
n = (_vifRegs->mask >> 2) & 0x3;
break;
case 1:
n = (_vifRegs->mask >> 10) & 0x3;
break;
case 2:
n = (_vifRegs->mask >> 18) & 0x3;
break;
default:
n = (_vifRegs->mask >> 26) & 0x3;
break;
}
} }
else n = 0;
switch (n)
{
case 0:
if ((_vif->cmd & 0x6F) == 0x6f)
{
dest = data;
}
else if (_vifRegs->mode == 1)
{
dest = data + _vifRegs->r1;
}
else if (_vifRegs->mode == 2)
{
_vifRegs->r1 += data;
dest = _vifRegs->r1;
}
else
{
dest = data;
}
break;
case 1:
dest = _vifRegs->r1;
break;
case 2:
switch (_vif->cl)
{
case 0:
dest = _vifRegs->c0;
break;
case 1:
dest = _vifRegs->c1;
break;
case 2:
dest = _vifRegs->c2;
break;
default:
dest = _vifRegs->c3;
break;
}
break;
}
// VIF_LOG("writeY %8.8x : Mode %d, r1 = %x, data %8.8x", *dest,_vifRegs->mode,_vifRegs->r1,data);
}
static __releaseinline void writeZ(u32 &dest, u32 data)
{
int n;
if (_vifRegs->code & 0x10000000)
{
switch (_vif->cl)
{
case 0:
n = (_vifRegs->mask >> 4) & 0x3;
break;
case 1:
n = (_vifRegs->mask >> 12) & 0x3;
break;
case 2:
n = (_vifRegs->mask >> 20) & 0x3;
break;
default:
n = (_vifRegs->mask >> 28) & 0x3;
break;
}
}
else n = 0;
switch (n)
{
case 0:
if ((_vif->cmd & 0x6F) == 0x6f)
{
dest = data;
}
else if (_vifRegs->mode == 1)
{
dest = data + _vifRegs->r2;
}
else if (_vifRegs->mode == 2)
{
_vifRegs->r2 += data;
dest = _vifRegs->r2;
}
else
{
dest = data;
}
break;
case 1:
dest = _vifRegs->r2;
break;
case 2:
switch (_vif->cl)
{
case 0:
dest = _vifRegs->c0;
break;
case 1:
dest = _vifRegs->c1;
break;
case 2:
dest = _vifRegs->c2;
break;
default:
dest = _vifRegs->c3;
break;
}
break;
}
// VIF_LOG("writeZ %8.8x : Mode %d, r2 = %x, data %8.8x", *dest,_vifRegs->mode,_vifRegs->r2,data);
}
static __releaseinline void writeW(u32 &dest, u32 data)
{
int n;
if (_vifRegs->code & 0x10000000)
{
switch (_vif->cl)
{
case 0:
n = (_vifRegs->mask >> 6) & 0x3;
break;
case 1:
n = (_vifRegs->mask >> 14) & 0x3;
break;
case 2:
n = (_vifRegs->mask >> 22) & 0x3;
break;
default:
n = (_vifRegs->mask >> 30) & 0x3;
break;
}
}
else n = 0;
switch (n)
{
case 0:
if ((_vif->cmd & 0x6F) == 0x6f)
{
dest = data;
}
else if (_vifRegs->mode == 1)
{
dest = data + _vifRegs->r3;
}
else if (_vifRegs->mode == 2)
{
_vifRegs->r3 += data;
dest = _vifRegs->r3;
}
else
{
dest = data;
}
break;
case 1:
dest = _vifRegs->r3;
break;
case 2:
switch (_vif->cl)
{
case 0:
dest = _vifRegs->c0;
break;
case 1:
dest = _vifRegs->c1;
break;
case 2:
dest = _vifRegs->c2;
break;
default:
dest = _vifRegs->c3;
break;
}
break;
}
// VIF_LOG("writeW %8.8x : Mode %d, r3 = %x, data %8.8x", *dest,_vifRegs->mode,_vifRegs->r3,data);
} }
template <class T> template <class T>
static void _UNPACKpart(u32 offnum, u32 &x, T y) static __releaseinline void _UNPACKpart(u32 offnum, u32 &x, T y)
{ {
switch (offnum) writeXYZW(offnum, x, y);
{
case OFFSET_X:
writeX(x,y);
break;
case OFFSET_Y:
writeY(x,y);
break;
case OFFSET_Z:
writeZ(x,y);
break;
case OFFSET_W:
writeW(x,y);
break;
default:
break;
}
_vifRegs->offset++; _vifRegs->offset++;
} }
@ -357,24 +138,22 @@ template <class T>
void __fastcall UNPACK_S(u32 *dest, T *data, int size) void __fastcall UNPACK_S(u32 *dest, T *data, int size)
{ {
//S-# will always be a complete packet, no matter what. So we can skip the offset bits //S-# will always be a complete packet, no matter what. So we can skip the offset bits
writeX(*dest++, *data); writeXYZW(OFFSET_X, *dest++, *data);
writeY(*dest++, *data); writeXYZW(OFFSET_Y, *dest++, *data);
writeZ(*dest++, *data); writeXYZW(OFFSET_Z, *dest++, *data);
writeW(*dest , *data); writeXYZW(OFFSET_W, *dest , *data);
} }
template <class T> template <class T>
void __fastcall UNPACK_V2(u32 *dest, T *data, int size) void __fastcall UNPACK_V2(u32 *dest, T *data, int size)
{ {
if(_vifRegs->offset == OFFSET_X && size > 0) if(_vifRegs->offset == OFFSET_X)
{ {
_UNPACKpart(_vifRegs->offset, *dest++, *data++); _UNPACKpart(_vifRegs->offset, *dest++, *data++, size--);
size--;
} }
if(_vifRegs->offset == OFFSET_Y && size > 0) if(_vifRegs->offset == OFFSET_Y)
{ {
_UNPACKpart(_vifRegs->offset, *dest++, *data); _UNPACKpart(_vifRegs->offset, *dest++, *data, size--);
size--;
} }
if(_vifRegs->offset == OFFSET_Z) if(_vifRegs->offset == OFFSET_Z)
{ {
@ -383,24 +162,22 @@ void __fastcall UNPACK_V2(u32 *dest, T *data, int size)
if(_vifRegs->offset == OFFSET_W) if(_vifRegs->offset == OFFSET_W)
{ {
_UNPACKpart(_vifRegs->offset, *dest, *data); _UNPACKpart(_vifRegs->offset, *dest, *data);
_vifRegs->offset = 0; _vifRegs->offset = OFFSET_X;
} }
} }
template <class T> template <class T>
void __fastcall UNPACK_V3(u32 *dest, T *data, int size) void __fastcall UNPACK_V3(u32 *dest, T *data, int size)
{ {
if(_vifRegs->offset == OFFSET_X && size > 0) if(_vifRegs->offset == OFFSET_X)
{ {
_UNPACKpart(_vifRegs->offset, *dest++, *data++); _UNPACKpart(_vifRegs->offset, *dest++, *data++, size--);
size--;
} }
if(_vifRegs->offset == OFFSET_Y && size > 0) if(_vifRegs->offset == OFFSET_Y)
{ {
_UNPACKpart(_vifRegs->offset, *dest++, *data++); _UNPACKpart(_vifRegs->offset, *dest++, *data++, size--);
size--;
} }
if(_vifRegs->offset == OFFSET_Z && size > 0) if(_vifRegs->offset == OFFSET_Z)
{ {
_UNPACKpart(_vifRegs->offset, *dest++, *data++); _UNPACKpart(_vifRegs->offset, *dest++, *data++);
} }
@ -409,7 +186,7 @@ void __fastcall UNPACK_V3(u32 *dest, T *data, int size)
//V3-# does some bizzare thing with alignment, every 6qw of data the W becomes 0 (strange console!) //V3-# does some bizzare thing with alignment, every 6qw of data the W becomes 0 (strange console!)
//Ape Escape doesnt seem to like it tho (what the hell?) gonna have to investigate //Ape Escape doesnt seem to like it tho (what the hell?) gonna have to investigate
_UNPACKpart(_vifRegs->offset, *dest, *data); _UNPACKpart(_vifRegs->offset, *dest, *data);
_vifRegs->offset = 0; _vifRegs->offset = OFFSET_X;
} }
} }
@ -418,20 +195,19 @@ void __fastcall UNPACK_V4(u32 *dest, T *data , int size)
{ {
while (size > 0) while (size > 0)
{ {
_UNPACKpart(_vifRegs->offset, *dest++, *data++); _UNPACKpart(_vifRegs->offset, *dest++, *data++, size--);
size--;
} }
if (_vifRegs->offset > OFFSET_W) _vifRegs->offset = 0; if (_vifRegs->offset > OFFSET_W) _vifRegs->offset = OFFSET_X;
} }
void __fastcall UNPACK_V4_5(u32 *dest, u32 *data, int size) void __fastcall UNPACK_V4_5(u32 *dest, u32 *data, int size)
{ {
//As with S-#, this will always be a complete packet //As with S-#, this will always be a complete packet
writeX(*dest++, ((*data & 0x001f) << 3)); writeXYZW(OFFSET_X, *dest++, ((*data & 0x001f) << 3));
writeY(*dest++, ((*data & 0x03e0) >> 2)); writeXYZW(OFFSET_Y, *dest++, ((*data & 0x03e0) >> 2));
writeZ(*dest++, ((*data & 0x7c00) >> 7)); writeXYZW(OFFSET_Z, *dest++, ((*data & 0x7c00) >> 7));
writeW(*dest, ((*data & 0x8000) >> 8)); writeXYZW(OFFSET_W, *dest, ((*data & 0x8000) >> 8));
} }
void __fastcall UNPACK_S_32(u32 *dest, u32 *data, int size) void __fastcall UNPACK_S_32(u32 *dest, u32 *data, int size)

View File

@ -87,6 +87,96 @@ extern "C"
extern u32* _vifCol; extern u32* _vifCol;
} }
__forceinline void setVifRowRegs(u32 reg, u32 data)
{
switch (reg)
{
case 0:
_vifRegs->r0 = data;
break;
case 1:
_vifRegs->r1 = data;
break;
case 2:
_vifRegs->r2 = data;
break;
case 3:
_vifRegs->r3 = data;
break;
default:
assert(0);
break;
}
}
__forceinline u32 getVifRowRegs(u32 reg)
{
switch (reg)
{
case 0:
return _vifRegs->r0;
break;
case 1:
return _vifRegs->r1;
break;
case 2:
return _vifRegs->r2;
break;
case 3:
return _vifRegs->r3;
break;
default:
assert(0);
return 0;
break;
}
}
__forceinline void setVifColRegs(u32 reg, u32 data)
{
switch (reg)
{
case 0:
_vifRegs->c0 = data;
break;
case 1:
_vifRegs->c1 = data;
break;
case 2:
_vifRegs->c2 = data;
break;
case 3:
_vifRegs->c3 = data;
break;
default:
assert(0);
break;
}
}
__forceinline u32 getVifColRegs(u32 reg)
{
switch (reg)
{
case 0:
return _vifRegs->c0;
break;
case 1:
return _vifRegs->c1;
break;
case 2:
return _vifRegs->c2;
break;
case 3:
return _vifRegs->c3;
break;
default:
assert(0);
return 0;
break;
}
}
#define vif0Regs ((VIFregisters*)&PS2MEM_HW[0x3800]) #define vif0Regs ((VIFregisters*)&PS2MEM_HW[0x3800])
#define vif1Regs ((VIFregisters*)&PS2MEM_HW[0x3c00]) #define vif1Regs ((VIFregisters*)&PS2MEM_HW[0x3c00])