GS: Improvements to MTBA address calculation

This commit is contained in:
refractionpcsx2 2022-03-07 01:58:52 +00:00
parent fc6ec2cc02
commit 8f0dc34847
1 changed files with 40 additions and 49 deletions

View File

@ -902,7 +902,10 @@ void GSState::GIFRegHandlerTEX0(const GIFReg* RESTRICT r)
GL_REG("TEX0_%d = 0x%x_%x", i, r->U32[1], r->U32[0]); GL_REG("TEX0_%d = 0x%x_%x", i, r->U32[1], r->U32[0]);
GIFRegTEX0 TEX0 = r->TEX0; GIFRegTEX0 TEX0 = r->TEX0;
const bool MTBAreload = ((tex_flushed && (i == m_env.PRIM.CTXT)) || (r->TEX0.TBP0 != m_env.CTXT[i].TEX0.TBP0)) ? true : false; GIFRegMIPTBP1 temp_MIPTBP1;
bool MTBAReloaded = false;
// Max allowed MTBA size for 32bit swizzled textures (including 8H 4HL etc) is 512, 16bit and normal 8/4bit formats can be 1024
const u32 maxTex = (GSLocalMemory::m_psm[TEX0.PSM].bpp < 32) ? 10 : 9;
// Spec max is 10 // Spec max is 10
// //
@ -918,61 +921,53 @@ void GSState::GIFRegHandlerTEX0(const GIFReg* RESTRICT r)
TEX0.TW = std::clamp<u32>(TEX0.TW, 0, 10); TEX0.TW = std::clamp<u32>(TEX0.TW, 0, 10);
TEX0.TH = std::clamp<u32>(TEX0.TH, 0, 10); TEX0.TH = std::clamp<u32>(TEX0.TH, 0, 10);
ApplyTEX0<i>(TEX0); // MTBA loads are triggered by writes to TEX0 (but not TEX2!)
// Textures MUST be a minimum width of 32 pixels
// When the texture cache reloads any MIPS need to update too, so let's do that here. // Format must be a color, Z formats do not trigger MTBA (but are valid for Mipmapping)
// This is essentially triggered by the texture page change, so if TEXFLUSH is called and a draw doesn't proceed it, or TBP changes. if (m_env.CTXT[i].TEX1.MTBA && TEX0.TW >= 5 && TEX0.TW <= maxTex && (TEX0.PSM & 0x30) != 0x30)
// Textures must be of equal width/height and a minimum of 32x32
if (MTBAreload && m_env.CTXT[i].TEX1.MTBA && m_env.CTXT[i].TEX0.TW == m_env.CTXT[i].TEX0.TH && m_env.CTXT[i].TEX0.TW >= 5)
{ {
// NOTE 1: TEX1.MXL must not be automatically set to 3 here. // NOTE 1: TEX1.MXL must not be automatically set to 3 here and it has no effect on MTBA.
// NOTE 2: Mipmap levels are tightly packed, if (tbw << 6) > (1 << tw) then the left-over space to the right is used. (common for PSM_PSMT4) // NOTE 2: Mipmap levels are packed with a minimum distance between them of 1 block, even down at 4bit textures under 16x16.
// NOTE 3: Non-rectangular textures are treated as rectangular when calculating the occupied space (height is extended, not sure about width) // NOTE 3: Everything is derrived from the width of the texture, TBW and TH are completely ignored (useful for handling non-rectangular ones)
// NOTE 4: Cartoon Network Racing's menu is VERY sensitive to this as it uses 4bit sized textures for the sky.
u32 bp = TEX0.TBP0;
u32 bw = std::max(1u, (1u << TEX0.TW) >> 6);
u32 bp = m_env.CTXT[i].TEX0.TBP0; // Address is calculated as a 4bit address space, then converted (/8) to 32bit address space
u32 bw = m_env.CTXT[i]. TEX0.TBW; // ((w * w * bpp) / 8) / 64. No the 'w' is not a typo ;)
u32 w = 1u << m_env.CTXT[i].TEX0.TW; const u32 bpp = GSLocalMemory::m_psm[TEX0.PSM].bpp >> 2;
u32 h = 1u << m_env.CTXT[i].TEX0.TH; u32 tex_size = ((1u << TEX0.TW) * (1u << TEX0.TW) * bpp) >> 9;
u32 minwidth = m_env.CTXT[i].TEX1.MMIN >= 4 ? 8 : 1;
const u32 bpp = GSLocalMemory::m_psm[m_env.CTXT[i].TEX0.PSM].bpp; bp += tex_size;
bw = std::max<u32>(bw >> 1, 1);
tex_size = std::max<u32>(tex_size >> 2, 1);
bp += (int)((w * h * ((float)bpp / 8))) >> 8; temp_MIPTBP1.TBP1 = bp;
temp_MIPTBP1.TBW1 = bw;
if (w > minwidth) bp += tex_size;
{ bw = std::max<u32>(bw >> 1, 1);
bw = std::max<u32>(bw >> 1, 1); tex_size = std::max<u32>(tex_size >> 2, 1);
w = std::max<u32>(w >> 1, 1);
h = std::max<u32>(h >> 1, 1);
}
m_env.CTXT[i].MIPTBP1.TBP1 = bp; temp_MIPTBP1.TBP2 = bp;
m_env.CTXT[i].MIPTBP1.TBW1 = bw; temp_MIPTBP1.TBW2 = bw;
bp += (int)((w * h * ((float)bpp / 8))) >> 8; bp += tex_size;
bw = std::max<u32>(bw >> 1, 1);
if (w > minwidth) temp_MIPTBP1.TBP3 = bp;
{ temp_MIPTBP1.TBW3 = bw;
bw = std::max<u32>(bw >> 1, 1);
w = std::max<u32>(w >> 1, 1);
h = std::max<u32>(h >> 1, 1);
}
m_env.CTXT[i].MIPTBP1.TBP2 = bp; if (temp_MIPTBP1 != m_env.CTXT[i].MIPTBP1)
m_env.CTXT[i].MIPTBP1.TBW2 = bw; Flush();
bp += (int)((w * h * ((float)bpp / 8))) >> 8; MTBAReloaded = true;
if (w > minwidth)
{
bw = std::max<u32>(bw >> 1, 1);
}
m_env.CTXT[i].MIPTBP1.TBP3 = bp;
m_env.CTXT[i].MIPTBP1.TBW3 = bw;
} }
tex_flushed = false; ApplyTEX0<i>(TEX0);
if (MTBAReloaded)
m_env.CTXT[i].MIPTBP1 = temp_MIPTBP1;
} }
template <int i> template <int i>
@ -1140,7 +1135,6 @@ void GSState::GIFRegHandlerTEXFLUSH(const GIFReg* RESTRICT r)
{ {
GL_REG("TEXFLUSH = 0x%x_%x PRIM TME %x", r->U32[1], r->U32[0], PRIM->TME); GL_REG("TEXFLUSH = 0x%x_%x PRIM TME %x", r->U32[1], r->U32[0], PRIM->TME);
tex_flushed = true;
// Some games do a single sprite draw to itself, then flush the texture cache, then use that texture again. // Some games do a single sprite draw to itself, then flush the texture cache, then use that texture again.
// This won't get picked up by the new autoflush logic (which checks for page crossings for the PS2 Texture Cache flush) // This won't get picked up by the new autoflush logic (which checks for page crossings for the PS2 Texture Cache flush)
// so we need to do it here. // so we need to do it here.
@ -2846,9 +2840,6 @@ __forceinline void GSState::VertexKick(u32 skip)
default: default:
__assume(0); __assume(0);
} }
if (PRIM->TME)
tex_flushed = false;
} }
/// Checks if region repeat is used (applying it does something to at least one of the values in min...max) /// Checks if region repeat is used (applying it does something to at least one of the values in min...max)
@ -3279,7 +3270,7 @@ bool GSState::IsOpaque()
bool GSState::IsMipMapDraw() bool GSState::IsMipMapDraw()
{ {
return m_context->TEX1.MXL > 0 && m_context->TEX1.MMIN >= 2 && m_context->TEX1.MMIN <= 5 && m_vt.m_lod.y > 0 && (!m_context->TEX1.MTBA || m_context->TEX0.TH == m_context->TEX0.TW); return m_context->TEX1.MXL > 0 && m_context->TEX1.MMIN >= 2 && m_context->TEX1.MMIN <= 5 && m_vt.m_lod.y > 0;
} }
bool GSState::IsMipMapActive() bool GSState::IsMipMapActive()